{"id":"https://openalex.org/W4220947755","doi":"https://doi.org/10.1109/kst53302.2022.9729062","title":"Efficient Image Embedding for Fine-Grained Visual Classification","display_name":"Efficient Image Embedding for Fine-Grained Visual Classification","publication_year":2022,"publication_date":"2022-01-26","ids":{"openalex":"https://openalex.org/W4220947755","doi":"https://doi.org/10.1109/kst53302.2022.9729062"},"language":"en","primary_location":{"id":"doi:10.1109/kst53302.2022.9729062","is_oa":false,"landing_page_url":"https://doi.org/10.1109/kst53302.2022.9729062","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 14th International Conference on Knowledge and Smart Technology (KST)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5071025210","display_name":"Soranan Payatsuporn","orcid":null},"institutions":[{"id":"https://openalex.org/I158708052","display_name":"Chulalongkorn University","ror":"https://ror.org/028wp3y58","country_code":"TH","type":"education","lineage":["https://openalex.org/I158708052"]}],"countries":["TH"],"is_corresponding":true,"raw_author_name":"Soranan Payatsuporn","raw_affiliation_strings":["Chulalongkorn University,Computer Engineering,Bangkok,Thailand","Computer Engineering, Chulalongkorn University, Bangkok, Thailand"],"affiliations":[{"raw_affiliation_string":"Chulalongkorn University,Computer Engineering,Bangkok,Thailand","institution_ids":["https://openalex.org/I158708052"]},{"raw_affiliation_string":"Computer Engineering, Chulalongkorn University, Bangkok, Thailand","institution_ids":["https://openalex.org/I158708052"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5065724368","display_name":"Boonserm Kijsirikul","orcid":"https://orcid.org/0000-0002-9046-7151"},"institutions":[{"id":"https://openalex.org/I158708052","display_name":"Chulalongkorn University","ror":"https://ror.org/028wp3y58","country_code":"TH","type":"education","lineage":["https://openalex.org/I158708052"]}],"countries":["TH"],"is_corresponding":false,"raw_author_name":"Boonserm Kijsirikul","raw_affiliation_strings":["Chulalongkorn University,Computer Engineering,Bangkok,Thailand","Computer Engineering, Chulalongkorn University, Bangkok, Thailand"],"affiliations":[{"raw_affiliation_string":"Chulalongkorn University,Computer Engineering,Bangkok,Thailand","institution_ids":["https://openalex.org/I158708052"]},{"raw_affiliation_string":"Computer Engineering, Chulalongkorn University, Bangkok, Thailand","institution_ids":["https://openalex.org/I158708052"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5071025210"],"corresponding_institution_ids":["https://openalex.org/I158708052"],"apc_list":null,"apc_paid":null,"fwci":0.2013,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.44572206,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"40","last_page":"45"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.7786945104598999},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.750604510307312},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.744257390499115},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7230087518692017},{"id":"https://openalex.org/keywords/margin","display_name":"Margin (machine learning)","score":0.6581770181655884},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5905430912971497},{"id":"https://openalex.org/keywords/contextual-image-classification","display_name":"Contextual image classification","score":0.5814845561981201},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.5607173442840576},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5474283695220947},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5406320691108704},{"id":"https://openalex.org/keywords/minimum-bounding-box","display_name":"Minimum bounding box","score":0.5289759039878845},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5284290909767151},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.5176013708114624},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.5042494535446167},{"id":"https://openalex.org/keywords/bounding-overwatch","display_name":"Bounding overwatch","score":0.49061480164527893},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.4677097201347351},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.44109126925468445},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.33685174584388733}],"concepts":[{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.7786945104598999},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.750604510307312},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.744257390499115},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7230087518692017},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.6581770181655884},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5905430912971497},{"id":"https://openalex.org/C75294576","wikidata":"https://www.wikidata.org/wiki/Q5165192","display_name":"Contextual image classification","level":3,"score":0.5814845561981201},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.5607173442840576},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5474283695220947},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5406320691108704},{"id":"https://openalex.org/C147037132","wikidata":"https://www.wikidata.org/wiki/Q6865426","display_name":"Minimum bounding box","level":3,"score":0.5289759039878845},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5284290909767151},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.5176013708114624},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.5042494535446167},{"id":"https://openalex.org/C63584917","wikidata":"https://www.wikidata.org/wiki/Q333286","display_name":"Bounding overwatch","level":2,"score":0.49061480164527893},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.4677097201347351},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.44109126925468445},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.33685174584388733},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/kst53302.2022.9729062","is_oa":false,"landing_page_url":"https://doi.org/10.1109/kst53302.2022.9729062","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 14th International Conference on Knowledge and Smart Technology (KST)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","score":0.75,"display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W56385144","https://openalex.org/W603908379","https://openalex.org/W1686810756","https://openalex.org/W1797268635","https://openalex.org/W1846799578","https://openalex.org/W2104657103","https://openalex.org/W2108598243","https://openalex.org/W2138011018","https://openalex.org/W2194775991","https://openalex.org/W2202499615","https://openalex.org/W2520774990","https://openalex.org/W2737725206","https://openalex.org/W2750672897","https://openalex.org/W2763070548","https://openalex.org/W2773003563","https://openalex.org/W2798365843","https://openalex.org/W2807931652","https://openalex.org/W2883888092","https://openalex.org/W2891951760","https://openalex.org/W2953915809","https://openalex.org/W2955425717","https://openalex.org/W2962858109","https://openalex.org/W2962898354","https://openalex.org/W2963066927","https://openalex.org/W2963090248","https://openalex.org/W2963166243","https://openalex.org/W2963351448","https://openalex.org/W2963407932","https://openalex.org/W2963446712","https://openalex.org/W2963466847","https://openalex.org/W2969985801","https://openalex.org/W2990495699","https://openalex.org/W2997426000","https://openalex.org/W3008809756","https://openalex.org/W3009337595","https://openalex.org/W3081907075","https://openalex.org/W6725739302","https://openalex.org/W6748257384","https://openalex.org/W6762718338"],"related_works":["https://openalex.org/W4237171675","https://openalex.org/W3036286480","https://openalex.org/W3192357901","https://openalex.org/W2387360586","https://openalex.org/W4287027631","https://openalex.org/W2952736415","https://openalex.org/W3209723314","https://openalex.org/W3205398323","https://openalex.org/W2883297582","https://openalex.org/W2945311944"],"abstract_inverted_index":{"Fine-grained":[0],"visual":[1],"classification":[2],"(FGVC)":[3],"is":[4,13,70,82,106],"a":[5,14,44],"task":[6,16],"belonging":[7],"to":[8,18,30,35,107,132],"multiple":[9],"sub-categories":[10],"classification.":[11,84],"It":[12,123],"challenging":[15],"due":[17],"high":[19],"intraclass":[20],"variation":[21],"and":[22,51,54,79,98,115,141],"inter-class":[23,99],"similarity.":[24],"Most":[25],"exiting":[26],"methods":[27],"pay":[28],"attention":[29],"capture":[31],"discriminative":[32],"semantic":[33],"parts":[34],"address":[36],"those":[37],"problems.":[38],"In":[39],"this":[40],"paper,":[41],"we":[42,55],"introduce":[43],"two-level":[45,86],"network":[46],"which":[47,67,93,136],"consists":[48],"of":[49,76,101],"raw-level":[50,69],"object-level":[52],"networks,":[53],"name":[56],"it":[57],"\u201cEfficient":[58],"Image":[59],"Embedding\u201d.":[60],"Its":[61],"training":[62],"procedure":[63],"has":[64,124],"two":[65,129],"stages":[66],"the":[68,74,80,133],"for":[71,83,139,143],"localization":[72],"by":[73],"aggregation":[75],"feature":[77],"maps,":[78],"last":[81],"The":[85],"use":[87],"Adaptive":[88],"Angular":[89],"Margin":[90],"loss":[91],"(AAM-loss),":[92],"improve":[94],"an":[95,120],"intra-class":[96],"compactness":[97],"variety":[100],"image":[102],"embedding.":[103],"Our":[104],"approach":[105],"identify":[108],"object":[109],"regions":[110],"without":[111],"any":[112],"hand-crafted":[113],"bounding-box,":[114],"can":[116],"be":[117],"trained":[118],"in":[119],"end-to-end":[121],"manner.":[122],"achieved":[125],"better":[126],"accuracy":[127],"on":[128],"datasets":[130],"compared":[131],"existing":[134],"work,":[135],"are":[137],"89.0%":[138],"CUB200-2011":[140],"93.3%":[142],"FGVC-Aircraft.":[144]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
