{"id":"https://openalex.org/W2912684514","doi":"https://doi.org/10.1145/3231739","title":"Visual Content Recognition by Exploiting Semantic Feature Map with Attention and Multi-task Learning","display_name":"Visual Content Recognition by Exploiting Semantic Feature Map with Attention and Multi-task Learning","publication_year":2019,"publication_date":"2019-01-31","ids":{"openalex":"https://openalex.org/W2912684514","doi":"https://doi.org/10.1145/3231739","mag":"2912684514"},"language":"en","primary_location":{"id":"doi:10.1145/3231739","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3231739","pdf_url":null,"source":{"id":"https://openalex.org/S19610489","display_name":"ACM Transactions on Multimedia Computing Communications and Applications","issn_l":"1551-6857","issn":["1551-6857","1551-6865"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Multimedia Computing, Communications, and Applications","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100626035","display_name":"Rui-Wei Zhao","orcid":"https://orcid.org/0000-0002-8498-5761"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Rui-Wei Zhao","raw_affiliation_strings":["Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100665639","display_name":"Qi Zhang","orcid":"https://orcid.org/0000-0003-0709-3273"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qi Zhang","raw_affiliation_strings":["Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026167547","display_name":"Zuxuan Wu","orcid":"https://orcid.org/0000-0002-8689-5807"},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zuxuan Wu","raw_affiliation_strings":["University of Maryland, Maryland, USA"],"affiliations":[{"raw_affiliation_string":"University of Maryland, Maryland, USA","institution_ids":["https://openalex.org/I66946132"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100368377","display_name":"Jianguo Li","orcid":"https://orcid.org/0000-0002-8645-0680"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jianguo Li","raw_affiliation_strings":["Intel Labs China, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Intel Labs China, Beijing, China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5047962986","display_name":"Yu\u2013Gang Jiang","orcid":"https://orcid.org/0000-0002-1907-8567"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yu-Gang Jiang","raw_affiliation_strings":["Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5100626035"],"corresponding_institution_ids":["https://openalex.org/I24943067"],"apc_list":null,"apc_paid":null,"fwci":1.2147,"has_fulltext":false,"cited_by_count":12,"citation_normalized_percentile":{"value":0.82847741,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":"15","issue":"1s","first_page":"1","last_page":"22"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pascal","display_name":"Pascal (unit)","score":0.7959283590316772},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7904621362686157},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7684577107429504},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.708587646484375},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.6273288726806641},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.5903634428977966},{"id":"https://openalex.org/keywords/cognitive-neuroscience-of-visual-object-recognition","display_name":"Cognitive neuroscience of visual object recognition","score":0.519023060798645},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.47575992345809937},{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature learning","score":0.46753212809562683},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.4468402564525604},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.4467763900756836},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4298180043697357},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.42229732871055603},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.4143086373806},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3414984345436096}],"concepts":[{"id":"https://openalex.org/C75608658","wikidata":"https://www.wikidata.org/wiki/Q44395","display_name":"Pascal (unit)","level":2,"score":0.7959283590316772},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7904621362686157},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7684577107429504},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.708587646484375},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.6273288726806641},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.5903634428977966},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.519023060798645},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.47575992345809937},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.46753212809562683},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.4468402564525604},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.4467763900756836},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4298180043697357},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.42229732871055603},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.4143086373806},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3414984345436096},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3231739","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3231739","pdf_url":null,"source":{"id":"https://openalex.org/S19610489","display_name":"ACM Transactions on Multimedia Computing Communications and Applications","issn_l":"1551-6857","issn":["1551-6857","1551-6865"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Multimedia Computing, Communications, and Applications","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.7300000190734863,"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10"}],"awards":[{"id":"https://openalex.org/G3368050527","display_name":null,"funder_award_id":"16QA1400500","funder_id":"https://openalex.org/F4320321885","funder_display_name":"Science and Technology Commission of Shanghai Municipality"},{"id":"https://openalex.org/G8303758602","display_name":null,"funder_award_id":"61572134, 61622204","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320321885","display_name":"Science and Technology Commission of Shanghai Municipality","ror":"https://ror.org/03kt66j61"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":65,"referenced_works":["https://openalex.org/W7746136","https://openalex.org/W603908379","https://openalex.org/W1514535095","https://openalex.org/W1524680991","https://openalex.org/W1536680647","https://openalex.org/W1538021842","https://openalex.org/W1567302070","https://openalex.org/W1599220855","https://openalex.org/W1720875375","https://openalex.org/W1777628566","https://openalex.org/W1861492603","https://openalex.org/W1903029394","https://openalex.org/W1928906481","https://openalex.org/W1965555842","https://openalex.org/W1986482242","https://openalex.org/W2010181071","https://openalex.org/W2012592962","https://openalex.org/W2024051019","https://openalex.org/W2035192458","https://openalex.org/W2037227137","https://openalex.org/W2063438554","https://openalex.org/W2064675550","https://openalex.org/W2066650804","https://openalex.org/W2088049833","https://openalex.org/W2093367888","https://openalex.org/W2097117768","https://openalex.org/W2102605133","https://openalex.org/W2109255472","https://openalex.org/W2110628941","https://openalex.org/W2117539524","https://openalex.org/W2120176405","https://openalex.org/W2142521298","https://openalex.org/W2156303437","https://openalex.org/W2161381512","https://openalex.org/W2161565164","https://openalex.org/W2164507085","https://openalex.org/W2172806452","https://openalex.org/W2186222003","https://openalex.org/W2191616647","https://openalex.org/W2194775991","https://openalex.org/W2205968144","https://openalex.org/W2237880439","https://openalex.org/W2257307118","https://openalex.org/W2269165052","https://openalex.org/W2288122362","https://openalex.org/W2460852148","https://openalex.org/W2473032611","https://openalex.org/W2499974702","https://openalex.org/W2521365688","https://openalex.org/W2526479943","https://openalex.org/W2527457059","https://openalex.org/W2612703655","https://openalex.org/W2618530766","https://openalex.org/W2765823242","https://openalex.org/W2773003563","https://openalex.org/W2919115771","https://openalex.org/W2953106684","https://openalex.org/W2962835968","https://openalex.org/W2963037989","https://openalex.org/W2963173190","https://openalex.org/W2963745697","https://openalex.org/W2964227963","https://openalex.org/W3106250896","https://openalex.org/W3124951096","https://openalex.org/W4236965008"],"related_works":["https://openalex.org/W2406522397","https://openalex.org/W2732542196","https://openalex.org/W2914959431","https://openalex.org/W2518599539","https://openalex.org/W2059299633","https://openalex.org/W2557461402","https://openalex.org/W1482242411","https://openalex.org/W2784396512","https://openalex.org/W2888527098","https://openalex.org/W2463113024"],"abstract_inverted_index":{"Recent":[0],"studies":[1,169],"have":[2],"shown":[3],"that":[4,195],"spatial":[5,61,108],"relationships":[6],"among":[7,110],"objects":[8,83,111],"are":[9,92,153],"very":[10],"important":[11,82],"for":[12,47,81,134,185,212],"visual":[13],"recognition,":[14],"since":[15],"they":[16],"can":[17,203],"provide":[18],"rich":[19],"clues":[20],"on":[21,129,178],"object":[22,62,79,90,146],"contexts":[23,63],"within":[24,64],"the":[25,37,60,65,72,77,96,107,127,132,160,172,175,190,196,200],"images.":[26,66],"In":[27,67,188],"this":[28],"article,":[29],"we":[30,69,114],"introduce":[31],"a":[32,101],"novel":[33,138],"method":[34],"to":[35,57,76,156,170,207],"learn":[36,159],"Semantic":[38],"Feature":[39],"Map":[40],"(SFM)":[41],"with":[42,106,142],"attention-based":[43],"deep":[44],"neural":[45],"networks":[46],"image":[48,143,186,201],"and":[49,85,103,149,167,182,209],"video":[50,213],"classification":[51,144],"in":[52],"an":[53],"end-to-end":[54],"manner,":[55],"aiming":[56],"explicitly":[58,70],"model":[59,161],"particular,":[68],"apply":[71],"designed":[73],"gate":[74],"units":[75],"extracted":[78],"features":[80,91],"selection":[84],"noise":[86],"removal.":[87],"These":[88],"selected":[89],"then":[93],"organized":[94],"into":[95],"proposed":[97,176],"SFM,":[98],"which":[99],"is":[100],"compact":[102],"discriminative":[104],"representation":[105],"information":[109],"preserved.":[112],"Finally,":[113],"employ":[115],"either":[116],"Fully":[117],"Convolutional":[118],"Networks":[119],"(FCN)":[120],"or":[121],"Long-Short":[122],"Term":[123],"Memory":[124],"(LSTM)":[125],"as":[126],"classifiers":[128],"top":[130],"of":[131,174],"SFM":[133],"content":[135],"recognition.":[136],"A":[137],"multi-task":[139],"learning":[140],"framework":[141],"loss,":[145,148],"localization":[147],"grid":[150],"labeling":[151],"loss":[152],"also":[154,193],"introduced":[155],"help":[157],"better":[158],"parameters.":[162],"We":[163],"conduct":[164],"extensive":[165],"evaluations":[166],"comparative":[168],"verify":[171],"effectiveness":[173],"approach":[177],"Pascal":[179],"VOC":[180],"2007/2012":[181],"MS-COCO":[183],"benchmarks":[184,211],"classification.":[187,214],"addition,":[189],"experimental":[191],"results":[192],"show":[194],"SFMs":[197],"learned":[198],"from":[199],"domain":[202],"be":[204],"successfully":[205],"transferred":[206],"CCV":[208],"FCVID":[210]},"counts_by_year":[{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":4},{"year":2019,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
