{"id":"https://openalex.org/W4376852307","doi":"https://doi.org/10.1145/3573942.3574072","title":"Research on Image Description Generation Method Based on G-AoANet","display_name":"Research on Image Description Generation Method Based on G-AoANet","publication_year":2022,"publication_date":"2022-09-23","ids":{"openalex":"https://openalex.org/W4376852307","doi":"https://doi.org/10.1145/3573942.3574072"},"language":"en","primary_location":{"id":"doi:10.1145/3573942.3574072","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1145/3573942.3574072","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2022 5th International Conference on Artificial Intelligence and Pattern Recognition","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5005451272","display_name":"Pingan Qiao","orcid":"https://orcid.org/0000-0002-4821-2518"},"institutions":[{"id":"https://openalex.org/I4210136859","display_name":"Xi\u2019an University of Posts and Telecommunications","ror":"https://ror.org/04jn0td46","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210136859"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Pingan Qiao","raw_affiliation_strings":["Xi'an University of Posts and Telecommunications, China"],"raw_orcid":"https://orcid.org/0000-0002-4821-2518","affiliations":[{"raw_affiliation_string":"Xi'an University of Posts and Telecommunications, China","institution_ids":["https://openalex.org/I4210136859"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055868469","display_name":"Ruixue Shen","orcid":null},"institutions":[{"id":"https://openalex.org/I4210136859","display_name":"Xi\u2019an University of Posts and Telecommunications","ror":"https://ror.org/04jn0td46","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210136859"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ruixue Shen","raw_affiliation_strings":["Xi'an University of Posts and Telecommunications, China"],"raw_orcid":"https://orcid.org/0000-0002-2705-1436","affiliations":[{"raw_affiliation_string":"Xi'an University of Posts and Telecommunications, China","institution_ids":["https://openalex.org/I4210136859"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101895506","display_name":"Yuan Li","orcid":"https://orcid.org/0000-0002-3383-3573"},"institutions":[{"id":"https://openalex.org/I4210136859","display_name":"Xi\u2019an University of Posts and Telecommunications","ror":"https://ror.org/04jn0td46","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210136859"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuan Li","raw_affiliation_strings":["Xi'an University of Posts and Telecommunications, China"],"raw_orcid":"https://orcid.org/0000-0002-3383-3573","affiliations":[{"raw_affiliation_string":"Xi'an University of Posts and Telecommunications, China","institution_ids":["https://openalex.org/I4210136859"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5005451272"],"corresponding_institution_ids":["https://openalex.org/I4210136859"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.17196463,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"631","last_page":"636"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.994700014591217,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7698416709899902},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.7461051940917969},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.6897492408752441},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.6893825531005859},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.6320493221282959},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.593492865562439},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5838932991027832},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.40794894099235535},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.35713934898376465},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3356831669807434},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3267848491668701}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7698416709899902},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.7461051940917969},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.6897492408752441},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.6893825531005859},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.6320493221282959},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.593492865562439},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5838932991027832},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.40794894099235535},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.35713934898376465},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3356831669807434},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3267848491668701},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3573942.3574072","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1145/3573942.3574072","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2022 5th International Conference on Artificial Intelligence and Pattern Recognition","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W1502957213","https://openalex.org/W1861492603","https://openalex.org/W1897761818","https://openalex.org/W1902237438","https://openalex.org/W1931639407","https://openalex.org/W1956340063","https://openalex.org/W1969616664","https://openalex.org/W2122710056","https://openalex.org/W2133564696","https://openalex.org/W2149172860","https://openalex.org/W2157331557","https://openalex.org/W2183341477","https://openalex.org/W2293453011","https://openalex.org/W2506483933","https://openalex.org/W2986670728","https://openalex.org/W6898505805"],"related_works":["https://openalex.org/W4390516098","https://openalex.org/W2181948922","https://openalex.org/W2384362569","https://openalex.org/W2142795561","https://openalex.org/W2012531322","https://openalex.org/W4205302943","https://openalex.org/W2561132942","https://openalex.org/W2402761219","https://openalex.org/W3155418658","https://openalex.org/W4243199227"],"abstract_inverted_index":{"Most":[0],"of":[1,23,108],"the":[2,8,18,50,62,75,106,109,116,119,128],"image":[3,47],"description":[4],"generation":[5],"methods":[6],"in":[7,61],"attention-based":[9],"encoder-decoder":[10],"framework":[11],"extract":[12],"local":[13,24,89],"features":[14,87],"from":[15],"images.":[16],"Despite":[17],"relatively":[19],"high":[20],"semantic":[21],"level":[22],"features,":[25],"it":[26],"still":[27],"has":[28],"two":[29],"problems":[30],"to":[31,73,84],"be":[32,43,59],"solved,":[33],"one":[34],"is":[35,52,71],"object":[36,57,101],"loss,":[37],"where":[38],"some":[39],"important":[40],"objects":[41],"may":[42,58],"lost":[44],"when":[45],"generating":[46],"descriptions,":[48],"and":[49,102,124,134],"other":[51],"prediction":[53],"error,":[54],"as":[55],"an":[56,81],"identified":[60],"wrong":[63],"class.":[64],"In":[65,91],"this":[66,92],"paper,":[67],"a":[68],"G-AoANet":[69],"model":[70,79,95,117],"proposed":[72],"solve":[74],"above":[76],"problems.":[77],"The":[78],"uses":[80],"attention":[82],"mechanism":[83],"combine":[85],"global":[86],"with":[88],"features.":[90],"way,":[93],"our":[94],"can":[96],"selectively":[97],"focus":[98],"on":[99,127],"both":[100],"contextual":[103],"information,":[104],"improving":[105],"quality":[107],"generated":[110],"descriptions.":[111],"Experimental":[112],"results":[113],"show":[114],"that":[115],"improves":[118],"initially":[120],"reported":[121],"best":[122],"CIDEr-D":[123],"SPICE":[125],"scores":[126],"MS":[129],"COCO":[130],"dataset":[131],"by":[132],"9.3%":[133],"5.1%":[135],"respectively.":[136]},"counts_by_year":[],"updated_date":"2025-12-24T23:09:58.560324","created_date":"2025-10-10T00:00:00"}
