{"id":"https://openalex.org/W4396214409","doi":"https://doi.org/10.1109/tcsvt.2024.3394551","title":"Multi-Layer Probabilistic Association Reasoning Network for Image-Text Retrieval","display_name":"Multi-Layer Probabilistic Association Reasoning Network for Image-Text Retrieval","publication_year":2024,"publication_date":"2024-04-29","ids":{"openalex":"https://openalex.org/W4396214409","doi":"https://doi.org/10.1109/tcsvt.2024.3394551"},"language":"en","primary_location":{"id":"doi:10.1109/tcsvt.2024.3394551","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2024.3394551","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100739626","display_name":"Wenrui Li","orcid":"https://orcid.org/0000-0003-0635-7919"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Wenrui Li","raw_affiliation_strings":["Department of Computer Science and Technology, Harbin Institute of Technology, Harbin, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, Harbin Institute of Technology, Harbin, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013727612","display_name":"Ruiqin Xiong","orcid":"https://orcid.org/0000-0001-9796-0478"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ruiqin Xiong","raw_affiliation_strings":["School of Electronic Engineering and Computer Science, Institute of Digital Media, Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic Engineering and Computer Science, Institute of Digital Media, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5079412089","display_name":"Xiaopeng Fan","orcid":"https://orcid.org/0000-0002-9660-3636"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaopeng Fan","raw_affiliation_strings":["Department of Computer Science and Technology, Harbin Institute of Technology, Harbin, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, Harbin Institute of Technology, Harbin, China","institution_ids":["https://openalex.org/I204983213"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100739626"],"corresponding_institution_ids":["https://openalex.org/I204983213"],"apc_list":null,"apc_paid":null,"fwci":2.6651,"has_fulltext":false,"cited_by_count":11,"citation_normalized_percentile":{"value":0.90965789,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":"34","issue":"10","first_page":"9706","last_page":"9717"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9453999996185303,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9453999996185303,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7081307768821716},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.6436174511909485},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5294879078865051},{"id":"https://openalex.org/keywords/layer","display_name":"Layer (electronics)","score":0.527317464351654},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.5044976472854614},{"id":"https://openalex.org/keywords/association","display_name":"Association (psychology)","score":0.5011703968048096},{"id":"https://openalex.org/keywords/case-based-reasoning","display_name":"Case-based reasoning","score":0.4409831166267395},{"id":"https://openalex.org/keywords/image-retrieval","display_name":"Image retrieval","score":0.42876705527305603},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.37692636251449585},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.36295223236083984}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7081307768821716},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.6436174511909485},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5294879078865051},{"id":"https://openalex.org/C2779227376","wikidata":"https://www.wikidata.org/wiki/Q6505497","display_name":"Layer (electronics)","level":2,"score":0.527317464351654},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.5044976472854614},{"id":"https://openalex.org/C142853389","wikidata":"https://www.wikidata.org/wiki/Q744778","display_name":"Association (psychology)","level":2,"score":0.5011703968048096},{"id":"https://openalex.org/C20162079","wikidata":"https://www.wikidata.org/wiki/Q1151406","display_name":"Case-based reasoning","level":2,"score":0.4409831166267395},{"id":"https://openalex.org/C1667742","wikidata":"https://www.wikidata.org/wiki/Q10927554","display_name":"Image retrieval","level":3,"score":0.42876705527305603},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.37692636251449585},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.36295223236083984},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsvt.2024.3394551","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2024.3394551","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3445816967","display_name":null,"funder_award_id":"2021YFF0900500","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G5430980299","display_name":null,"funder_award_id":"U22B2035","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5887223637","display_name":null,"funder_award_id":"62441202","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":51,"referenced_works":["https://openalex.org/W1773149199","https://openalex.org/W1861492603","https://openalex.org/W2885272854","https://openalex.org/W2894786240","https://openalex.org/W2962964995","https://openalex.org/W2964271799","https://openalex.org/W2966715458","https://openalex.org/W2969679616","https://openalex.org/W2981586349","https://openalex.org/W2988823324","https://openalex.org/W2991118492","https://openalex.org/W3005971801","https://openalex.org/W3015686016","https://openalex.org/W3035454331","https://openalex.org/W3035605030","https://openalex.org/W3072820880","https://openalex.org/W3090449556","https://openalex.org/W3093199520","https://openalex.org/W3099614098","https://openalex.org/W3118694826","https://openalex.org/W3138516171","https://openalex.org/W3155230099","https://openalex.org/W3155471926","https://openalex.org/W3168433561","https://openalex.org/W3197809352","https://openalex.org/W3207608362","https://openalex.org/W3207778762","https://openalex.org/W3213100861","https://openalex.org/W4200051180","https://openalex.org/W4225329158","https://openalex.org/W4226391640","https://openalex.org/W4283693981","https://openalex.org/W4283812943","https://openalex.org/W4285118104","https://openalex.org/W4287511972","https://openalex.org/W4293518982","https://openalex.org/W4294891625","https://openalex.org/W4304091789","https://openalex.org/W4304092370","https://openalex.org/W4306933361","https://openalex.org/W4312761738","https://openalex.org/W4313477296","https://openalex.org/W4322576838","https://openalex.org/W4385895960","https://openalex.org/W4386071847","https://openalex.org/W4387968071","https://openalex.org/W4388190088","https://openalex.org/W4389675233","https://openalex.org/W6620707391","https://openalex.org/W6766904570","https://openalex.org/W6803448863"],"related_works":["https://openalex.org/W2352440174","https://openalex.org/W4309440960","https://openalex.org/W2494523064","https://openalex.org/W2943623134","https://openalex.org/W2588219639","https://openalex.org/W2215759665","https://openalex.org/W2030292806","https://openalex.org/W2960358116","https://openalex.org/W4287727129","https://openalex.org/W2062168445"],"abstract_inverted_index":{"With":[0],"the":[1,6,17,28,42,60,69,95,109,119,135,140,146,156,191,197,212,215],"advancement":[2],"of":[3,8,139,214],"deep":[4],"learning,":[5],"task":[7],"image-text":[9],"retrieval":[10,200],"has":[11],"received":[12],"widespread":[13],"attention":[14],"for":[15,38],"addressing":[16],"semantic":[18,147,158,173],"heterogeneity":[19],"in":[20,31,48,52],"multimodal":[21],"data.":[22],"However,":[23],"many":[24],"existing":[25],"methods":[26],"ignore":[27],"uncertainty":[29],"present":[30],"manually":[32],"annotated":[33],"datasets.":[34],"It":[35],"is":[36,74,152,168],"crucial":[37],"models":[39],"to":[40,76,91,154,170,179,204],"learn":[41],"potential":[43],"corresponding":[44],"relationships":[45,100],"between":[46,101,112],"regions":[47],"images":[49],"and":[50,80,93,98,103,114,178,193],"words":[51],"sentences.":[53],"To":[54,106],"tackle":[55],"these":[56,129],"challenges,":[57],"we":[58,117,144],"introduce":[59,145],"Multi-layer":[61],"Probabilistic":[62],"Association":[63],"Reasoning":[64],"Network":[65],"(MPARN).":[66],"In":[67],"MPARN,":[68],"region-word":[70],"association":[71,110,121,217],"reasoning":[72,149],"module":[73],"developed":[75],"treat":[77],"each":[78,161,176],"visual":[79,102,113],"textual":[81,104,115],"fragment":[82],"as":[83],"unique":[84],"probability":[85,122],"distributions.":[86,218],"This":[87,124],"allows":[88],"our":[89],"model":[90],"imagine":[92],"capture":[94],"intricate":[96],"one-to-many":[97],"many-to-many":[99],"objects.":[105],"effectively":[107,131],"integrate":[108],"distributions":[111,130],"modalities,":[116],"propose":[118],"cross-modal":[120],"composer.":[123],"composer":[125,167],"not":[126],"only":[127],"combines":[128],"but":[132],"also":[133],"preserves":[134],"intrinsic":[136],"hierarchical":[137],"structure":[138],"elements":[141],"involved.":[142],"Furthermore,":[143],"relationship":[148],"module,":[150],"which":[151],"designed":[153],"analyze":[155],"contextual":[157],"information":[159],"within":[160,175],"modality.":[162],"The":[163,207],"multi-layer":[164],"adaptive":[165],"aggregate":[166],"employed":[169],"progressively":[171],"explore":[172],"correlations":[174],"modality":[177],"dynamically":[180],"synthesize":[181],"outputs":[182],"based":[183],"on":[184,190],"their":[185],"relevance.":[186],"Our":[187],"extensive":[188],"experiments":[189],"Flickr30K":[192],"MSCOCO":[194],"datasets":[195],"demonstrate":[196],"MPARN\u2019s":[198],"state-of-the-art":[199],"performance":[201],"when":[202],"compared":[203],"other":[205],"baselines.":[206],"qualitative":[208],"results":[209],"further":[210],"validate":[211],"effectiveness":[213],"probabilistic":[216]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":8}],"updated_date":"2026-04-16T08:26:57.006410","created_date":"2025-10-10T00:00:00"}
