{"id":"https://openalex.org/W3205408642","doi":"https://doi.org/10.1145/3474085.3475621","title":"Progressive Semantic Matching for Video-Text Retrieval","display_name":"Progressive Semantic Matching for Video-Text Retrieval","publication_year":2021,"publication_date":"2021-10-17","ids":{"openalex":"https://openalex.org/W3205408642","doi":"https://doi.org/10.1145/3474085.3475621","mag":"3205408642"},"language":"en","primary_location":{"id":"doi:10.1145/3474085.3475621","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3474085.3475621","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100757725","display_name":"Hongying Liu","orcid":"https://orcid.org/0000-0002-8475-2749"},"institutions":[{"id":"https://openalex.org/I4210136793","display_name":"Peng Cheng Laboratory","ror":"https://ror.org/03qdqbt06","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210136793"]},{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Hongying Liu","raw_affiliation_strings":["Xidian University &amp; Peng Cheng Laboratory, xi'an, China"],"affiliations":[{"raw_affiliation_string":"Xidian University &amp; Peng Cheng Laboratory, xi'an, China","institution_ids":["https://openalex.org/I4210136793","https://openalex.org/I149594827"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036093027","display_name":"Ru\u2010Yi Luo","orcid":"https://orcid.org/0000-0002-2224-5792"},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ruyi Luo","raw_affiliation_strings":["Xidian University, xi'an, China"],"affiliations":[{"raw_affiliation_string":"Xidian University, xi'an, China","institution_ids":["https://openalex.org/I149594827"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067858777","display_name":"Fanhua Shang","orcid":"https://orcid.org/0000-0002-1040-352X"},"institutions":[{"id":"https://openalex.org/I4210136793","display_name":"Peng Cheng Laboratory","ror":"https://ror.org/03qdqbt06","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210136793"]},{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fanhua Shang","raw_affiliation_strings":["Xidian University &amp; Peng Cheng Laboratory, xi'an, China"],"affiliations":[{"raw_affiliation_string":"Xidian University &amp; Peng Cheng Laboratory, xi'an, China","institution_ids":["https://openalex.org/I4210136793","https://openalex.org/I149594827"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087793098","display_name":"Mantang Niu","orcid":null},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mantang Niu","raw_affiliation_strings":["Xidian University, xi'an, China"],"affiliations":[{"raw_affiliation_string":"Xidian University, xi'an, China","institution_ids":["https://openalex.org/I149594827"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100405051","display_name":"Yuanyuan Liu","orcid":"https://orcid.org/0009-0006-0220-6362"},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuanyuan Liu","raw_affiliation_strings":["Xidian University, xi'an, China"],"affiliations":[{"raw_affiliation_string":"Xidian University, xi'an, China","institution_ids":["https://openalex.org/I149594827"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5100757725"],"corresponding_institution_ids":["https://openalex.org/I149594827","https://openalex.org/I4210136793"],"apc_list":null,"apc_paid":null,"fwci":1.345,"has_fulltext":false,"cited_by_count":18,"citation_normalized_percentile":{"value":0.83196078,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"5083","last_page":"5091"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8624932169914246},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.6819882392883301},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.6783246397972107},{"id":"https://openalex.org/keywords/semantic-gap","display_name":"Semantic gap","score":0.6415044069290161},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.6134201884269714},{"id":"https://openalex.org/keywords/semantic-matching","display_name":"Semantic matching","score":0.5964014530181885},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.5517522692680359},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5200297832489014},{"id":"https://openalex.org/keywords/semantic-space","display_name":"Semantic space","score":0.5123856663703918},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.48278582096099854},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.4676501452922821},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.430003821849823},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3538988530635834},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.2228311002254486},{"id":"https://openalex.org/keywords/image-retrieval","display_name":"Image retrieval","score":0.19866472482681274}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8624932169914246},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.6819882392883301},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.6783246397972107},{"id":"https://openalex.org/C86034646","wikidata":"https://www.wikidata.org/wiki/Q474311","display_name":"Semantic gap","level":4,"score":0.6415044069290161},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.6134201884269714},{"id":"https://openalex.org/C2778493491","wikidata":"https://www.wikidata.org/wiki/Q7449072","display_name":"Semantic matching","level":3,"score":0.5964014530181885},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.5517522692680359},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5200297832489014},{"id":"https://openalex.org/C2986420190","wikidata":"https://www.wikidata.org/wiki/Q39045939","display_name":"Semantic space","level":2,"score":0.5123856663703918},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.48278582096099854},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.4676501452922821},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.430003821849823},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3538988530635834},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.2228311002254486},{"id":"https://openalex.org/C1667742","wikidata":"https://www.wikidata.org/wiki/Q10927554","display_name":"Image retrieval","level":3,"score":0.19866472482681274},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3474085.3475621","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3474085.3475621","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.7099999785423279}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":33,"referenced_works":["https://openalex.org/W1573040851","https://openalex.org/W1832693441","https://openalex.org/W1964073652","https://openalex.org/W2106053110","https://openalex.org/W2119062120","https://openalex.org/W2123024445","https://openalex.org/W2139501017","https://openalex.org/W2162659160","https://openalex.org/W2194775991","https://openalex.org/W2425121537","https://openalex.org/W2549139847","https://openalex.org/W2620629206","https://openalex.org/W2753311918","https://openalex.org/W2808399042","https://openalex.org/W2885775891","https://openalex.org/W2948859046","https://openalex.org/W2950512756","https://openalex.org/W2951019013","https://openalex.org/W2956018683","https://openalex.org/W2963293463","https://openalex.org/W2966146145","https://openalex.org/W2972073579","https://openalex.org/W2975813532","https://openalex.org/W2981716253","https://openalex.org/W2984008963","https://openalex.org/W3003460937","https://openalex.org/W3028831795","https://openalex.org/W3035309251","https://openalex.org/W3035356601","https://openalex.org/W3040166514","https://openalex.org/W3043990051","https://openalex.org/W3102887392","https://openalex.org/W3130796238"],"related_works":["https://openalex.org/W2275988210","https://openalex.org/W2128807628","https://openalex.org/W2083132573","https://openalex.org/W117618596","https://openalex.org/W2584816862","https://openalex.org/W3205408642","https://openalex.org/W4317515582","https://openalex.org/W2157224911","https://openalex.org/W2389678293","https://openalex.org/W2965398302"],"abstract_inverted_index":{"Cross-modal":[0],"retrieval":[1],"between":[2,41,79],"texts":[3,159],"and":[4,28,43,101,119,121,158,178],"videos":[5,42,118,157],"is":[6,32,71],"important":[7],"yet":[8],"challenging.":[9],"Until":[10],"recently,":[11],"previous":[12],"works":[13],"in":[14,135],"this":[15,84,150],"domain":[16],"typically":[17],"rely":[18],"on":[19,171],"learning":[20,95],"a":[21,93,98,103,113,161,166],"common":[22,58,125,141,163],"space":[23,164],"to":[24,34,37,53,147],"match":[25,35],"the":[26,38,75,131,140,152,181],"text":[27],"video,":[29],"but":[30],"it":[31],"difficult":[33],"due":[36],"semantic":[39,77,90],"gap":[40,78,91],"texts.":[44],"Although":[45],"some":[46,123],"methods":[47],"employ":[48],"coarse-to-fine":[49,99],"or":[50,56],"multi-expert":[51],"networks":[52],"encode":[54,156],"one":[55,67],"more":[57],"spaces":[59,142],"for":[60,117],"easier":[61],"matching,":[62],"they":[63],"almost":[64],"directly":[65],"optimize":[66],"matching":[68],"space,":[69],"which":[70,127,186],"challenging,":[72],"because":[73],"of":[74,133,183],"huge":[76],"different":[80,136],"modalities.":[81],"To":[82],"address":[83],"issue,":[85],"we":[86],"aim":[87],"at":[88],"narrowing":[89],"by":[92,130,165],"progressive":[94,167],"process":[96],"with":[97,192],"architecture,":[100],"propose":[102],"novel":[104],"Progressive":[105],"Semantic":[106],"Matching":[107],"(PSM)":[108],"method.":[109],"We":[110],"first":[111],"construct":[112],"multilevel":[114],"encoding":[115],"network":[116],"texts,":[120],"design":[122],"auxiliary":[124],"spaces,":[126],"are":[128,143],"mapped":[129],"outputs":[132],"encoders":[134],"levels.":[137],"Then":[138],"all":[139],"jointly":[144],"trained":[145],"end":[146],"end.":[148],"In":[149],"way,":[151],"model":[153],"can":[154],"effectively":[155],"into":[160],"fusion":[162],"paradigm.":[168],"Experimental":[169],"results":[170],"three":[172],"video-text":[173],"datasets":[174],"(i.e.,":[175],"MSR-VTT,":[176],"TIGF":[177],"MSVD)":[179],"demonstrate":[180],"advantages":[182],"our":[184],"PSM,":[185],"achieves":[187],"significant":[188],"performance":[189],"improvement":[190],"compared":[191],"state-of-the-art":[193],"approaches.":[194]},"counts_by_year":[{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":6}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
