{"id":"https://openalex.org/W7131661060","doi":"https://doi.org/10.1109/ickg66886.2025.00034","title":"Efficient Text-Video Aligner Method for Text-Video Retrieval","display_name":"Efficient Text-Video Aligner Method for Text-Video Retrieval","publication_year":2025,"publication_date":"2025-11-13","ids":{"openalex":"https://openalex.org/W7131661060","doi":"https://doi.org/10.1109/ickg66886.2025.00034"},"language":null,"primary_location":{"id":"doi:10.1109/ickg66886.2025.00034","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ickg66886.2025.00034","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Knowledge Graph (ICKG)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Huaiqi Li","orcid":null},"institutions":[{"id":"https://openalex.org/I16365422","display_name":"Hefei University of Technology","ror":"https://ror.org/02czkny70","country_code":"CN","type":"education","lineage":["https://openalex.org/I16365422"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Huaiqi Li","raw_affiliation_strings":["School of Computer Science and Information Engineering, Hefei University of Technology,Hefei,China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Information Engineering, Hefei University of Technology,Hefei,China","institution_ids":["https://openalex.org/I16365422"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5126865593","display_name":"Chunxiao Fan","orcid":null},"institutions":[{"id":"https://openalex.org/I16365422","display_name":"Hefei University of Technology","ror":"https://ror.org/02czkny70","country_code":"CN","type":"education","lineage":["https://openalex.org/I16365422"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chunxiao Fan","raw_affiliation_strings":["School of Computer Science and Information Engineering, Hefei University of Technology,Hefei,China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Information Engineering, Hefei University of Technology,Hefei,China","institution_ids":["https://openalex.org/I16365422"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I16365422"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.72284458,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"208","last_page":"215"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.7645999789237976,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.7645999789237976,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.04230000078678131,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.03590000048279762,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.7339000105857849},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.527999997138977},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4952000081539154},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.49059998989105225},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.45820000767707825},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.45399999618530273},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.4309000074863434},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.40119999647140503}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7943000197410583},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.7339000105857849},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.527999997138977},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4952999949455261},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4952000081539154},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.49059998989105225},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.45820000767707825},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.45399999618530273},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.4309000074863434},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.40119999647140503},{"id":"https://openalex.org/C164226766","wikidata":"https://www.wikidata.org/wiki/Q7293202","display_name":"Rank (graph theory)","level":2,"score":0.38589999079704285},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.37290000915527344},{"id":"https://openalex.org/C33676613","wikidata":"https://www.wikidata.org/wiki/Q13415176","display_name":"Dimension (graph theory)","level":2,"score":0.357699990272522},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.3264999985694885},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.32199999690055847},{"id":"https://openalex.org/C2983787585","wikidata":"https://www.wikidata.org/wiki/Q93586","display_name":"Feature matching","level":3,"score":0.29910001158714294},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.28349998593330383},{"id":"https://openalex.org/C142853389","wikidata":"https://www.wikidata.org/wiki/Q744778","display_name":"Association (psychology)","level":2,"score":0.2797999978065491},{"id":"https://openalex.org/C86034646","wikidata":"https://www.wikidata.org/wiki/Q474311","display_name":"Semantic gap","level":4,"score":0.27959999442100525},{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.27649998664855957},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.26930001378059387},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.2687999904155731},{"id":"https://openalex.org/C2781122975","wikidata":"https://www.wikidata.org/wiki/Q16928266","display_name":"Semantic feature","level":2,"score":0.26809999346733093},{"id":"https://openalex.org/C48677424","wikidata":"https://www.wikidata.org/wiki/Q6888088","display_name":"Mode (computer interface)","level":2,"score":0.2590999901294708},{"id":"https://openalex.org/C1667742","wikidata":"https://www.wikidata.org/wiki/Q10927554","display_name":"Image retrieval","level":3,"score":0.25679999589920044}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ickg66886.2025.00034","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ickg66886.2025.00034","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Knowledge Graph (ICKG)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G560437458","display_name":null,"funder_award_id":"61802105","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W1522734439","https://openalex.org/W2130372245","https://openalex.org/W2250539671","https://openalex.org/W2547626548","https://openalex.org/W2963524571","https://openalex.org/W2970641574","https://openalex.org/W3035309251","https://openalex.org/W3035356601","https://openalex.org/W3043840704","https://openalex.org/W3204588463","https://openalex.org/W3206683855","https://openalex.org/W4285606530","https://openalex.org/W4293567872","https://openalex.org/W4304014690","https://openalex.org/W4312372711","https://openalex.org/W4386072365","https://openalex.org/W4390873165","https://openalex.org/W4390874668","https://openalex.org/W4390889802","https://openalex.org/W4402704596","https://openalex.org/W4403791665","https://openalex.org/W4404752290"],"related_works":[],"abstract_inverted_index":{"To":[0],"address":[1],"the":[2,13,20,76,90,147,161],"challenges":[3],"of":[4,15,53,96,150],"global":[5,33,62,118,123],"alignment":[6,63,70,119,125,134],"methods":[7],"in":[8,27,153],"text-video":[9,61,67],"retrieval,":[10],"such":[11],"as":[12,173],"lack":[14],"fine-grained":[16,68,132],"semantic":[17,22,94,124,148],"matching":[18],"and":[19,30,34,65,93,114,128,155,165,170,176],"cross-modal":[21,97],"gap":[23],"leading":[24],"to":[25,107,191],"difficulties":[26],"feature":[28],"alignment,":[29],"considering":[31],"that":[32,179],"local":[35,69,133,151],"information":[36,111],"has":[37],"not":[38],"been":[39],"fully":[40],"utilized,":[41],"we":[42],"propose":[43],"an":[44],"Efficient":[45],"Text-video":[46],"Aligner":[47],"(ETVA)":[48],"method.":[49],"The":[50,72,99,117,131],"model":[51],"consists":[52],"a":[54,57,60,66,103,140],"text":[55,73,82,154],"encoder,":[56,59],"video":[58,100,110],"module,":[64,135],"module.":[71],"encoder":[74,101],"employs":[75],"ALBERT":[77],"model,":[78],"which":[79,136],"accurately":[80],"extracts":[81],"features":[83],"through":[84],"its":[85],"bidirectional":[86],"encoding":[87],"capability,":[88],"enhancing":[89],"temporal":[91],"consistency":[92],"correlation":[95],"features.":[98,130],"utilizes":[102],"multi-expert":[104],"module":[105,120],"strategy":[106],"comprehensively":[108],"capture":[109],"from":[112],"multi-modal":[113],"multi-feature":[115],"perspectives.":[116],"effectively":[121],"achieves":[122],"by":[126],"aggregating":[127],"transforming":[129],"is":[137],"based":[138],"on":[139,160],"shared":[141],"clustering":[142],"center":[143],"mechanism,":[144],"deeply":[145],"explores":[146],"association":[149],"details":[152],"video.":[156],"Experiments":[157],"are":[158],"conducted":[159],"MSRVTT,":[162],"ActivityNet":[163],"Captions,":[164],"LSMDC":[166],"datasets,":[167,185],"using":[168],"Recall@K":[169],"Median":[171],"Rank":[172],"evaluation":[174],"metrics,":[175],"results":[177],"demonstrate":[178],"ETVA":[180],"performs":[181],"well":[182],"across":[183],"different":[184],"with":[186],"improved":[187],"retrieval":[188],"accuracy":[189],"compared":[190],"other":[192],"methods.":[193]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2026-02-27T00:00:00"}
