{"id":"https://openalex.org/W2789779524","doi":"https://doi.org/10.1109/vcip.2017.8305114","title":"Learning multi-view embedding in joint space for bidirectional image-text retrieval","display_name":"Learning multi-view embedding in joint space for bidirectional image-text retrieval","publication_year":2017,"publication_date":"2017-12-01","ids":{"openalex":"https://openalex.org/W2789779524","doi":"https://doi.org/10.1109/vcip.2017.8305114","mag":"2789779524"},"language":"en","primary_location":{"id":"doi:10.1109/vcip.2017.8305114","is_oa":false,"landing_page_url":"https://doi.org/10.1109/vcip.2017.8305114","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE Visual Communications and Image Processing (VCIP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5000248129","display_name":"Ran Lu","orcid":"https://orcid.org/0000-0003-3239-3331"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Lu Ran","raw_affiliation_strings":["School of Electronic and Computer Engineering, Peking University, Shenzhen, Guangdong Province, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic and Computer Engineering, Peking University, Shenzhen, Guangdong Province, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5017052768","display_name":"Wenmin Wang","orcid":"https://orcid.org/0000-0003-2664-4413"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenmin Wang","raw_affiliation_strings":["School of Electronic and Computer Engineering, Peking University, Shenzhen, Guangdong Province, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic and Computer Engineering, Peking University, Shenzhen, Guangdong Province, China","institution_ids":["https://openalex.org/I20231570"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5000248129"],"corresponding_institution_ids":["https://openalex.org/I20231570"],"apc_list":null,"apc_paid":null,"fwci":0.091,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.5084854,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"4"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7607139945030212},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.7258855104446411},{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.6986227035522461},{"id":"https://openalex.org/keywords/phrase","display_name":"Phrase","score":0.6517391800880432},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6406351923942566},{"id":"https://openalex.org/keywords/subspace-topology","display_name":"Subspace topology","score":0.5661011934280396},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4591606855392456},{"id":"https://openalex.org/keywords/merge","display_name":"Merge (version control)","score":0.4427911043167114},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4234750270843506},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3166046738624573}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7607139945030212},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.7258855104446411},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.6986227035522461},{"id":"https://openalex.org/C2776224158","wikidata":"https://www.wikidata.org/wiki/Q187931","display_name":"Phrase","level":2,"score":0.6517391800880432},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6406351923942566},{"id":"https://openalex.org/C32834561","wikidata":"https://www.wikidata.org/wiki/Q660730","display_name":"Subspace topology","level":2,"score":0.5661011934280396},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4591606855392456},{"id":"https://openalex.org/C197129107","wikidata":"https://www.wikidata.org/wiki/Q1921621","display_name":"Merge (version control)","level":2,"score":0.4427911043167114},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4234750270843506},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3166046738624573}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/vcip.2017.8305114","is_oa":false,"landing_page_url":"https://doi.org/10.1109/vcip.2017.8305114","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE Visual Communications and Image Processing (VCIP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.47999998927116394,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W68733909","https://openalex.org/W639708223","https://openalex.org/W1686810756","https://openalex.org/W1905882502","https://openalex.org/W1949478088","https://openalex.org/W1957706851","https://openalex.org/W2112912048","https://openalex.org/W2119775030","https://openalex.org/W2123024445","https://openalex.org/W2149557440","https://openalex.org/W2164019165","https://openalex.org/W2189070436","https://openalex.org/W2346425926","https://openalex.org/W2481240925","https://openalex.org/W2613718673","https://openalex.org/W2963758027","https://openalex.org/W6620707391","https://openalex.org/W6637373629","https://openalex.org/W6677994088","https://openalex.org/W6678470764","https://openalex.org/W6684165356","https://openalex.org/W6686883664"],"related_works":["https://openalex.org/W1980381208","https://openalex.org/W2039546652","https://openalex.org/W2364594919","https://openalex.org/W2081900870","https://openalex.org/W2167092671","https://openalex.org/W4234886518","https://openalex.org/W2389591058","https://openalex.org/W1861706286","https://openalex.org/W2382112581","https://openalex.org/W2597655663"],"abstract_inverted_index":{"In":[0,42,69,112],"this":[1],"paper,":[2],"we":[3,46,73,123],"propose":[4],"a":[5,9,32,39,60,90,107,120],"framework":[6],"for":[7,13],"learning":[8],"joint":[10,139],"embedding":[11,20],"space":[12,140],"bidirectional":[14],"image-text":[15,162],"retrieval":[16,163],"task,":[17],"which":[18],"fuses":[19],"spaces":[21],"in":[22,99,151],"multi-views.":[23],"We":[24,93],"have":[25],"implemented":[26],"two":[27,101],"views":[28],"currently,":[29],"one":[30],"is":[31,38],"frame-sentence":[33,44],"view":[34],"and":[35,53,80,86,149,154,179],"the":[36,43,51,57,65,70,78,84,96,100,125,131,158,161,171,174,177],"other":[37],"region-phrase":[40,71],"view.":[41],"view,":[45,72,114],"project":[47],"each":[48,54,75,81,113],"frame":[49],"of":[50,56,77,83,173],"images":[52,148],"sentence":[55],"texts":[58,150],"into":[59,89,119],"holistic-level":[61],"subspace":[62],"to":[63,115,129],"explore":[64],"correlation":[66],"between":[67,147],"them.":[68],"extract":[74],"region":[76],"frames":[79],"phrase":[82],"sentences":[85],"map":[87],"them":[88,105],"local-level":[91],"subspace.":[92],"separately":[94],"mine":[95],"semantic":[97,145],"correlations":[98,146],"views,":[102],"then":[103],"merge":[104],"by":[106],"multi-view":[108,138],"fusion":[109],"ranking":[110],"method.":[111],"embed":[116],"heterogeneous":[117],"data":[118],"common":[121],"space,":[122],"adopt":[124],"two-branch":[126],"neural":[127],"network":[128],"transform":[130],"data.":[132],"Extensive":[133],"experiments":[134],"show":[135],"that":[136],"our":[137],"can":[141,155],"preserve":[142],"more":[143],"accurate":[144],"different":[152],"granularities":[153],"significantly":[156],"improve":[157],"performance":[159],"on":[160,176],"task.":[164],"Our":[165],"method":[166],"achieves":[167],"better":[168],"results":[169],"than":[170],"state":[172],"art":[175],"Pascal1K":[178],"Flickr8K":[180],"image-sentence":[181],"datasets.":[182]},"counts_by_year":[{"year":2020,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
