{"id":"https://openalex.org/W2251084241","doi":"https://doi.org/10.14778/2732296.2732301","title":"Effective multi-modal retrieval based on stacked auto-encoders","display_name":"Effective multi-modal retrieval based on stacked auto-encoders","publication_year":2014,"publication_date":"2014-04-01","ids":{"openalex":"https://openalex.org/W2251084241","doi":"https://doi.org/10.14778/2732296.2732301","mag":"2251084241"},"language":"en","primary_location":{"id":"doi:10.14778/2732296.2732301","is_oa":false,"landing_page_url":"https://doi.org/10.14778/2732296.2732301","pdf_url":null,"source":{"id":"https://openalex.org/S4210226185","display_name":"Proceedings of the VLDB Endowment","issn_l":"2150-8097","issn":["2150-8097"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the VLDB Endowment","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100391659","display_name":"Wei Wang","orcid":"https://orcid.org/0000-0001-5367-7056"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":true,"raw_author_name":"Wei Wang","raw_affiliation_strings":["National University of Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"National University of Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024892041","display_name":"Beng Chin Ooi","orcid":"https://orcid.org/0000-0003-4446-1100"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Beng Chin Ooi","raw_affiliation_strings":["National University of Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"National University of Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101767360","display_name":"Xiaoyan Yang","orcid":"https://orcid.org/0000-0001-8546-3589"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiaoyan Yang","raw_affiliation_strings":["Illinois at Singapore Pte, Singapore"],"affiliations":[{"raw_affiliation_string":"Illinois at Singapore Pte, Singapore","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011200911","display_name":"Dongxiang Zhang","orcid":"https://orcid.org/0000-0002-9964-2470"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Dongxiang Zhang","raw_affiliation_strings":["National University of Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"National University of Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5008666077","display_name":"Yueting Zhuang","orcid":"https://orcid.org/0000-0001-9017-2508"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yueting Zhuang","raw_affiliation_strings":["Zhejiang University, China"],"affiliations":[{"raw_affiliation_string":"Zhejiang University, China","institution_ids":["https://openalex.org/I76130692"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5100391659"],"corresponding_institution_ids":["https://openalex.org/I165932596"],"apc_list":null,"apc_paid":null,"fwci":16.0585,"has_fulltext":false,"cited_by_count":146,"citation_normalized_percentile":{"value":0.9936014,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":100},"biblio":{"volume":"7","issue":"8","first_page":"649","last_page":"660"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7920682430267334},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.6404147148132324},{"id":"https://openalex.org/keywords/ranking","display_name":"Ranking (information retrieval)","score":0.5912213325500488},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.563091516494751},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.4991424083709717},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.478145956993103},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.474784791469574},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4538801908493042},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.45311933755874634},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.41962867975234985},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.38202932476997375},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.36115044355392456},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.08207497000694275}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7920682430267334},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.6404147148132324},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.5912213325500488},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.563091516494751},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.4991424083709717},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.478145956993103},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.474784791469574},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4538801908493042},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.45311933755874634},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.41962867975234985},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.38202932476997375},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.36115044355392456},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.08207497000694275},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.14778/2732296.2732301","is_oa":false,"landing_page_url":"https://doi.org/10.14778/2732296.2732301","pdf_url":null,"source":{"id":"https://openalex.org/S4210226185","display_name":"Proceedings of the VLDB Endowment","issn_l":"2150-8097","issn":["2150-8097"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the VLDB Endowment","raw_type":"journal-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.493.7045","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.493.7045","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.comp.nus.edu.sg/~ooibc/crossmodalvldb14.pdf","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.635.7663","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.635.7663","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.vldb.org/pvldb/vol7/p649-wang.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":34,"referenced_works":["https://openalex.org/W44815768","https://openalex.org/W71795751","https://openalex.org/W154472438","https://openalex.org/W199018803","https://openalex.org/W1498436455","https://openalex.org/W1532325895","https://openalex.org/W1541459201","https://openalex.org/W1970055505","https://openalex.org/W2007972815","https://openalex.org/W2025768430","https://openalex.org/W2038436420","https://openalex.org/W2049993534","https://openalex.org/W2064797228","https://openalex.org/W2065528935","https://openalex.org/W2106277773","https://openalex.org/W2112037975","https://openalex.org/W2155803963","https://openalex.org/W2159373756","https://openalex.org/W2164587673","https://openalex.org/W2168231600","https://openalex.org/W2184188583","https://openalex.org/W2218318129","https://openalex.org/W2251864938","https://openalex.org/W2290318471","https://openalex.org/W2293597654","https://openalex.org/W2913932916","https://openalex.org/W2914484425","https://openalex.org/W2963650755","https://openalex.org/W3118608800","https://openalex.org/W4213009331","https://openalex.org/W6684859321","https://openalex.org/W6686207219","https://openalex.org/W6691474080","https://openalex.org/W6697214482"],"related_works":["https://openalex.org/W4390516098","https://openalex.org/W2181948922","https://openalex.org/W2384362569","https://openalex.org/W2188500270","https://openalex.org/W2303858293","https://openalex.org/W2915512527","https://openalex.org/W2798198862","https://openalex.org/W51364034","https://openalex.org/W2898073868","https://openalex.org/W4284663758"],"abstract_inverted_index":{"Multi-modal":[0],"retrieval":[1,13],"is":[2,164],"emerging":[3],"as":[4,125],"a":[5,25,38,57,94,118,141],"new":[6,95],"search":[7,29,187],"paradigm":[8],"that":[9,62,179],"enables":[10],"seamless":[11],"information":[12],"from":[14,50,108],"various":[15],"types":[16,55],"of":[17,40,52,106,121,128,159],"media.":[18],"For":[19],"example,":[20],"users":[21],"can":[22,66],"simply":[23],"snap":[24],"movie":[26],"poster":[27],"to":[28,45,169],"relevant":[30],"reviews":[31],"and":[32,102,131,150],"trailers.":[33],"To":[34],"solve":[35],"the":[36,153,170,190],"problem,":[37],"set":[39],"mapping":[41,76,154],"functions":[42,89,155],"are":[43,90],"learned":[44,91],"project":[46],"high-dimensional":[47],"features":[48],"extracted":[49],"data":[51,107,130,171],"different":[53],"media":[54],"into":[56,148],"common":[58],"low-dimensional":[59],"space":[60],"so":[61],"metric":[63],"distance":[64],"measures":[65],"be":[67],"applied.":[68],"In":[69],"this":[70],"paper,":[71],"we":[72,145],"propose":[73],"an":[74],"effective":[75],"mechanism":[77],"based":[78],"on":[79,174],"deep":[80],"learning":[81],"(i.e.,":[82],"stacked":[83],"auto-encoders)":[84],"for":[85,156],"multi-modal":[86],"retrieval.":[87],"Mapping":[88],"by":[92],"optimizing":[93],"objective":[96],"function,":[97],"which":[98,116],"captures":[99],"both":[100],"intra-modal":[101,129],"inter-modal":[103],"semantic":[104],"relationships":[105],"heterogeneous":[109],"sources":[110],"effectively.":[111],"Compared":[112],"with":[113,167],"previous":[114],"works":[115],"require":[117],"substantial":[119],"amount":[120],"prior":[122,138],"knowledge":[123],"such":[124],"similarity":[126],"matrices":[127],"ranking":[132],"examples,":[133],"our":[134,162,180],"method":[135,163,182],"requires":[136],"little":[137],"knowledge.":[139],"Given":[140],"large":[142],"training":[143],"dataset,":[144],"split":[146],"it":[147],"mini-batches":[149],"continually":[151],"adjust":[152],"each":[157],"batch":[158],"input.":[160],"Hence,":[161],"memory":[165],"efficient":[166],"respect":[168],"volume.":[172],"Experiments":[173],"three":[175],"real":[176],"datasets":[177],"illustrate":[178],"proposed":[181],"achieves":[183],"significant":[184],"improvement":[185],"in":[186],"accuracy":[188],"over":[189],"state-of-the-art":[191],"methods.":[192]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":7},{"year":2021,"cited_by_count":10},{"year":2020,"cited_by_count":18},{"year":2019,"cited_by_count":15},{"year":2018,"cited_by_count":23},{"year":2017,"cited_by_count":21},{"year":2016,"cited_by_count":29},{"year":2015,"cited_by_count":13},{"year":2014,"cited_by_count":2}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
