{"id":"https://openalex.org/W7129022203","doi":"https://doi.org/10.1145/3773966.3779367","title":"Factorized Transport Alignment for Multimodal and Multiview E-commerce Representation Learning","display_name":"Factorized Transport Alignment for Multimodal and Multiview E-commerce Representation Learning","publication_year":2026,"publication_date":"2026-02-16","ids":{"openalex":"https://openalex.org/W7129022203","doi":"https://doi.org/10.1145/3773966.3779367"},"language":null,"primary_location":{"id":"doi:10.1145/3773966.3779367","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3773966.3779367","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Nineteenth ACM International Conference on Web Search and Data Mining","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3773966.3779367","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5060209007","display_name":"X. Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I8078737","display_name":"Clemson University","ror":"https://ror.org/037s24f05","country_code":"US","type":"education","lineage":["https://openalex.org/I8078737"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Xiwen Chen","raw_affiliation_strings":["Clemson University, Clemson, SC, USA"],"affiliations":[{"raw_affiliation_string":"Clemson University, Clemson, SC, USA","institution_ids":["https://openalex.org/I8078737"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121153997","display_name":"Yen-Chieh Lien","orcid":null},"institutions":[{"id":"https://openalex.org/I4210112773","display_name":"Etsy (United States)","ror":"https://ror.org/01kzp9g64","country_code":"US","type":"company","lineage":["https://openalex.org/I4210112773"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yen-Chieh Lien","raw_affiliation_strings":["Etsy, Inc., Brooklyn, NY, USA"],"affiliations":[{"raw_affiliation_string":"Etsy, Inc., Brooklyn, NY, USA","institution_ids":["https://openalex.org/I4210112773"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121157685","display_name":"Susan Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210112773","display_name":"Etsy (United States)","ror":"https://ror.org/01kzp9g64","country_code":"US","type":"company","lineage":["https://openalex.org/I4210112773"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Susan Liu","raw_affiliation_strings":["Etsy, Inc., Brooklyn, NY, USA"],"affiliations":[{"raw_affiliation_string":"Etsy, Inc., Brooklyn, NY, USA","institution_ids":["https://openalex.org/I4210112773"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121187718","display_name":"Mar\u00eda Casta\u00f1os","orcid":null},"institutions":[{"id":"https://openalex.org/I4210112773","display_name":"Etsy (United States)","ror":"https://ror.org/01kzp9g64","country_code":"US","type":"company","lineage":["https://openalex.org/I4210112773"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mar\u00eda Casta\u00f1os","raw_affiliation_strings":["Etsy, Inc., Brooklyn, NY, USA"],"affiliations":[{"raw_affiliation_string":"Etsy, Inc., Brooklyn, NY, USA","institution_ids":["https://openalex.org/I4210112773"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125635832","display_name":"Abolfazl Razi","orcid":null},"institutions":[{"id":"https://openalex.org/I8078737","display_name":"Clemson University","ror":"https://ror.org/037s24f05","country_code":"US","type":"education","lineage":["https://openalex.org/I8078737"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Abolfazl Razi","raw_affiliation_strings":["Clemson University, Clemson, SC, USA"],"affiliations":[{"raw_affiliation_string":"Clemson University, Clemson, SC, USA","institution_ids":["https://openalex.org/I8078737"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013377486","display_name":"Xiaoting Zhao","orcid":null},"institutions":[{"id":"https://openalex.org/I4210112773","display_name":"Etsy (United States)","ror":"https://ror.org/01kzp9g64","country_code":"US","type":"company","lineage":["https://openalex.org/I4210112773"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xiaoting Zhao","raw_affiliation_strings":["Etsy, Inc., Brooklyn, NY, USA"],"affiliations":[{"raw_affiliation_string":"Etsy, Inc., Brooklyn, NY, USA","institution_ids":["https://openalex.org/I4210112773"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5086078358","display_name":"Congzhe Su","orcid":"https://orcid.org/0009-0004-4225-0056"},"institutions":[{"id":"https://openalex.org/I4210112773","display_name":"Etsy (United States)","ror":"https://ror.org/01kzp9g64","country_code":"US","type":"company","lineage":["https://openalex.org/I4210112773"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Congzhe Su","raw_affiliation_strings":["Etsy, Inc., Brooklyn, NY, USA"],"affiliations":[{"raw_affiliation_string":"Etsy, Inc., Brooklyn, NY, USA","institution_ids":["https://openalex.org/I4210112773"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5060209007"],"corresponding_institution_ids":["https://openalex.org/I8078737"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.82720978,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1105","last_page":"1109"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.47850000858306885,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.47850000858306885,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.09260000288486481,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.05299999937415123,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6996999979019165},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.5843999981880188},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.5231999754905701},{"id":"https://openalex.org/keywords/sampling","display_name":"Sampling (signal processing)","score":0.42590001225471497},{"id":"https://openalex.org/keywords/quadratic-equation","display_name":"Quadratic equation","score":0.3797999918460846},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.37310001254081726},{"id":"https://openalex.org/keywords/scope","display_name":"Scope (computer science)","score":0.3707999885082245},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.36489999294281006}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7644000053405762},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6996999979019165},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.5843999981880188},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5584999918937683},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.5231999754905701},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.426800012588501},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.42590001225471497},{"id":"https://openalex.org/C129844170","wikidata":"https://www.wikidata.org/wiki/Q41299","display_name":"Quadratic equation","level":2,"score":0.3797999918460846},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.37310001254081726},{"id":"https://openalex.org/C2778012447","wikidata":"https://www.wikidata.org/wiki/Q1034415","display_name":"Scope (computer science)","level":2,"score":0.3707999885082245},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.36489999294281006},{"id":"https://openalex.org/C90673727","wikidata":"https://www.wikidata.org/wiki/Q901718","display_name":"Product (mathematics)","level":2,"score":0.36329999566078186},{"id":"https://openalex.org/C2780660688","wikidata":"https://www.wikidata.org/wiki/Q25052564","display_name":"Multimodal learning","level":2,"score":0.359499990940094},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.3391999900341034},{"id":"https://openalex.org/C2777027219","wikidata":"https://www.wikidata.org/wiki/Q1284190","display_name":"Constant (computer programming)","level":2,"score":0.29919999837875366},{"id":"https://openalex.org/C81845259","wikidata":"https://www.wikidata.org/wiki/Q290117","display_name":"Quadratic programming","level":2,"score":0.29190000891685486},{"id":"https://openalex.org/C2780910867","wikidata":"https://www.wikidata.org/wiki/Q1952416","display_name":"Multimodality","level":2,"score":0.27320000529289246},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.27059999108314514},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.2702000141143799},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2632000148296356},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.2621000111103058},{"id":"https://openalex.org/C2778828372","wikidata":"https://www.wikidata.org/wiki/Q5283209","display_name":"Distributional semantics","level":3,"score":0.26179999113082886}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3773966.3779367","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3773966.3779367","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Nineteenth ACM International Conference on Web Search and Data Mining","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3773966.3779367","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3773966.3779367","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Nineteenth ACM International Conference on Web Search and Data Mining","raw_type":"proceedings-article"},"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","id":"https://metadata.un.org/sdg/9","score":0.5020670890808105}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":3,"referenced_works":["https://openalex.org/W2053323136","https://openalex.org/W4290927925","https://openalex.org/W4327644554"],"related_works":[],"abstract_inverted_index":{"The":[0],"rapid":[1],"growth":[2],"of":[3,67,96,116,128],"e-commerce":[4,169],"requires":[5],"robust":[6],"multimodal":[7,57,152],"representations":[8],"that":[9,36,55],"capture":[10],"diverse":[11],"signals":[12],"from":[13,91],"user-generated":[14],"listings.":[15],"Existing":[16],"vision\u2013language":[17],"models":[18],"(VLMs)":[19],"typically":[20],"align":[21],"titles":[22],"with":[23,119,159],"primary":[24,81],"images,":[25],"i.e.,":[26],"single-view,":[27],"but":[28],"overlook":[29],"non-primary":[30],"images":[31],"and":[32,58,73,132,142],"auxiliary":[33,86],"textual":[34],"views":[35,82,97,105],"provide":[37],"critical":[38],"semantics":[39],"in":[40,93,140],"open":[41],"marketplaces":[42],"such":[43],"as":[44],"Etsy":[45],"or":[46],"Poshmark.":[47],"To":[48],"this":[49],"end,":[50],"we":[51],"propose":[52],"a":[53,64,109],"framework":[54,156],"unifies":[56],"multi-view":[59,164],"learning":[60],"through":[61],"Factorized":[62],"Transport,":[63],"lightweight":[65],"approximation":[66],"optimal":[68,160],"transport,":[69],"designed":[70],"for":[71,167],"scalability":[72,158],"deployment":[74],"efficiency.":[75],"During":[76],"training,":[77],"the":[78,94,114],"method":[79],"emphasizes":[80],"while":[83],"stochastically":[84],"sampling":[85],"ones,":[87],"reducing":[88],"training":[89],"cost":[90],"quadratic":[92],"number":[95],"to":[98,147],"constant":[99],"per":[100],"item.":[101],"At":[102],"inference,":[103],"all":[104],"are":[106],"fused":[107],"into":[108],"single":[110],"cached":[111],"embedding,":[112],"preserving":[113],"efficiency":[115],"two-tower":[117],"retrieval":[118],"no":[120],"additional":[121],"online":[122],"overhead.":[123],"On":[124],"an":[125],"industrial":[126],"dataset":[127],"1M":[129],"product":[130],"listings":[131],"0.3M":[133],"interactions,":[134],"our":[135,155],"approach":[136],"delivers":[137],"consistent":[138],"improvements":[139],"cross-view":[141],"query-to-item":[143],"retrieval,":[144],"achieving":[145],"up":[146],"+7.9%":[148],"Recall@500":[149],"over":[150],"strong":[151],"baselines.":[153],"Overall,":[154],"bridges":[157],"transport\u2013based":[161],"learning,":[162],"making":[163],"pretraining":[165],"practical":[166],"large-scale":[168],"search.":[170]},"counts_by_year":[],"updated_date":"2026-02-18T06:20:13.636215","created_date":"2026-02-17T00:00:00"}
