{"id":"https://openalex.org/W4312572439","doi":"https://doi.org/10.1145/3556089.3556149","title":"E-Commerce Product Matching at Internet Scale","display_name":"E-Commerce Product Matching at Internet Scale","publication_year":2022,"publication_date":"2022-07-16","ids":{"openalex":"https://openalex.org/W4312572439","doi":"https://doi.org/10.1145/3556089.3556149"},"language":"en","primary_location":{"id":"doi:10.1145/3556089.3556149","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3556089.3556149","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 13th International Conference on E-business, Management and Economics","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5006881411","display_name":"Muralidhar Sortur","orcid":"https://orcid.org/0000-0001-6310-1034"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Muralidhar Sortur","raw_affiliation_strings":["Rakuten India, India"],"raw_orcid":"https://orcid.org/0000-0001-6310-1034","affiliations":[{"raw_affiliation_string":"Rakuten India, India","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034896106","display_name":"Pawan Rajpoot","orcid":"https://orcid.org/0000-0003-4733-1686"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pawan Rajpoot","raw_affiliation_strings":["Rakuten India, India"],"raw_orcid":"https://orcid.org/0000-0003-4733-1686","affiliations":[{"raw_affiliation_string":"Rakuten India, India","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109594146","display_name":"Manjunath","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Manjunath","raw_affiliation_strings":["Rakuten India, India"],"raw_orcid":"https://orcid.org/0000-0002-2060-9505","affiliations":[{"raw_affiliation_string":"Rakuten India, India","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014566532","display_name":"Subhanandh","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Subhanandh","raw_affiliation_strings":["Rakuten India, India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Rakuten India, India","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5034957222","display_name":"Hari Charan Rao","orcid":"https://orcid.org/0009-0004-2644-5654"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hari Charan Rao","raw_affiliation_strings":["Rakuten India, India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Rakuten India, India","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.26234191,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"45","last_page":"51"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.9828000068664551,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.767186164855957},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.6682052612304688},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6456249356269836},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5436796545982361},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5241956114768982},{"id":"https://openalex.org/keywords/product","display_name":"Product (mathematics)","score":0.5097031593322754},{"id":"https://openalex.org/keywords/bloom-filter","display_name":"Bloom filter","score":0.49694564938545227},{"id":"https://openalex.org/keywords/taxonomy","display_name":"Taxonomy (biology)","score":0.46513739228248596},{"id":"https://openalex.org/keywords/the-internet","display_name":"The Internet","score":0.44624796509742737},{"id":"https://openalex.org/keywords/false-positive-paradox","display_name":"False positive paradox","score":0.43853768706321716},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.4155048429965973},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2559516429901123},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.24772822856903076},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.13630026578903198},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.11035838723182678},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.07743117213249207}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.767186164855957},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.6682052612304688},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6456249356269836},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5436796545982361},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5241956114768982},{"id":"https://openalex.org/C90673727","wikidata":"https://www.wikidata.org/wiki/Q901718","display_name":"Product (mathematics)","level":2,"score":0.5097031593322754},{"id":"https://openalex.org/C147224247","wikidata":"https://www.wikidata.org/wiki/Q885373","display_name":"Bloom filter","level":2,"score":0.49694564938545227},{"id":"https://openalex.org/C58642233","wikidata":"https://www.wikidata.org/wiki/Q8269924","display_name":"Taxonomy (biology)","level":2,"score":0.46513739228248596},{"id":"https://openalex.org/C110875604","wikidata":"https://www.wikidata.org/wiki/Q75","display_name":"The Internet","level":2,"score":0.44624796509742737},{"id":"https://openalex.org/C64869954","wikidata":"https://www.wikidata.org/wiki/Q1859747","display_name":"False positive paradox","level":2,"score":0.43853768706321716},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.4155048429965973},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2559516429901123},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.24772822856903076},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.13630026578903198},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.11035838723182678},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.07743117213249207},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C59822182","wikidata":"https://www.wikidata.org/wiki/Q441","display_name":"Botany","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3556089.3556149","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3556089.3556149","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 13th International Conference on E-business, Management and Economics","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","id":"https://metadata.un.org/sdg/9","score":0.5}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":11,"referenced_works":["https://openalex.org/W1614298861","https://openalex.org/W1940872118","https://openalex.org/W2031767704","https://openalex.org/W2058715873","https://openalex.org/W2070996757","https://openalex.org/W2560674852","https://openalex.org/W2963626623","https://openalex.org/W3107323053","https://openalex.org/W3118316880","https://openalex.org/W3214074647","https://openalex.org/W4300613830"],"related_works":["https://openalex.org/W2127784084","https://openalex.org/W2950578529","https://openalex.org/W2086416962","https://openalex.org/W4383553080","https://openalex.org/W2155669648","https://openalex.org/W4293879742","https://openalex.org/W2212047860","https://openalex.org/W2167538128","https://openalex.org/W2148425737","https://openalex.org/W4300824226"],"abstract_inverted_index":{"In":[0],"E-Commerce,":[1],"Product":[2,58,73,169],"Matching":[3,74],"is":[4,37,69],"one":[5],"of":[6,18,22,49,51,56,83,108,119,148,168],"the":[7,65,89,94,101,104,146,165],"fundamental":[8],"problems":[9],"for":[10,67,139],"various":[11,30],"use":[12,72,76],"cases":[13],"like":[14],"(1)":[15,111],"Competitive":[16],"pricing":[17],"products,":[19],"(2)":[20,117],"deduplication":[21],"products":[23,120],"in":[24],"catalog,":[25],"(3)":[26,121],"grouping":[27],"items":[28],"from":[29,124],"merchants":[31],"(4)":[32,131],"Recommending":[33],"products.":[34],"The":[35],"requirement":[36],"to":[38,71,92,144,163],"match":[39],"a":[40,44,81],"product":[41,154,176],"accurately":[42],"against":[43,133],"catalog":[45],"spread":[46],"across":[47,75],"tens":[48],"thousands":[50],"taxonomy":[52,115],"nodes":[53],"and":[54,64,127,136,157],"millions":[55],"items.":[57],"matching":[59,177],"results":[60,138,178],"must":[61],"be":[62],"accurate,":[63],"margin":[66],"error":[68],"minimal":[70],"cases.":[77],"This":[78,171],"paper":[79],"proposes":[80],"combination":[82],"Deep":[84],"Learning":[85],"models":[86],"integrated":[87],"into":[88],"scalable":[90],"architecture":[91],"achieve":[93],"required":[95],"results.":[96,150],"Here":[97],"we":[98],"have":[99,152],"approached":[100],"problem":[102],"at":[103,160,179],"grass-root":[105],"level":[106],"consisting":[107],"five":[109],"stages":[110],"Identifying":[112],"attributes":[113,141],"per":[114],"node":[116],"classification":[118],"Attribute":[122],"Enrichment":[123],"NER":[125],"(Text)":[126],"Image":[128],"feature":[129],"extraction":[130],"Search":[132],"multiple":[134],"indices":[135],"filter":[137],"mandatory":[140],"(5)":[142],"Re-rank":[143],"improve":[145,164],"relevancy":[147],"shortlisted":[149],"We":[151],"defined":[153],"data":[155],"quality":[156],"measured":[158],"it":[159],"every":[161],"stage":[162],"overall":[166],"performance":[167],"Matching.":[170],"approach":[172],"has":[173],"yielded":[174],"accurate":[175],"scale":[180],"minimising":[181],"false-positives":[182]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
