{"id":"https://openalex.org/W2913410650","doi":"https://doi.org/10.1145/3308558.3313466","title":"Learning Fast Matching Models from Weak Annotations","display_name":"Learning Fast Matching Models from Weak Annotations","publication_year":2019,"publication_date":"2019-05-13","ids":{"openalex":"https://openalex.org/W2913410650","doi":"https://doi.org/10.1145/3308558.3313466","mag":"2913410650"},"language":"en","primary_location":{"id":"doi:10.1145/3308558.3313466","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3308558.3313466","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The World Wide Web Conference","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3308558.3313466","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100372201","display_name":"Xue Li","orcid":"https://orcid.org/0000-0002-4515-6792"},"institutions":[{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Xue Li","raw_affiliation_strings":["Microsoft"],"affiliations":[{"raw_affiliation_string":"Microsoft","institution_ids":["https://openalex.org/I4210164937"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031606307","display_name":"Zhipeng Luo","orcid":"https://orcid.org/0000-0001-9994-9678"},"institutions":[{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Zhipeng Luo","raw_affiliation_strings":["Microsoft"],"affiliations":[{"raw_affiliation_string":"Microsoft","institution_ids":["https://openalex.org/I4210164937"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037488877","display_name":"Hao Sun","orcid":"https://orcid.org/0000-0001-8456-7925"},"institutions":[{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Hao Sun","raw_affiliation_strings":["Microsoft"],"affiliations":[{"raw_affiliation_string":"Microsoft","institution_ids":["https://openalex.org/I4210164937"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055260255","display_name":"Jianjin Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianjin Zhang","raw_affiliation_strings":["Microsoft and Tsinghua University"],"affiliations":[{"raw_affiliation_string":"Microsoft and Tsinghua University","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022072215","display_name":"Weihao Han","orcid":"https://orcid.org/0000-0002-5533-6455"},"institutions":[{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Weihao Han","raw_affiliation_strings":["Microsoft"],"affiliations":[{"raw_affiliation_string":"Microsoft","institution_ids":["https://openalex.org/I4210164937"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091025271","display_name":"Xianqi Chu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Xianqi Chu","raw_affiliation_strings":["Microsoft"],"affiliations":[{"raw_affiliation_string":"Microsoft","institution_ids":["https://openalex.org/I4210164937"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068728111","display_name":"Liang\u2010Jie Zhang","orcid":"https://orcid.org/0000-0002-6219-0853"},"institutions":[{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Liangjie Zhang","raw_affiliation_strings":["Microsoft"],"affiliations":[{"raw_affiliation_string":"Microsoft","institution_ids":["https://openalex.org/I4210164937"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5022403899","display_name":"Qi Zhang","orcid":"https://orcid.org/0009-0009-7438-7248"},"institutions":[{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Qi Zhang","raw_affiliation_strings":["Microsoft"],"affiliations":[{"raw_affiliation_string":"Microsoft","institution_ids":["https://openalex.org/I4210164937"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5100372201"],"corresponding_institution_ids":["https://openalex.org/I4210164937"],"apc_list":null,"apc_paid":null,"fwci":0.911,"has_fulltext":false,"cited_by_count":10,"citation_normalized_percentile":{"value":0.78346777,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"2985","last_page":"2991"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9954000115394592,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11704","display_name":"Mobile Crowdsensing and Crowdsourcing","score":0.9944999814033508,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.8891046047210693},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8426042795181274},{"id":"https://openalex.org/keywords/labeled-data","display_name":"Labeled data","score":0.6709730625152588},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.6676172018051147},{"id":"https://openalex.org/keywords/relevance","display_name":"Relevance (law)","score":0.6342272162437439},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6158390045166016},{"id":"https://openalex.org/keywords/margin","display_name":"Margin (machine learning)","score":0.5926179885864258},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.5708465576171875},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5398911237716675},{"id":"https://openalex.org/keywords/dependency","display_name":"Dependency (UML)","score":0.5093918442726135},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.4447748363018036},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.41150736808776855}],"concepts":[{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.8891046047210693},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8426042795181274},{"id":"https://openalex.org/C2776145971","wikidata":"https://www.wikidata.org/wiki/Q30673951","display_name":"Labeled data","level":2,"score":0.6709730625152588},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.6676172018051147},{"id":"https://openalex.org/C158154518","wikidata":"https://www.wikidata.org/wiki/Q7310970","display_name":"Relevance (law)","level":2,"score":0.6342272162437439},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6158390045166016},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.5926179885864258},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.5708465576171875},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5398911237716675},{"id":"https://openalex.org/C19768560","wikidata":"https://www.wikidata.org/wiki/Q320727","display_name":"Dependency (UML)","level":2,"score":0.5093918442726135},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.4447748363018036},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.41150736808776855},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3308558.3313466","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3308558.3313466","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The World Wide Web Conference","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3308558.3313466","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3308558.3313466","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The World Wide Web Conference","raw_type":"proceedings-article"},"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","id":"https://metadata.un.org/sdg/9","score":0.4300000071525574}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W1612003148","https://openalex.org/W1690739335","https://openalex.org/W1821462560","https://openalex.org/W1836465849","https://openalex.org/W1880262756","https://openalex.org/W1966443646","https://openalex.org/W2104246439","https://openalex.org/W2121456571","https://openalex.org/W2128892113","https://openalex.org/W2131876387","https://openalex.org/W2133564696","https://openalex.org/W2136189984","https://openalex.org/W2139688392","https://openalex.org/W2147152072","https://openalex.org/W2170738476","https://openalex.org/W2186845332","https://openalex.org/W2211192759","https://openalex.org/W2251008987","https://openalex.org/W2294370754","https://openalex.org/W2413794162","https://openalex.org/W2517540742","https://openalex.org/W2536015822","https://openalex.org/W2538374209","https://openalex.org/W2539671052","https://openalex.org/W2541993794","https://openalex.org/W2610314927","https://openalex.org/W2611099133","https://openalex.org/W2897444426","https://openalex.org/W2913932916","https://openalex.org/W2949117887","https://openalex.org/W2952881492","https://openalex.org/W2963053846"],"related_works":["https://openalex.org/W2361861616","https://openalex.org/W2250721602","https://openalex.org/W3210196349","https://openalex.org/W4214728004","https://openalex.org/W2950181282","https://openalex.org/W2963261224","https://openalex.org/W2798287483","https://openalex.org/W2913410650","https://openalex.org/W10944326","https://openalex.org/W2001391081"],"abstract_inverted_index":{"We":[0],"propose":[1],"a":[2,90,197,235],"novel":[3],"training":[4,72,142,189,245],"scheme":[5],"for":[6],"fast":[7,219],"matching":[8,220],"models":[9,85,130],"in":[10,243],"Search":[11],"Ads,":[12],"motivated":[13],"by":[14,79,121,162,190,196,205,222],"practical":[15],"challenges.":[16],"The":[17,40,70,128,144,211],"first":[18,107],"challenge":[19],"stems":[20],"from":[21,44,93,112,124,186,224],"the":[22,29,45,81,113,119,151,170,181,191,218,244],"pursuit":[23],"of":[24,31],"high":[25],"throughput,":[26],"which":[27,52,247],"prohibits":[28],"deployment":[30],"inseparable":[32],"architectures,":[33],"and":[34,55,88,99,117,140,155,166,200],"hence":[35],"greatly":[36],"limits":[37],"model":[38,92,146,221],"accuracy.":[39],"second":[41],"problem":[42],"arises":[43],"heavy":[46],"dependency":[47,252],"on":[48,75,150,158,253],"human":[49,95,254],"provided":[50,96,255],"labels,":[51,116,188],"are":[53,131],"expensive":[54],"time-consuming":[56],"to":[57,61,134,137,176,216,238],"collect,":[58],"yet":[59],"how":[60],"leverage":[62,239],"unlabeled":[63,141,153],"search":[64,102,240],"log":[65,103,241],"data":[66,202,242],"is":[67,147],"rarely":[68],"studied.":[69],"proposed":[71,171,192,212],"framework":[73,193,213],"targets":[74],"mitigating":[76],"both":[77,94,138,164],"issues,":[78],"treating":[80],"stronger":[82,225],"but":[83],"undeployable":[84],"as":[86],"annotators,":[87],"learning":[89,123,223],"deployable":[91,145],"relevance":[97,115,187],"labels":[98,165],"weakly":[100],"annotated":[101],"data.":[104],"Specifically,":[105],"we":[106],"construct":[108],"multiple":[109],"auxiliary":[110],"tasks":[111],"enumerated":[114],"train":[118],"annotators":[120,226],"jointly":[122],"those":[125],"related":[126],"tasks.":[127],"annotation":[129],"then":[132,156],"used":[133],"assign":[135],"scores":[136,167],"labeled":[139,160,209],"samples.":[143,210],"firstly":[148],"learnt":[149],"scored":[152,159],"data,":[154,161],"fine-tuned":[157],"leveraging":[163],"via":[168],"minimizing":[169],"label-aware":[172],"weighted":[173],"loss.":[174],"According":[175],"our":[177,251],"experiments,":[178],"compared":[179],"with":[180,207],"baseline":[182],"that":[183],"directly":[184],"learns":[185],"outperforms":[194],"it":[195,233],"large":[198],"margin,":[199],"improves":[201],"efficiency":[203],"substantially":[204],"dispensing":[206],"80%":[208],"allows":[214],"us":[215],"improve":[217],"while":[227],"keeping":[228],"its":[229],"architecture":[230],"unchanged.":[231],"Meanwhile,":[232],"offers":[234],"principled":[236],"manner":[237],"phase,":[246],"could":[248],"effectively":[249],"alleviate":[250],"labels.":[256]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":6}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
