{"id":"https://openalex.org/W4385567992","doi":"https://doi.org/10.1145/3580305.3599935","title":"S <sup>2</sup> phere: Semi-Supervised Pre-training for Web Search over Heterogeneous Learning to Rank Data","display_name":"S <sup>2</sup> phere: Semi-Supervised Pre-training for Web Search over Heterogeneous Learning to Rank Data","publication_year":2023,"publication_date":"2023-08-04","ids":{"openalex":"https://openalex.org/W4385567992","doi":"https://doi.org/10.1145/3580305.3599935"},"language":"en","primary_location":{"id":"doi:10.1145/3580305.3599935","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3580305.3599935","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM SIGKDD Conference on Knowledge Discovery and Data Mining","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100348348","display_name":"Yuchen Li","orcid":"https://orcid.org/0000-0002-3869-7881"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yuchen Li","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081254155","display_name":"Haoyi Xiong","orcid":"https://orcid.org/0000-0002-5451-3253"},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haoyi Xiong","raw_affiliation_strings":["Baidu Inc., Beijing, China"],"affiliations":[{"raw_affiliation_string":"Baidu Inc., Beijing, China","institution_ids":["https://openalex.org/I98301712"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072308822","display_name":"Linghe Kong","orcid":"https://orcid.org/0000-0001-9266-3044"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Linghe Kong","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073897483","display_name":"Qingzhong Wang","orcid":"https://orcid.org/0000-0003-1562-8098"},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qingzhong Wang","raw_affiliation_strings":["Baidu Inc., Beijing, China"],"affiliations":[{"raw_affiliation_string":"Baidu Inc., Beijing, China","institution_ids":["https://openalex.org/I98301712"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050255638","display_name":"Shuaiqiang Wang","orcid":"https://orcid.org/0000-0002-9212-1947"},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuaiqiang Wang","raw_affiliation_strings":["Baidu Inc., Beijing, China"],"affiliations":[{"raw_affiliation_string":"Baidu Inc., Beijing, China","institution_ids":["https://openalex.org/I98301712"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100428808","display_name":"Guihai Chen","orcid":"https://orcid.org/0000-0002-6934-1685"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guihai Chen","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101771060","display_name":"Dawei Yin","orcid":"https://orcid.org/0000-0002-0684-6205"},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dawei Yin","raw_affiliation_strings":["Baidu Inc., Beijing, China"],"affiliations":[{"raw_affiliation_string":"Baidu Inc., Beijing, China","institution_ids":["https://openalex.org/I98301712"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5100348348"],"corresponding_institution_ids":["https://openalex.org/I183067930"],"apc_list":null,"apc_paid":null,"fwci":2.065,"has_fulltext":false,"cited_by_count":12,"citation_normalized_percentile":{"value":0.89454476,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"4437","last_page":"4448"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7474114894866943},{"id":"https://openalex.org/keywords/learning-to-rank","display_name":"Learning to rank","score":0.5389609336853027},{"id":"https://openalex.org/keywords/web-page","display_name":"Web page","score":0.5020344257354736},{"id":"https://openalex.org/keywords/labeled-data","display_name":"Labeled data","score":0.5008945465087891},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.49457284808158875},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4844343960285187},{"id":"https://openalex.org/keywords/extractor","display_name":"Extractor","score":0.4530971348285675},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4496224820613861},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.44609007239341736},{"id":"https://openalex.org/keywords/ranking","display_name":"Ranking (information retrieval)","score":0.4323664903640747},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.39382320642471313},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3875330090522766},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.16929951310157776}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7474114894866943},{"id":"https://openalex.org/C86037889","wikidata":"https://www.wikidata.org/wiki/Q4330127","display_name":"Learning to rank","level":3,"score":0.5389609336853027},{"id":"https://openalex.org/C21959979","wikidata":"https://www.wikidata.org/wiki/Q36774","display_name":"Web page","level":2,"score":0.5020344257354736},{"id":"https://openalex.org/C2776145971","wikidata":"https://www.wikidata.org/wiki/Q30673951","display_name":"Labeled data","level":2,"score":0.5008945465087891},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.49457284808158875},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4844343960285187},{"id":"https://openalex.org/C117978034","wikidata":"https://www.wikidata.org/wiki/Q5422192","display_name":"Extractor","level":2,"score":0.4530971348285675},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4496224820613861},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.44609007239341736},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.4323664903640747},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.39382320642471313},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3875330090522766},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.16929951310157776},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C21880701","wikidata":"https://www.wikidata.org/wiki/Q2144042","display_name":"Process engineering","level":1,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3580305.3599935","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3580305.3599935","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM SIGKDD Conference on Knowledge Discovery and Data Mining","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","score":0.5699999928474426,"id":"https://metadata.un.org/sdg/9"}],"awards":[{"id":"https://openalex.org/G1121271761","display_name":null,"funder_award_id":"Program","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G1885739014","display_name":null,"funder_award_id":"2022NL0AB01","funder_id":"https://openalex.org/F4320336023","funder_display_name":"Program for Professor of Special Appointment (Eastern Scholar) at Shanghai Institutions of Higher Learning"},{"id":"https://openalex.org/G2087396116","display_name":null,"funder_award_id":"China","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2286240285","display_name":null,"funder_award_id":"1972254","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G301226467","display_name":null,"funder_award_id":"62172276","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3317480652","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4020255992","display_name":null,"funder_award_id":"Project","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4263355572","display_name":null,"funder_award_id":"62141220","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4599507694","display_name":null,"funder_award_id":"61972253","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5760752404","display_name":null,"funder_award_id":"Projects","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5939423041","display_name":null,"funder_award_id":"Technology","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6315978837","display_name":null,"funder_award_id":"61972254","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8471520140","display_name":null,"funder_award_id":"U1908212","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8513333314","display_name":null,"funder_award_id":"2021ZD01","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320336023","display_name":"Program for Professor of Special Appointment (Eastern Scholar) at Shanghai Institutions of Higher Learning","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W1980224846","https://openalex.org/W1985554184","https://openalex.org/W2001832483","https://openalex.org/W2007105673","https://openalex.org/W2007563768","https://openalex.org/W2035720976","https://openalex.org/W2047221353","https://openalex.org/W2059001985","https://openalex.org/W2069870183","https://openalex.org/W2091158010","https://openalex.org/W2108862644","https://openalex.org/W2157355274","https://openalex.org/W2167432060","https://openalex.org/W2295598076","https://openalex.org/W2524182563","https://openalex.org/W2741295496","https://openalex.org/W2796727080","https://openalex.org/W2949505856","https://openalex.org/W2955669675","https://openalex.org/W2965893800","https://openalex.org/W2975938167","https://openalex.org/W2991391304","https://openalex.org/W2997574889","https://openalex.org/W3101997094","https://openalex.org/W3169109617","https://openalex.org/W3170841641","https://openalex.org/W3172750682","https://openalex.org/W3190540921","https://openalex.org/W4283804319","https://openalex.org/W4287322212"],"related_works":["https://openalex.org/W2069238515","https://openalex.org/W159425995","https://openalex.org/W1527068950","https://openalex.org/W2889658777","https://openalex.org/W1976758266","https://openalex.org/W2421630208","https://openalex.org/W3144899030","https://openalex.org/W2122840831","https://openalex.org/W1540194478","https://openalex.org/W2056872955"],"abstract_inverted_index":{"While":[0],"Learning":[1],"to":[2,14,22,123,201,221,240],"Rank":[3],"(LTR)":[4],"models":[5,102,141,320],"on":[6,112,298],"top":[7,299],"of":[8,35,43,49,64,75,99,115,127,155,191,210,243,250,300,308,314],"transformers":[9,91],"have":[10,60,287],"been":[11,288],"widely":[12],"adopted":[13],"achieve":[15],"decent":[16],"performance,":[17],"it":[18],"is":[19],"still":[20],"challenging":[21],"train":[23],"the":[24,55,86,97,113,125,203,218,223,244,260,275,312],"model":[25,189,272,276],"with":[26,68,134,264,281,290],"sufficient":[27],"data":[28,137,216,280],"as":[29,247],"only":[30],"an":[31,187],"extremely":[32],"small":[33],"number":[34,63],"query-webpage":[36,147],"pairs":[37,148],"could":[38],"be":[39],"annotated":[40],"versus":[41],"trillions":[42],"webpages":[44],"available":[45],"online":[46,295],"and":[47,106,145,176,205,253,262,273,294],"billions":[48],"web":[50],"search":[51,219,278,302],"queries":[52],"everyday.":[53],"In":[54,81],"meanwhile,":[56],"industry":[57],"research":[58],"communities":[59],"released":[61],"a":[62,156,192,197,206,265,269],"open-source":[65,120,236],"LTR":[66,76,101,121,136,140,151,174,179,188,238,271,319],"datasets":[67,122,239],"well":[69],"annotations":[70],"but":[71],"incorporating":[72],"different":[73],"designs":[74],"features/labels":[77],"(i.e.,":[78],"heterogeneous":[79,119,150,237],"domains).":[80],"this":[82],"work,":[83],"inspired":[84],"by":[85],"recent":[87],"progress":[88],"in":[89,118,225,256,316],"pre-training":[90,100,242],"for":[92,139,321],"performance":[93,126],"advantages,":[94],"we":[95,110,130],"study":[96],"problem":[98],"using":[103,142,277],"both":[104,143,291],"labeled":[105,146],"unlabeled":[107,144],"samples,":[108],"especially":[109],"focus":[111],"use":[114],"well-annotated":[116],"samples":[117],"boost":[124],"pre-training.":[128],"Hereby,":[129],"propose":[131],"S2phere-Semi-Supervised":[132],"Pre-training":[133,163,171],"Heterogeneous":[135,173],"strategies":[138],"across":[149],"datasets.":[152],"S2phere":[153,213,255,315],"consists":[154],"three-step":[157],"approach:":[158],"(1)":[159,227],"Semi-supervised":[160],"Feature":[161],"Extraction":[162],"via":[164,181,228],"Perturbed":[165],"Contrastive":[166],"Loss,":[167],"(2)":[168,233],"Cross-domain":[169],"Ranker":[170],"over":[172],"Datasets":[175],"(3)":[177,258],"End-to-end":[178],"Fine-tuning":[180],"Modular":[182],"Network":[183],"Composition.":[184],"Specifically,":[185],"given":[186],"composed":[190],"backbone":[193,224,261],"(the":[194,199,208],"feature":[195],"extractor),":[196],"neck":[198,245,263],"module":[200,246],"reason":[202],"orders)":[204],"head":[207,267],"predictor":[209],"ranking":[211],"scores),":[212],"uses":[214],"unlabeled/labeled":[215],"from":[217],"engine":[220,279],"pre-train":[222],"Step":[226,232,257],"semi-supervised":[229],"learning;":[230,252],"then":[231],"incorporates":[234],"multiple":[235],"improve":[241],"shared":[248],"parameters":[249],"cross-domain":[251],"finally,":[254],"composes":[259],"randomly-initialized":[266],"into":[268],"whole":[270],"fine-tunes":[274],"various":[282],"learning":[283],"strategies.":[284],"Extensive":[285],"experiments":[286,293],"done":[289],"offline":[292],"A/B":[296],"Test":[297],"Baidu":[301],"engine.":[303],"The":[304],"comparisons":[305],"against":[306],"numbers":[307],"baseline":[309],"algorithms":[310],"confirmed":[311],"advantages":[313],"producing":[317],"high-performance":[318],"web-scale":[322],"search.":[323]},"counts_by_year":[{"year":2025,"cited_by_count":7},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":1}],"updated_date":"2026-04-15T08:11:43.952461","created_date":"2025-10-10T00:00:00"}
