{"id":"https://openalex.org/W4387848842","doi":"https://doi.org/10.1145/3583780.3615157","title":"Pre-training with Aspect-Content Text Mutual Prediction for Multi-Aspect Dense Retrieval","display_name":"Pre-training with Aspect-Content Text Mutual Prediction for Multi-Aspect Dense Retrieval","publication_year":2023,"publication_date":"2023-10-21","ids":{"openalex":"https://openalex.org/W4387848842","doi":"https://doi.org/10.1145/3583780.3615157"},"language":"en","primary_location":{"id":"doi:10.1145/3583780.3615157","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3583780.3615157","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3583780.3615157","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Information and Knowledge Management","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3583780.3615157","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101742332","display_name":"Xiaojie Sun","orcid":"https://orcid.org/0009-0006-4570-6359"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xiaojie Sun","raw_affiliation_strings":["ICT, CAS &amp; University of Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0006-4570-6359","affiliations":[{"raw_affiliation_string":"ICT, CAS &amp; University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040708820","display_name":"Keping Bi","orcid":"https://orcid.org/0000-0001-5123-4999"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Keping Bi","raw_affiliation_strings":["ICT, CAS &amp; University of Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-5123-4999","affiliations":[{"raw_affiliation_string":"ICT, CAS &amp; University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088621320","display_name":"Jiafeng Guo","orcid":"https://orcid.org/0000-0002-9509-8674"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiafeng Guo","raw_affiliation_strings":["ICT, CAS &amp; University of Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-9509-8674","affiliations":[{"raw_affiliation_string":"ICT, CAS &amp; University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056848863","display_name":"Xinyu Ma","orcid":"https://orcid.org/0000-0002-5511-9370"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xinyu Ma","raw_affiliation_strings":["ICT, CAS &amp; University of Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-5511-9370","affiliations":[{"raw_affiliation_string":"ICT, CAS &amp; University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006971161","display_name":"Yixing Fan","orcid":"https://orcid.org/0000-0003-4317-2702"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yixing Fan","raw_affiliation_strings":["ICT, CAS &amp; University of Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-4317-2702","affiliations":[{"raw_affiliation_string":"ICT, CAS &amp; University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038021216","display_name":"Hongyu Shan","orcid":"https://orcid.org/0000-0003-1213-4690"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hongyu Shan","raw_affiliation_strings":["Ant Group, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-1213-4690","affiliations":[{"raw_affiliation_string":"Ant Group, Beijing, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005163911","display_name":"Qishen Zhang","orcid":"https://orcid.org/0000-0001-9964-6298"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qishen Zhang","raw_affiliation_strings":["Ant Group, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-9964-6298","affiliations":[{"raw_affiliation_string":"Ant Group, Beijing, China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5023862460","display_name":"Zhongyi Liu","orcid":"https://orcid.org/0000-0001-9478-8107"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhongyi Liu","raw_affiliation_strings":["Ant Group, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-9478-8107","affiliations":[{"raw_affiliation_string":"Ant Group, Beijing, China","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5101742332"],"corresponding_institution_ids":["https://openalex.org/I4210165038"],"apc_list":null,"apc_paid":null,"fwci":0.6816,"has_fulltext":true,"cited_by_count":4,"citation_normalized_percentile":{"value":0.76183075,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"4300","last_page":"4304"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.987500011920929,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8169174194335938},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.7273002862930298},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.6552181839942932},{"id":"https://openalex.org/keywords/relevance","display_name":"Relevance (law)","score":0.49187755584716797},{"id":"https://openalex.org/keywords/plain-text","display_name":"Plain text","score":0.48213765025138855},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.40952008962631226},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4048624336719513}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8169174194335938},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.7273002862930298},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.6552181839942932},{"id":"https://openalex.org/C158154518","wikidata":"https://www.wikidata.org/wiki/Q7310970","display_name":"Relevance (law)","level":2,"score":0.49187755584716797},{"id":"https://openalex.org/C46503548","wikidata":"https://www.wikidata.org/wiki/Q1145976","display_name":"Plain text","level":3,"score":0.48213765025138855},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.40952008962631226},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4048624336719513},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C148730421","wikidata":"https://www.wikidata.org/wiki/Q141090","display_name":"Encryption","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3583780.3615157","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3583780.3615157","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3583780.3615157","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Information and Knowledge Management","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3583780.3615157","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3583780.3615157","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3583780.3615157","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Information and Knowledge Management","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320318398","display_name":"Ant Group","ror":null},{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320322847","display_name":"Youth Innovation Promotion Association of the Chinese Academy of Sciences","ror":"https://ror.org/031141b54"},{"id":"https://openalex.org/F4320335892","display_name":"Youth Innovation Promotion Association","ror":null}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4387848842.pdf","grobid_xml":"https://content.openalex.org/works/W4387848842.grobid-xml"},"referenced_works_count":23,"referenced_works":["https://openalex.org/W2040873223","https://openalex.org/W2085030399","https://openalex.org/W2768459074","https://openalex.org/W2801992635","https://openalex.org/W2897392264","https://openalex.org/W2951434086","https://openalex.org/W2970641574","https://openalex.org/W2980918481","https://openalex.org/W3007702683","https://openalex.org/W3021397474","https://openalex.org/W3134665270","https://openalex.org/W3154670582","https://openalex.org/W3155895380","https://openalex.org/W3212725701","https://openalex.org/W3216225167","https://openalex.org/W4206121183","https://openalex.org/W4221164176","https://openalex.org/W4224865658","https://openalex.org/W4282961889","https://openalex.org/W4290943593","https://openalex.org/W4292955407","https://openalex.org/W4367047408","https://openalex.org/W4385572770"],"related_works":["https://openalex.org/W2085384747","https://openalex.org/W2106071040","https://openalex.org/W2088166309","https://openalex.org/W4312133475","https://openalex.org/W4238976562","https://openalex.org/W1967370444","https://openalex.org/W2150136235","https://openalex.org/W2157408137","https://openalex.org/W1980762553","https://openalex.org/W4312252109"],"abstract_inverted_index":{"Grounded":[0],"on":[1,12,22,177,187],"pre-trained":[2],"language":[3,174],"models":[4],"(PLMs),":[5],"dense":[6,29],"retrieval":[7,64,139],"has":[8,18],"been":[9,19],"studied":[10],"extensively":[11],"plain":[13],"text.":[14],"In":[15,31,158],"contrast,":[16],"there":[17],"little":[20],"research":[21],"retrieving":[23],"data":[24],"with":[25,140],"multiple":[26],"aspects":[27,182],"using":[28,73],"models.":[30],"the":[32,38,78,88,98,103,112,134,141,150,153,178,211,227],"scenarios":[33],"such":[34],"as":[35,115,207],"product":[36],"search,":[37],"aspect":[39,60,113,142,155,168,205,215],"information":[40,61,114,169],"plays":[41],"an":[42,68],"essential":[43],"role":[44],"in":[45,133],"relevance":[46],"matching,":[47],"e.g.,":[48],"category:":[49],"Electronics,":[50],"Computers,":[51],"and":[52,156,183,192,209,216,220],"Pet":[53],"Supplies.":[54],"A":[55],"common":[56],"way":[57],"of":[58,82,152,167,181],"leveraging":[59],"for":[62,214],"multi-aspect":[63],"is":[65],"to":[66,76],"introduce":[67],"auxiliary":[69],"classification":[70],"objective,":[71],"i.e.,":[72],"item":[74,83,154],"contents":[75],"predict":[77],"annotated":[79],"value":[80,89],"IDs":[81,121],"aspects.":[84],"However,":[85],"by":[86],"learning":[87],"embeddings":[90],"from":[91],"scratch,":[92],"this":[93,108,159],"approach":[94,198],"may":[95],"not":[96],"capture":[97],"various":[99],"semantic":[100,127],"similarities":[101,128],"between":[102,149],"values":[104,206],"sufficiently.":[105],"To":[106,136],"address":[107],"limitation,":[109],"we":[110,144],"leverage":[111],"text":[116,151,180],"strings":[117],"rather":[118],"than":[119,170],"class":[120],"during":[122],"pre-training":[123],"so":[124],"that":[125,196],"their":[126],"can":[129,199],"be":[130,224],"naturally":[131],"captured":[132],"PLMs.":[135],"facilitate":[137],"effective":[138],"strings,":[143],"propose":[145],"mutual":[146],"prediction":[147],"objectives":[148],"content.":[157,184],"way,":[160],"our":[161,197],"model":[162],"makes":[163],"more":[164],"sufficient":[165],"use":[166],"conducting":[171,210],"undifferentiated":[172],"masked":[173],"modeling":[175],"(MLM)":[176],"concatenated":[179],"Extensive":[185],"experiments":[186],"two":[188],"real-world":[189],"datasets":[190],"(product":[191],"mini-program":[193],"search)":[194],"show":[195],"outperform":[200],"competitive":[201],"baselines":[202],"both":[203],"treating":[204],"classes":[208],"same":[212],"MLM":[213],"content":[217],"strings.":[218],"Code":[219],"related":[221],"dataset":[222],"will":[223],"available":[225],"at":[226],"URL":[228],"\\footnotehttps://github.com/sunxiaojie99/ATTEMPT.":[229]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
