{"id":"https://openalex.org/W4412889681","doi":"https://doi.org/10.18653/v1/2025.acl-long.1501","title":"Negative Matters: Multi-Granularity Hard-Negative Synthesis and Anchor-Token-Aware Pooling for Enhanced Text Embeddings","display_name":"Negative Matters: Multi-Granularity Hard-Negative Synthesis and Anchor-Token-Aware Pooling for Enhanced Text Embeddings","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4412889681","doi":"https://doi.org/10.18653/v1/2025.acl-long.1501"},"language":"en","primary_location":{"id":"doi:10.18653/v1/2025.acl-long.1501","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.acl-long.1501","pdf_url":"https://aclanthology.org/2025.acl-long.1501.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://aclanthology.org/2025.acl-long.1501.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Tengyu Pan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tengyu Pan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061798935","display_name":"Zhichao Duan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhichao Duan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115028408","display_name":"Zhenyu Li","orcid":"https://orcid.org/0009-0006-4964-9910"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhenyu Li","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101916985","display_name":"Bowen Dong","orcid":"https://orcid.org/0009-0000-1362-0020"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bowen Dong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100740596","display_name":"Ning Liu","orcid":"https://orcid.org/0000-0002-3408-8632"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ning Liu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059036409","display_name":"Xiuxing Li","orcid":"https://orcid.org/0000-0002-1178-7422"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiuxing Li","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5100630872","display_name":"Jianyong Wang","orcid":"https://orcid.org/0000-0003-4695-4806"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jianyong Wang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.08695662,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"31102","last_page":"31118"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9864000082015991,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9864000082015991,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9430000185966492,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.8630884289741516},{"id":"https://openalex.org/keywords/pooling","display_name":"Pooling","score":0.8074100613594055},{"id":"https://openalex.org/keywords/granularity","display_name":"Granularity","score":0.7221090793609619},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.681538462638855},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.36573073267936707},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.28646451234817505},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.24760594964027405},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.19116145372390747}],"concepts":[{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.8630884289741516},{"id":"https://openalex.org/C70437156","wikidata":"https://www.wikidata.org/wiki/Q7228652","display_name":"Pooling","level":2,"score":0.8074100613594055},{"id":"https://openalex.org/C177774035","wikidata":"https://www.wikidata.org/wiki/Q1246948","display_name":"Granularity","level":2,"score":0.7221090793609619},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.681538462638855},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.36573073267936707},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.28646451234817505},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.24760594964027405},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.19116145372390747}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.18653/v1/2025.acl-long.1501","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.acl-long.1501","pdf_url":"https://aclanthology.org/2025.acl-long.1501.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2509.00842","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2509.00842","pdf_url":"https://arxiv.org/pdf/2509.00842","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"doi:10.18653/v1/2025.acl-long.1501","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.acl-long.1501","pdf_url":"https://aclanthology.org/2025.acl-long.1501.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G5088477901","display_name":null,"funder_award_id":"62272264","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6777344962","display_name":null,"funder_award_id":"2020YFA0804503","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4412889681.pdf","grobid_xml":"https://content.openalex.org/works/W4412889681.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2953234277","https://openalex.org/W2931688134","https://openalex.org/W2626256601","https://openalex.org/W2377919138","https://openalex.org/W147410782","https://openalex.org/W2166690231","https://openalex.org/W2950637221"],"abstract_inverted_index":{"Tengyu":[0],"Pan,":[1],"Zhichao":[2],"Duan,":[3],"Zhenyu":[4],"Li,":[5,11],"Bowen":[6],"Dong,":[7],"Ning":[8],"Liu,":[9],"Xiuxing":[10],"Jianyong":[12],"Wang.":[13],"Proceedings":[14],"of":[15,20],"the":[16,21],"63rd":[17],"Annual":[18],"Meeting":[19],"Association":[22],"for":[23],"Computational":[24],"Linguistics":[25],"(Volume":[26],"1:":[27],"Long":[28],"Papers).":[29],"2025.":[30]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
