{"id":"https://openalex.org/W4406612301","doi":"https://doi.org/10.1109/smc54092.2024.10831873","title":"Beyond Label: Cold-Start Self-Training for Cross-Domain Semantic Text Similarity","display_name":"Beyond Label: Cold-Start Self-Training for Cross-Domain Semantic Text Similarity","publication_year":2024,"publication_date":"2024-10-06","ids":{"openalex":"https://openalex.org/W4406612301","doi":"https://doi.org/10.1109/smc54092.2024.10831873"},"language":"en","primary_location":{"id":"doi:10.1109/smc54092.2024.10831873","is_oa":false,"landing_page_url":"https://doi.org/10.1109/smc54092.2024.10831873","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Systems, Man, and Cybernetics (SMC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101566619","display_name":"Bo Huang","orcid":"https://orcid.org/0000-0002-5476-620X"},"institutions":[{"id":"https://openalex.org/I139660479","display_name":"Central South University","ror":"https://ror.org/00f1zfq44","country_code":"CN","type":"education","lineage":["https://openalex.org/I139660479"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bo Huang","raw_affiliation_strings":["School of Computer Science and Engineering, Central South University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Central South University","institution_ids":["https://openalex.org/I139660479"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051415181","display_name":"J F Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I139660479","display_name":"Central South University","ror":"https://ror.org/00f1zfq44","country_code":"CN","type":"education","lineage":["https://openalex.org/I139660479"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiasong Liu","raw_affiliation_strings":["School of Computer Science and Engineering, Central South University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Central South University","institution_ids":["https://openalex.org/I139660479"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101792591","display_name":"Xin Liu","orcid":"https://orcid.org/0000-0003-1050-5697"},"institutions":[{"id":"https://openalex.org/I139660479","display_name":"Central South University","ror":"https://ror.org/00f1zfq44","country_code":"CN","type":"education","lineage":["https://openalex.org/I139660479"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xin Liu","raw_affiliation_strings":["School of Computer Science and Engineering, Central South University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Central South University","institution_ids":["https://openalex.org/I139660479"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101432696","display_name":"Cui Chen","orcid":"https://orcid.org/0000-0002-2138-8804"},"institutions":[{"id":"https://openalex.org/I139660479","display_name":"Central South University","ror":"https://ror.org/00f1zfq44","country_code":"CN","type":"education","lineage":["https://openalex.org/I139660479"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Cui Chen","raw_affiliation_strings":["School of Computer Science and Engineering, Central South University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Central South University","institution_ids":["https://openalex.org/I139660479"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101841981","display_name":"Zuping Zhang","orcid":"https://orcid.org/0000-0002-3295-2861"},"institutions":[{"id":"https://openalex.org/I139660479","display_name":"Central South University","ror":"https://ror.org/00f1zfq44","country_code":"CN","type":"education","lineage":["https://openalex.org/I139660479"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zuping Zhang","raw_affiliation_strings":["School of Computer Science and Engineering, Central South University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Central South University","institution_ids":["https://openalex.org/I139660479"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I139660479"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.22183334,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1807","last_page":"1812"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9754999876022339,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7391045689582825},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.6037976741790771},{"id":"https://openalex.org/keywords/semantic-similarity","display_name":"Semantic similarity","score":0.5493898987770081},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5218721628189087},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5043915510177612},{"id":"https://openalex.org/keywords/cold-start","display_name":"Cold start (automotive)","score":0.49985694885253906},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.4770483374595642},{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.4226342439651489},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.41363951563835144},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.412592351436615},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.11272671818733215},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.08949354290962219}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7391045689582825},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.6037976741790771},{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.5493898987770081},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5218721628189087},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5043915510177612},{"id":"https://openalex.org/C2778956030","wikidata":"https://www.wikidata.org/wiki/Q5142477","display_name":"Cold start (automotive)","level":2,"score":0.49985694885253906},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.4770483374595642},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.4226342439651489},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.41363951563835144},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.412592351436615},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.11272671818733215},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.08949354290962219},{"id":"https://openalex.org/C153294291","wikidata":"https://www.wikidata.org/wiki/Q25261","display_name":"Meteorology","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C146978453","wikidata":"https://www.wikidata.org/wiki/Q3798668","display_name":"Aerospace engineering","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/smc54092.2024.10831873","is_oa":false,"landing_page_url":"https://doi.org/10.1109/smc54092.2024.10831873","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Systems, Man, and Cybernetics (SMC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W2735784619","https://openalex.org/W2911489562","https://openalex.org/W2955474241","https://openalex.org/W2970641574","https://openalex.org/W3080956857","https://openalex.org/W3094834348","https://openalex.org/W3119409427","https://openalex.org/W3156636935","https://openalex.org/W3194782062","https://openalex.org/W4224313754","https://openalex.org/W4323536724","https://openalex.org/W4385573170","https://openalex.org/W4389921502","https://openalex.org/W4391307405","https://openalex.org/W4404643526","https://openalex.org/W6755207826","https://openalex.org/W6761260114","https://openalex.org/W6785645804","https://openalex.org/W6791252336","https://openalex.org/W6794146050","https://openalex.org/W6850287543","https://openalex.org/W6855966607","https://openalex.org/W6856672271","https://openalex.org/W6857426794"],"related_works":["https://openalex.org/W2529147798","https://openalex.org/W1979350723","https://openalex.org/W2528269032","https://openalex.org/W2555127516","https://openalex.org/W2114797768","https://openalex.org/W2380654781","https://openalex.org/W2327130486","https://openalex.org/W2176214140","https://openalex.org/W2516873349","https://openalex.org/W2752210368"],"abstract_inverted_index":{"In":[0],"Natural":[1],"Language":[2],"Processing":[3],"(NLP),":[4],"comprehending":[5],"the":[6,38,86,96,108,119,127,140,150],"semantic":[7,74,101],"connection":[8],"between":[9],"two":[10],"texts,":[11],"a":[12,19],"Semantic":[13],"Text":[14],"Similarity":[15],"(STS)":[16],"task,":[17],"poses":[18],"significant":[20],"challenge.":[21],"This":[22,67],"challenge":[23],"is":[24],"especially":[25],"pronounced":[26],"in":[27,64,126],"resource-constrained":[28],"and":[29,80,161],"cross-domain":[30,136,157],"contexts,":[31],"where":[32],"traditional":[33,141],"methods":[34],"are":[35],"hindered":[36],"by":[37],"high":[39],"costs":[40],"associated":[41],"with":[42],"data":[43,79,83],"labeling.":[44],"We":[45,147],"propose":[46],"an":[47],"innovative":[48],"technique,":[49],"designated":[50],"as":[51],"\u201cCold-Start":[52],"Self-Training\u201d":[53],"that":[54,114],"reduces":[55],"reliance":[56,142],"on":[57,123,143],"large":[58],"labeled":[59,145],"datasets":[60],"for":[61,135,156,164],"STS":[62,124,137],"tasks":[63,125],"resource-restricted":[65],"settings.":[66],"method":[68,116],"utilizes":[69],"dual-view":[70],"pooling":[71,90,93],"to":[72,84,99],"extract":[73],"similarity":[75,102],"information":[76],"from":[77],"unlabeled":[78],"generates":[81],"pseudo-labeled":[82],"fine-tune":[85],"cross-encoder":[87,120],"model.":[88],"Dual-view":[89],"combines":[91],"different":[92],"results":[94,112],"of":[95,152],"same":[97],"text":[98],"evaluate":[100],"without":[103],"additional":[104],"model":[105],"tuning,":[106],"simplifying":[107],"self-training":[109],"process.":[110],"Experimental":[111],"show":[113],"our":[115],"significantly":[117],"improves":[118],"model's":[121],"performance":[122],"medical":[128],"domain.":[129],"Our":[130],"findings":[131],"provide":[132],"new":[133],"strategies":[134],"tasks,":[138,158],"challenging":[139],"extensive":[144],"data.":[146],"also":[148],"validate":[149],"potential":[151],"unsupervised":[153],"pretrained":[154],"models":[155],"offering":[159],"theoretical":[160],"practical":[162],"support":[163],"complex":[165],"challenges.":[166]},"counts_by_year":[],"updated_date":"2026-06-26T08:34:08.712188","created_date":"2025-10-10T00:00:00"}
