{"id":"https://openalex.org/W4392904283","doi":"https://doi.org/10.1109/icassp48485.2024.10446640","title":"Dynamic Data Sampler for Cross-Language Transfer Learning in Large Language Models","display_name":"Dynamic Data Sampler for Cross-Language Transfer Learning in Large Language Models","publication_year":2024,"publication_date":"2024-03-18","ids":{"openalex":"https://openalex.org/W4392904283","doi":"https://doi.org/10.1109/icassp48485.2024.10446640"},"language":"en","primary_location":{"id":"doi:10.1109/icassp48485.2024.10446640","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp48485.2024.10446640","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100332356","display_name":"Yudong Li","orcid":"https://orcid.org/0000-0001-6779-8836"},"institutions":[{"id":"https://openalex.org/I97750245","display_name":"Software (Spain)","ror":"https://ror.org/02ethns06","country_code":"ES","type":"company","lineage":["https://openalex.org/I4210087817","https://openalex.org/I97750245"]},{"id":"https://openalex.org/I180726961","display_name":"Shenzhen University","ror":"https://ror.org/01vy4gh70","country_code":"CN","type":"education","lineage":["https://openalex.org/I180726961"]}],"countries":["CN","ES"],"is_corresponding":true,"raw_author_name":"Yudong Li","raw_affiliation_strings":["Shenzhen University,School of Computer Science and Software Engineering","School of Computer Science and Software Engineering, Shenzhen University"],"affiliations":[{"raw_affiliation_string":"Shenzhen University,School of Computer Science and Software Engineering","institution_ids":["https://openalex.org/I180726961"]},{"raw_affiliation_string":"School of Computer Science and Software Engineering, Shenzhen University","institution_ids":["https://openalex.org/I180726961","https://openalex.org/I97750245"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103042268","display_name":"Yuhao Feng","orcid":"https://orcid.org/0000-0003-4104-706X"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuhao Feng","raw_affiliation_strings":["Tencent AI Lab"],"affiliations":[{"raw_affiliation_string":"Tencent AI Lab","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032724577","display_name":"Zhou Wen","orcid":"https://orcid.org/0000-0002-9705-4421"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]},{"id":"https://openalex.org/I4210118728","display_name":"State Key Laboratory of Information Engineering in Surveying Mapping and Remote Sensing","ror":"https://ror.org/02bpap860","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210118728"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wen Zhou","raw_affiliation_strings":["Wuhan University,LIESMARS","LIESMARS, Wuhan University"],"affiliations":[{"raw_affiliation_string":"Wuhan University,LIESMARS","institution_ids":["https://openalex.org/I4210118728","https://openalex.org/I37461747"]},{"raw_affiliation_string":"LIESMARS, Wuhan University","institution_ids":["https://openalex.org/I4210118728","https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100631152","display_name":"Zhe Zhao","orcid":"https://orcid.org/0000-0003-4189-3258"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhe Zhao","raw_affiliation_strings":["Tencent AI Lab"],"affiliations":[{"raw_affiliation_string":"Tencent AI Lab","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019313200","display_name":"Linlin Shen","orcid":"https://orcid.org/0000-0003-1420-0815"},"institutions":[{"id":"https://openalex.org/I180726961","display_name":"Shenzhen University","ror":"https://ror.org/01vy4gh70","country_code":"CN","type":"education","lineage":["https://openalex.org/I180726961"]},{"id":"https://openalex.org/I97750245","display_name":"Software (Spain)","ror":"https://ror.org/02ethns06","country_code":"ES","type":"company","lineage":["https://openalex.org/I4210087817","https://openalex.org/I97750245"]}],"countries":["CN","ES"],"is_corresponding":false,"raw_author_name":"Linlin Shen","raw_affiliation_strings":["Shenzhen University,School of Computer Science and Software Engineering","School of Computer Science and Software Engineering, Shenzhen University"],"affiliations":[{"raw_affiliation_string":"Shenzhen University,School of Computer Science and Software Engineering","institution_ids":["https://openalex.org/I180726961"]},{"raw_affiliation_string":"School of Computer Science and Software Engineering, Shenzhen University","institution_ids":["https://openalex.org/I180726961","https://openalex.org/I97750245"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037584106","display_name":"Cheng Hou","orcid":"https://orcid.org/0000-0002-7375-4159"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Cheng Hou","raw_affiliation_strings":["Tencent AI Lab"],"affiliations":[{"raw_affiliation_string":"Tencent AI Lab","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5033865377","display_name":"Xianxu Hou","orcid":"https://orcid.org/0000-0002-8728-2842"},"institutions":[{"id":"https://openalex.org/I69356397","display_name":"Xi\u2019an Jiaotong-Liverpool University","ror":"https://ror.org/03zmrmn05","country_code":"CN","type":"education","lineage":["https://openalex.org/I69356397"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xianxu Hou","raw_affiliation_strings":["Xi'an Jiaotong-Liverpool,School of AI and Advanced Computing","School of AI and Advanced Computing, Xi'an Jiaotong-Liverpool"],"affiliations":[{"raw_affiliation_string":"Xi'an Jiaotong-Liverpool,School of AI and Advanced Computing","institution_ids":["https://openalex.org/I69356397"]},{"raw_affiliation_string":"School of AI and Advanced Computing, Xi'an Jiaotong-Liverpool","institution_ids":["https://openalex.org/I69356397"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5100332356"],"corresponding_institution_ids":["https://openalex.org/I180726961","https://openalex.org/I97750245"],"apc_list":null,"apc_paid":null,"fwci":0.6785,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.72471469,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"11291","last_page":"11295"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9843999743461609,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8580116033554077},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.7035836577415466},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.66310054063797},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6257749199867249},{"id":"https://openalex.org/keywords/transfer-of-learning","display_name":"Transfer of learning","score":0.5592141151428223},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.5003831386566162},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.4738231897354126},{"id":"https://openalex.org/keywords/transfer","display_name":"Transfer (computing)","score":0.45357030630111694},{"id":"https://openalex.org/keywords/data-modeling","display_name":"Data modeling","score":0.4326738119125366},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.4259389042854309},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.09070166945457458}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8580116033554077},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.7035836577415466},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.66310054063797},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6257749199867249},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.5592141151428223},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.5003831386566162},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.4738231897354126},{"id":"https://openalex.org/C2776175482","wikidata":"https://www.wikidata.org/wiki/Q1195816","display_name":"Transfer (computing)","level":2,"score":0.45357030630111694},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.4326738119125366},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.4259389042854309},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.09070166945457458},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C50522688","wikidata":"https://www.wikidata.org/wiki/Q189833","display_name":"Economic growth","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp48485.2024.10446640","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp48485.2024.10446640","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1141204904","display_name":null,"funder_award_id":"2023A1515010688","funder_id":"https://openalex.org/F4320337111","funder_display_name":"Basic and Applied Basic Research Foundation of Guangdong Province"},{"id":"https://openalex.org/G1231421488","display_name":null,"funder_award_id":"under","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G1477544716","display_name":null,"funder_award_id":"Guangdong","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2087396116","display_name":null,"funder_award_id":"China","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2981938667","display_name":null,"funder_award_id":"Shenzhen","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3111586145","display_name":null,"funder_award_id":"31101412","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3317480652","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3398858419","display_name":null,"funder_award_id":"51501068","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3472539505","display_name":null,"funder_award_id":"202205","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3577061224","display_name":null,"funder_award_id":"JCYJ20220531101412030","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3757194791","display_name":null,"funder_award_id":"JCYJ20","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4488680036","display_name":null,"funder_award_id":"2022A15","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5939423041","display_name":null,"funder_award_id":"Technology","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5994120800","display_name":null,"funder_award_id":"Natural","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7041006821","display_name":null,"funder_award_id":"82261138629","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7884267847","display_name":null,"funder_award_id":"51501101","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8322697783","display_name":null,"funder_award_id":"82261138","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8786868300","display_name":null,"funder_award_id":"62206180","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320324032","display_name":"Xi\u2019an Jiaotong-Liverpool University","ror":"https://ror.org/03zmrmn05"},{"id":"https://openalex.org/F4320329174","display_name":"Shenzhen Municipal Science and Technology Innovation Council","ror":"https://ror.org/017n8df75"},{"id":"https://openalex.org/F4320337111","display_name":"Basic and Applied Basic Research Foundation of Guangdong Province","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W2296073425","https://openalex.org/W2977458338","https://openalex.org/W3010108619","https://openalex.org/W3121904249","https://openalex.org/W3152788712","https://openalex.org/W4303443398","https://openalex.org/W4322718191","https://openalex.org/W4365799947","https://openalex.org/W4366456685","https://openalex.org/W4376653782","https://openalex.org/W4378464464","https://openalex.org/W4379468930","https://openalex.org/W4384918448","https://openalex.org/W4385373704","https://openalex.org/W4385565577","https://openalex.org/W4389519291","https://openalex.org/W4402684121","https://openalex.org/W6774242638","https://openalex.org/W6782879696","https://openalex.org/W6800875267","https://openalex.org/W6842802441","https://openalex.org/W6846002521","https://openalex.org/W6850625674","https://openalex.org/W6852144548","https://openalex.org/W6852584927","https://openalex.org/W6852870998","https://openalex.org/W6852911403","https://openalex.org/W6853234313","https://openalex.org/W6854860422","https://openalex.org/W6854866820"],"related_works":["https://openalex.org/W3201126466","https://openalex.org/W4282827391","https://openalex.org/W2169518243","https://openalex.org/W4386828785","https://openalex.org/W3165580226","https://openalex.org/W3135401135","https://openalex.org/W2886688859","https://openalex.org/W3133164560","https://openalex.org/W3041001745","https://openalex.org/W3171384686"],"abstract_inverted_index":{"Large":[0],"Language":[1],"Models":[2],"(LLMs)":[3],"have":[4],"gained":[5],"significant":[6,32],"attention":[7],"in":[8,38,67],"the":[9,36,43,84,94,99,114,144],"field":[10],"of":[11,21,75],"natural":[12],"language":[13,65,101],"processing":[14],"(NLP)":[15],"due":[16,34],"to":[17,35,57,81,88,98,111,119],"their":[18],"wide":[19],"range":[20],"applications.":[22],"However,":[23],"training":[24],"LLMs":[25],"for":[26],"languages":[27],"other":[28,150],"than":[29],"English":[30,142],"poses":[31],"challenges,":[33],"difficulty":[37],"acquiring":[39],"large-scale":[40],"corpus":[41,80],"and":[42,61,78,92,131,141],"requisite":[44],"computing":[45],"resources.":[46],"In":[47,103],"this":[48],"paper,":[49],"we":[50,105],"propose":[51],"ChatFlow,":[52],"a":[53,68,73,107],"cross-language":[54,90],"transfer-based":[55],"LLM,":[56],"address":[58],"these":[59],"challenges":[60],"train":[62,83],"large":[63],"Chinese":[64,100,140,151],"models":[66,152],"cost-effective":[69],"manner.":[70],"We":[71,135],"employ":[72],"mix":[74],"Chinese,":[76],"English,":[77],"parallel":[79],"continuously":[82],"LLaMA2":[85],"model,":[86],"aiming":[87],"align":[89],"representations":[91],"facilitate":[93],"knowledge":[95],"transfer":[96],"specifically":[97],"model.":[102],"addition,":[104],"use":[106],"dynamic":[108],"data":[109],"sampler":[110],"progressively":[112],"transition":[113],"model":[115,129],"from":[116],"unsupervised":[117],"pre-training":[118],"supervised":[120],"fine-tuning.":[121],"Experimental":[122],"results":[123,145],"demonstrate":[124],"that":[125,147],"our":[126],"approach":[127],"accelerates":[128],"convergence":[130],"achieves":[132],"superior":[133],"performance.":[134],"evaluate":[136],"ChatFlow":[137],"on":[138,154],"popular":[139],"benchmarks,":[143],"indicate":[146],"it":[148],"outperforms":[149],"post-trained":[153],"LLaMA-2-7B.":[155]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1}],"updated_date":"2026-04-13T07:58:08.660418","created_date":"2025-10-10T00:00:00"}
