{"id":"https://openalex.org/W4406892635","doi":"https://doi.org/10.1109/fllm63129.2024.10852506","title":"Teaching Large Language Models to Understand Jeju Island with Domain-Adaptive Pretraining","display_name":"Teaching Large Language Models to Understand Jeju Island with Domain-Adaptive Pretraining","publication_year":2024,"publication_date":"2024-11-26","ids":{"openalex":"https://openalex.org/W4406892635","doi":"https://doi.org/10.1109/fllm63129.2024.10852506"},"language":"en","primary_location":{"id":"doi:10.1109/fllm63129.2024.10852506","is_oa":false,"landing_page_url":"https://doi.org/10.1109/fllm63129.2024.10852506","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 2nd International Conference on Foundation and Large Language Models (FLLM)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Jaeyoung Suh","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Jaeyoung Suh","raw_affiliation_strings":["AIO2O,Gyeonggi,South Korea"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"AIO2O,Gyeonggi,South Korea","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090056525","display_name":"Eunchan Lee","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Eunchan Lee","raw_affiliation_strings":["AIO2O,Gyeonggi,South Korea"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"AIO2O,Gyeonggi,South Korea","institution_ids":[]}]},{"author_position":"middle","author":{"id":null,"display_name":"Yohan Jeong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yohan Jeong","raw_affiliation_strings":["AIO2O,Gyeonggi,South Korea"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"AIO2O,Gyeonggi,South Korea","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050869074","display_name":"D. Park","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Donggil Park","raw_affiliation_strings":["AIO2O,Gyeonggi,South Korea"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"AIO2O,Gyeonggi,South Korea","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5109048161","display_name":"Sung\u2013Min Ahn","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sungmin Ahn","raw_affiliation_strings":["AIO2O,Gyeonggi,South Korea"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"AIO2O,Gyeonggi,South Korea","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.7574,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.91478347,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"21","last_page":"28"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.8205999732017517,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.8205999732017517,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.7461000084877014,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6591819524765015},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.5002548694610596},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3441493511199951},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.07719182968139648}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6591819524765015},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.5002548694610596},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3441493511199951},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.07719182968139648},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/fllm63129.2024.10852506","is_oa":false,"landing_page_url":"https://doi.org/10.1109/fllm63129.2024.10852506","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 2nd International Conference on Foundation and Large Language Models (FLLM)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"The":[0],"advancement":[1],"of":[2,25,105],"large":[3],"language":[4,15],"models":[5],"(LLMs)":[6],"has":[7],"led":[8],"to":[9,81,125],"remarkable":[10],"achievements":[11],"in":[12,118],"various":[13,134],"natural":[14,112],"processing":[16],"(NLP)":[17],"tasks.":[18,135],"Specifically,":[19],"tasks":[20],"requiring":[21],"a":[22,74,127],"deep":[23],"understanding":[24],"specific":[26,71],"topics":[27],"have":[28],"significantly":[29,114],"benefited":[30],"from":[31],"Domain-Adaptive":[32],"Pretraining":[33],"(DAPT)":[34],"and":[35,56,68,102,111],"Low-Rank":[36],"Adaptation":[37],"(LoRA)":[38],"fine-tuning.":[39],"This":[40,122],"paper":[41],"explores":[42],"enhancing":[43],"LLM":[44],"performance":[45,132],"by":[46],"combining":[47],"these":[48,79],"methodologies.":[49],"By":[50],"integrating":[51],"domain-specific":[52],"knowledge":[53],"through":[54],"DAPT":[55],"optimizing":[57],"the":[58,63,82,97,116],"training":[59],"process":[60],"with":[61],"LoRA,":[62],"model":[64,85,99],"achieves":[65],"higher":[66],"accuracy":[67],"efficiency":[69,117],"within":[70],"domains.":[72],"As":[73],"case":[75],"study,":[76],"we":[77],"apply":[78],"techniques":[80],"Llama":[83],"3":[84],"using":[86],"publicly":[87],"available":[88],"data":[89],"about":[90],"Jeju":[91],"Island.":[92],"Experimental":[93],"results":[94],"demonstrate":[95],"that":[96],"adjusted":[98],"provides":[100],"detailed":[101],"accurate":[103],"descriptions":[104],"Jeju\u2019s":[106],"tourist":[107],"attractions,":[108],"cultural":[109],"heritage,":[110],"landscapes,":[113],"improving":[115],"handling":[119],"specialized":[120],"topics.":[121],"approach":[123],"proves":[124],"be":[126],"valuable":[128],"method":[129],"for":[130],"maximizing":[131],"across":[133]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2025-10-10T00:00:00"}
