{"id":"https://openalex.org/W7125210338","doi":"https://doi.org/10.48550/arxiv.2601.12921","title":"Injecting Knowledge from Social Science Journals to Improve Indonesian Cultural Understanding by LLMs","display_name":"Injecting Knowledge from Social Science Journals to Improve Indonesian Cultural Understanding by LLMs","publication_year":2026,"publication_date":"2026-01-19","ids":{"openalex":"https://openalex.org/W7125210338","doi":"https://doi.org/10.48550/arxiv.2601.12921"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2601.12921","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.12921","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2601.12921","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5123509271","display_name":"Adimulya Kartiyasa","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Kartiyasa, Adimulya","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123520082","display_name":"Bao Gia Cao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cao, Bao Gia","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5123512547","display_name":"Boyang Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Boyang","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5123509271"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.2913999855518341,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.2913999855518341,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12090","display_name":"Language and cultural evolution","score":0.11590000241994858,"subfield":{"id":"https://openalex.org/subfields/3316","display_name":"Cultural Studies"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.018400000408291817,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/indonesian","display_name":"Indonesian","score":0.9574000239372253},{"id":"https://openalex.org/keywords/recipe","display_name":"Recipe","score":0.5817999839782715},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5242999792098999},{"id":"https://openalex.org/keywords/computational-sociology","display_name":"Computational sociology","score":0.3321000039577484},{"id":"https://openalex.org/keywords/traditional-knowledge","display_name":"Traditional knowledge","score":0.30550000071525574},{"id":"https://openalex.org/keywords/social-knowledge","display_name":"Social knowledge","score":0.30160000920295715}],"concepts":[{"id":"https://openalex.org/C2779207338","wikidata":"https://www.wikidata.org/wiki/Q9240","display_name":"Indonesian","level":2,"score":0.9574000239372253},{"id":"https://openalex.org/C2778671685","wikidata":"https://www.wikidata.org/wiki/Q219239","display_name":"Recipe","level":2,"score":0.5817999839782715},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5242999792098999},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.39969998598098755},{"id":"https://openalex.org/C36289849","wikidata":"https://www.wikidata.org/wiki/Q34749","display_name":"Social science","level":1,"score":0.34880000352859497},{"id":"https://openalex.org/C126349790","wikidata":"https://www.wikidata.org/wiki/Q905036","display_name":"Computational sociology","level":2,"score":0.3321000039577484},{"id":"https://openalex.org/C514011633","wikidata":"https://www.wikidata.org/wiki/Q1428168","display_name":"Traditional knowledge","level":3,"score":0.30550000071525574},{"id":"https://openalex.org/C2986930172","wikidata":"https://www.wikidata.org/wiki/Q1116133","display_name":"Social knowledge","level":2,"score":0.30160000920295715},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.2992999851703644},{"id":"https://openalex.org/C125209646","wikidata":"https://www.wikidata.org/wiki/Q1338878","display_name":"Cultural diversity","level":2,"score":0.27970001101493835},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.27570000290870667},{"id":"https://openalex.org/C29595303","wikidata":"https://www.wikidata.org/wiki/Q165650","display_name":"Media studies","level":1,"score":0.26589998602867126},{"id":"https://openalex.org/C2994055011","wikidata":"https://www.wikidata.org/wiki/Q210272","display_name":"Cultural knowledge","level":2,"score":0.26080000400543213},{"id":"https://openalex.org/C39549134","wikidata":"https://www.wikidata.org/wiki/Q133080","display_name":"Public relations","level":1,"score":0.2554999887943268},{"id":"https://openalex.org/C206440729","wikidata":"https://www.wikidata.org/wiki/Q4806809","display_name":"Asian studies","level":3,"score":0.2513999938964844}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2601.12921","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.12921","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2601.12921","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.12921","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.8408522009849548,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Recently":[0],"there":[1],"have":[2],"been":[3,26],"intensifying":[4],"efforts":[5],"to":[6,82],"improve":[7],"the":[8,79,110,127],"understanding":[9],"of":[10,21,32,51],"Indonesian":[11,59,72,83,118],"cultures":[12],"by":[13,114],"large":[14],"language":[15],"models":[16],"(LLMs).":[17],"An":[18],"attractive":[19],"source":[20],"cultural":[22,39,73],"knowledge":[23,74],"that":[24],"has":[25],"largely":[27],"overlooked":[28],"is":[29],"local":[30],"journals":[31],"social":[33,60],"science,":[34],"which":[35],"likely":[36],"contain":[37],"substantial":[38],"studies":[40],"from":[41,56],"a":[42,47,122],"native":[43],"perspective.":[44],"We":[45,65],"present":[46],"novel":[48],"text":[49],"dataset":[50],"journal":[52],"article":[53],"passages,":[54],"created":[55],"151":[57],"open-source":[58],"science":[61],"journals,":[62],"called":[63],"IndoSoSci.":[64],"demonstrate":[66],"an":[67],"effective":[68],"recipe":[69,100],"for":[70],"injecting":[71],"therein":[75],"into":[76],"LLMs:":[77],"extracting":[78],"facts":[80],"related":[81],"culture,":[84],"and":[85],"apply":[86],"retrieval-augmented":[87],"generation":[88],"(RAG)":[89],"with":[90,117],"LLM-generated":[91],"hypothetical":[92],"documents":[93],"as":[94],"queries":[95],"during":[96],"retrieval.":[97],"The":[98],"proposed":[99],"yields":[101],"strong":[102,107],"performance":[103],"gains":[104],"over":[105],"several":[106],"baselines":[108],"on":[109,126],"IndoCulture":[111,128],"benchmark.":[112,129],"Additionally,":[113],"combining":[115],"IndoSoSci":[116],"Wikipedia,":[119],"we":[120],"set":[121],"new":[123],"state-of-the-art":[124],"accuracy":[125]},"counts_by_year":[],"updated_date":"2026-01-22T23:33:04.759266","created_date":"2026-01-22T00:00:00"}
