{"id":"https://openalex.org/W4400649375","doi":"https://doi.org/10.1145/3676969","title":"SikuGPT: A Generative Pre-trained Model for Intelligent Information Processing of Ancient Texts from the Perspective of Digital Humanities","display_name":"SikuGPT: A Generative Pre-trained Model for Intelligent Information Processing of Ancient Texts from the Perspective of Digital Humanities","publication_year":2024,"publication_date":"2024-07-15","ids":{"openalex":"https://openalex.org/W4400649375","doi":"https://doi.org/10.1145/3676969"},"language":"en","primary_location":{"id":"doi:10.1145/3676969","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3676969","pdf_url":null,"source":{"id":"https://openalex.org/S4210184050","display_name":"Journal on Computing and Cultural Heritage","issn_l":"1556-4673","issn":["1556-4673","1556-4711"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal on Computing and Cultural Heritage","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101829627","display_name":"Chang Liu","orcid":"https://orcid.org/0000-0001-9048-4552"},"institutions":[{"id":"https://openalex.org/I119454577","display_name":"Nanjing Agricultural University","ror":"https://ror.org/05td3s095","country_code":"CN","type":"education","lineage":["https://openalex.org/I119454577"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chang Liu","raw_affiliation_strings":["College of Information Management, Nanjing Agricultural University, Nanjing, China"],"raw_orcid":"https://orcid.org/0000-0001-9048-4552","affiliations":[{"raw_affiliation_string":"College of Information Management, Nanjing Agricultural University, Nanjing, China","institution_ids":["https://openalex.org/I119454577"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Dongbo Wang","orcid":"https://orcid.org/0000-0001-5946-3489"},"institutions":[{"id":"https://openalex.org/I119454577","display_name":"Nanjing Agricultural University","ror":"https://ror.org/05td3s095","country_code":"CN","type":"education","lineage":["https://openalex.org/I119454577"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dongbo Wang","raw_affiliation_strings":["College of Information Management, Nanjing Agricultural University, Nanjing, China"],"raw_orcid":"https://orcid.org/0000-0001-5946-3489","affiliations":[{"raw_affiliation_string":"College of Information Management, Nanjing Agricultural University, Nanjing, China","institution_ids":["https://openalex.org/I119454577"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102534284","display_name":"Zhixiao Zhao","orcid":"https://orcid.org/0009-0007-1992-4296"},"institutions":[{"id":"https://openalex.org/I119454577","display_name":"Nanjing Agricultural University","ror":"https://ror.org/05td3s095","country_code":"CN","type":"education","lineage":["https://openalex.org/I119454577"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhixiao Zhao","raw_affiliation_strings":["College of Information Management, Nanjing Agricultural University, Nanjing, China"],"raw_orcid":"https://orcid.org/0009-0007-1992-4296","affiliations":[{"raw_affiliation_string":"College of Information Management, Nanjing Agricultural University, Nanjing, China","institution_ids":["https://openalex.org/I119454577"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034442813","display_name":"Die Hu","orcid":"https://orcid.org/0009-0007-6730-450X"},"institutions":[{"id":"https://openalex.org/I119454577","display_name":"Nanjing Agricultural University","ror":"https://ror.org/05td3s095","country_code":"CN","type":"education","lineage":["https://openalex.org/I119454577"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Die Hu","raw_affiliation_strings":["College of Information Management, Nanjing Agricultural University, Nanjing, China"],"raw_orcid":"https://orcid.org/0009-0007-6730-450X","affiliations":[{"raw_affiliation_string":"College of Information Management, Nanjing Agricultural University, Nanjing, China","institution_ids":["https://openalex.org/I119454577"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113289466","display_name":"Mengcheng Wu","orcid":null},"institutions":[{"id":"https://openalex.org/I119454577","display_name":"Nanjing Agricultural University","ror":"https://ror.org/05td3s095","country_code":"CN","type":"education","lineage":["https://openalex.org/I119454577"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mengcheng Wu","raw_affiliation_strings":["College of Information Management, Nanjing Agricultural University, Nanjing, China"],"raw_orcid":"https://orcid.org/0009-0004-6424-6875","affiliations":[{"raw_affiliation_string":"College of Information Management, Nanjing Agricultural University, Nanjing, China","institution_ids":["https://openalex.org/I119454577"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068300675","display_name":"Litao Lin","orcid":"https://orcid.org/0000-0001-8287-936X"},"institutions":[{"id":"https://openalex.org/I119454577","display_name":"Nanjing Agricultural University","ror":"https://ror.org/05td3s095","country_code":"CN","type":"education","lineage":["https://openalex.org/I119454577"]},{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Litao Lin","raw_affiliation_strings":["School of Information Management, Nanjing University, Nanjing, China","College of Information Management, Nanjing Agricultural University, Nanjing, China"],"raw_orcid":"https://orcid.org/0000-0001-8287-936X","affiliations":[{"raw_affiliation_string":"School of Information Management, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]},{"raw_affiliation_string":"College of Information Management, Nanjing Agricultural University, Nanjing, China","institution_ids":["https://openalex.org/I119454577"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083285009","display_name":"Jiangfeng Liu","orcid":"https://orcid.org/0000-0001-7268-7313"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiangfeng Liu","raw_affiliation_strings":["School of Information Management, Nanjing University, Nanjing, China"],"raw_orcid":"https://orcid.org/0000-0001-7268-7313","affiliations":[{"raw_affiliation_string":"School of Information Management, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047769452","display_name":"H. P. Zhang","orcid":"https://orcid.org/0000-0003-3698-5385"},"institutions":[{"id":"https://openalex.org/I119454577","display_name":"Nanjing Agricultural University","ror":"https://ror.org/05td3s095","country_code":"CN","type":"education","lineage":["https://openalex.org/I119454577"]},{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hai Zhang","raw_affiliation_strings":["College of Information Management, Nanjing Agricultural University, Nanjing, China","School of Information Management, Nanjing University, Nanjing, China"],"raw_orcid":"https://orcid.org/0000-0003-3698-5385","affiliations":[{"raw_affiliation_string":"College of Information Management, Nanjing Agricultural University, Nanjing, China","institution_ids":["https://openalex.org/I119454577"]},{"raw_affiliation_string":"School of Information Management, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102279651","display_name":"Si Shen","orcid":"https://orcid.org/0009-0003-3554-4307"},"institutions":[{"id":"https://openalex.org/I36399199","display_name":"Nanjing University of Science and Technology","ror":"https://ror.org/00xp9wg62","country_code":"CN","type":"education","lineage":["https://openalex.org/I36399199"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Si Shen","raw_affiliation_strings":["Group of Science and Technology Full-text Knowledge Mining, School of Economics and Management, Nanjing University of Science and Technology, Nanjing, China","Group of Science and Technology Full-text Knowledge Mining, School of Economics &amp; Management, Nanjing University of Science and Technology, Nanjing, China"],"raw_orcid":"https://orcid.org/0009-0003-3554-4307","affiliations":[{"raw_affiliation_string":"Group of Science and Technology Full-text Knowledge Mining, School of Economics and Management, Nanjing University of Science and Technology, Nanjing, China","institution_ids":["https://openalex.org/I36399199"]},{"raw_affiliation_string":"Group of Science and Technology Full-text Knowledge Mining, School of Economics &amp; Management, Nanjing University of Science and Technology, Nanjing, China","institution_ids":["https://openalex.org/I36399199"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100365206","display_name":"Bin Li","orcid":"https://orcid.org/0000-0002-7328-9947"},"institutions":[{"id":"https://openalex.org/I152031979","display_name":"Nanjing Normal University","ror":"https://ror.org/036trcv74","country_code":"CN","type":"education","lineage":["https://openalex.org/I152031979"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bin Li","raw_affiliation_strings":["College of Liberal Art, Nanjing Normal University, Nanjing, China"],"raw_orcid":"https://orcid.org/0000-0002-7328-9947","affiliations":[{"raw_affiliation_string":"College of Liberal Art, Nanjing Normal University, Nanjing, China","institution_ids":["https://openalex.org/I152031979"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5050414514","display_name":"L. Zhao","orcid":null},"institutions":[{"id":"https://openalex.org/I161716053","display_name":"China Pharmaceutical University","ror":"https://ror.org/01sfm2718","country_code":"CN","type":"education","lineage":["https://openalex.org/I161716053"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lianzhen Zhao","raw_affiliation_strings":["School of Foreign Languages, China Pharmaceutical University, Nanjing, China"],"raw_orcid":"https://orcid.org/0009-0007-0642-8138","affiliations":[{"raw_affiliation_string":"School of Foreign Languages, China Pharmaceutical University, Nanjing, China","institution_ids":["https://openalex.org/I161716053"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":11,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.1383,"has_fulltext":false,"cited_by_count":9,"citation_normalized_percentile":{"value":0.88910998,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"17","issue":"4","first_page":"1","last_page":"17"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.9936000108718872,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9932000041007996,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.7672568559646606},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5763885378837585},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5448411107063293},{"id":"https://openalex.org/keywords/digital-humanities","display_name":"Digital humanities","score":0.517159640789032},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5002694129943848},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.46828433871269226},{"id":"https://openalex.org/keywords/perspective","display_name":"Perspective (graphical)","score":0.42636987566947937},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4172014594078064},{"id":"https://openalex.org/keywords/humanities","display_name":"Humanities","score":0.38439953327178955},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.20091721415519714},{"id":"https://openalex.org/keywords/art","display_name":"Art","score":0.14522317051887512}],"concepts":[{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.7672568559646606},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5763885378837585},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5448411107063293},{"id":"https://openalex.org/C24351657","wikidata":"https://www.wikidata.org/wiki/Q1026962","display_name":"Digital humanities","level":2,"score":0.517159640789032},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5002694129943848},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.46828433871269226},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.42636987566947937},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4172014594078064},{"id":"https://openalex.org/C15708023","wikidata":"https://www.wikidata.org/wiki/Q80083","display_name":"Humanities","level":1,"score":0.38439953327178955},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.20091721415519714},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.14522317051887512}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3676969","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3676969","pdf_url":null,"source":{"id":"https://openalex.org/S4210184050","display_name":"Journal on Computing and Cultural Heritage","issn_l":"1556-4673","issn":["1556-4673","1556-4711"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal on Computing and Cultural Heritage","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.7599999904632568}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":27,"referenced_works":["https://openalex.org/W2896457183","https://openalex.org/W2944815030","https://openalex.org/W2945260553","https://openalex.org/W2946345909","https://openalex.org/W2952771545","https://openalex.org/W2954004546","https://openalex.org/W2973078864","https://openalex.org/W2981852735","https://openalex.org/W3030513270","https://openalex.org/W3082145431","https://openalex.org/W3153444823","https://openalex.org/W3178503538","https://openalex.org/W3185341429","https://openalex.org/W3200202382","https://openalex.org/W3205068155","https://openalex.org/W3205395604","https://openalex.org/W4220941542","https://openalex.org/W4225529853","https://openalex.org/W4285141993","https://openalex.org/W4286985375","https://openalex.org/W4288088047","https://openalex.org/W4288089799","https://openalex.org/W4292779060","https://openalex.org/W4307079201","https://openalex.org/W4322621892","https://openalex.org/W6739901393","https://openalex.org/W6778883912"],"related_works":["https://openalex.org/W4365211920","https://openalex.org/W3014948380","https://openalex.org/W4380551139","https://openalex.org/W4317695495","https://openalex.org/W4287117424","https://openalex.org/W4387506531","https://openalex.org/W4238433571","https://openalex.org/W3174044702","https://openalex.org/W2967848559","https://openalex.org/W4299831724"],"abstract_inverted_index":{"The":[0,43,149,165],"rapid":[1],"development":[2],"of":[3,14,20,27,41,45,56,63,66,134,146,162,167,179,190],"generative":[4,46,102,111],"artificial":[5],"intelligence":[6],"has":[7],"brought":[8],"significant":[9],"opportunities":[10],"for":[11,60,113],"the":[12,39,64,81,93,98,107,177,187],"advancement":[13],"digital":[15,28],"humanities":[16],"research.":[17],"Intelligent":[18],"processing":[19,116,170],"ancient":[21,51,74,114,135,147,163,180],"texts,":[22,52],"as":[23],"an":[24],"essential":[25],"part":[26],"humanities,":[29],"is":[30],"also":[31],"undergoing":[32],"a":[33,53,89,110],"transformation":[34],"in":[35,38,157,169],"research":[36],"methodologies":[37],"wave":[40],"AIGC.":[42],"integration":[44],"pre-trained":[47,103],"models":[48,122],"with":[49,101],"Chinese":[50,57,96,172,192],"vital":[54],"carrier":[55],"culture,":[58],"allows":[59],"deep":[61],"mining":[62],"content":[65],"these":[67],"texts":[68,75,173],"and":[69,78,141,144,159,182,185],"provides":[70],"services":[71],"that":[72,91,152],"make":[73],"more":[76],"understandable":[77],"accessible":[79],"to":[80,175],"general":[82],"public.":[83],"In":[84],"this":[85],"research,":[86],"we":[87],"propose":[88],"method":[90],"combines":[92],"most":[94],"renowned":[95],"anthology,":[97],"\u201cSiku":[99],"Quanshu,\u201d":[100],"models.":[104],"We":[105],"developed":[106],"SikuGPT":[108,168],"model,":[109],"model":[112,127,154],"text":[115,136],"tasks,":[117],"based":[118],"on":[119,130],"GPT-type":[120],"language":[121],"by":[123],"continued":[124],"pretraining.":[125],"This":[126],"was":[128],"tested":[129],"two":[131],"typical":[132],"tasks":[133],"processing:":[137],"translation":[138],"between":[139],"classical":[140],"modern":[142],"Chinese,":[143],"classification":[145],"texts.":[148,164],"findings":[150],"reveal":[151],"our":[153],"achieves":[155],"advantages":[156],"understanding":[158],"generating":[160],"scenarios":[161],"capability":[166],"traditional":[171,191],"helps":[174],"promote":[176],"organization":[178],"information":[181],"knowledge":[183],"services,":[184],"advances":[186],"international":[188],"dissemination":[189],"culture.":[193]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
