{"id":"https://openalex.org/W4406461910","doi":"https://doi.org/10.1109/bigdata62323.2024.10825111","title":"Pre-Trained Language Models with Topic Attention for Supervised Document Structure Learning","display_name":"Pre-Trained Language Models with Topic Attention for Supervised Document Structure Learning","publication_year":2024,"publication_date":"2024-12-15","ids":{"openalex":"https://openalex.org/W4406461910","doi":"https://doi.org/10.1109/bigdata62323.2024.10825111"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata62323.2024.10825111","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata62323.2024.10825111","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Big Data (BigData)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5069574538","display_name":"Dang Pham","orcid":"https://orcid.org/0000-0002-0924-8403"},"institutions":[{"id":"https://openalex.org/I10052268","display_name":"New Mexico State University","ror":"https://ror.org/00hpz7z43","country_code":"US","type":"education","lineage":["https://openalex.org/I10052268"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Dang Pham","raw_affiliation_strings":["New Mexico State University,Department of Computer Science"],"affiliations":[{"raw_affiliation_string":"New Mexico State University,Department of Computer Science","institution_ids":["https://openalex.org/I10052268"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5059645701","display_name":"Tuan M. V. Le","orcid":"https://orcid.org/0000-0001-9998-1045"},"institutions":[{"id":"https://openalex.org/I10052268","display_name":"New Mexico State University","ror":"https://ror.org/00hpz7z43","country_code":"US","type":"education","lineage":["https://openalex.org/I10052268"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Tuan M. V. Le","raw_affiliation_strings":["New Mexico State University,Department of Computer Science"],"affiliations":[{"raw_affiliation_string":"New Mexico State University,Department of Computer Science","institution_ids":["https://openalex.org/I10052268"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5069574538"],"corresponding_institution_ids":["https://openalex.org/I10052268"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.23185713,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1094","last_page":"1103"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7977371215820312},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6658273935317993},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.634038507938385},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.4682888388633728},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.33876317739486694}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7977371215820312},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6658273935317993},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.634038507938385},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.4682888388633728},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.33876317739486694}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bigdata62323.2024.10825111","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata62323.2024.10825111","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Big Data (BigData)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.6100000143051147}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":43,"referenced_works":["https://openalex.org/W193333623","https://openalex.org/W1522301498","https://openalex.org/W1959608418","https://openalex.org/W2023440853","https://openalex.org/W2075942762","https://openalex.org/W2101101940","https://openalex.org/W2147994374","https://openalex.org/W2190817982","https://openalex.org/W2470673105","https://openalex.org/W2565349465","https://openalex.org/W2567736915","https://openalex.org/W2886946814","https://openalex.org/W2896457183","https://openalex.org/W2959589111","https://openalex.org/W2963355447","https://openalex.org/W2963414291","https://openalex.org/W2970217403","https://openalex.org/W2970771982","https://openalex.org/W2977752818","https://openalex.org/W2990138404","https://openalex.org/W3010804678","https://openalex.org/W3034834827","https://openalex.org/W3046553216","https://openalex.org/W3101587314","https://openalex.org/W3128288937","https://openalex.org/W3177599311","https://openalex.org/W4220873409","https://openalex.org/W4231510805","https://openalex.org/W4285138469","https://openalex.org/W4294554825","https://openalex.org/W4318028277","https://openalex.org/W4322619000","https://openalex.org/W4327644058","https://openalex.org/W4327644619","https://openalex.org/W4385498392","https://openalex.org/W4385570558","https://openalex.org/W4385574308","https://openalex.org/W6631190155","https://openalex.org/W6640963894","https://openalex.org/W6676803185","https://openalex.org/W6745097924","https://openalex.org/W6779928756","https://openalex.org/W6795022033"],"related_works":["https://openalex.org/W2961085424","https://openalex.org/W4306674287","https://openalex.org/W4387369504","https://openalex.org/W3046775127","https://openalex.org/W4394896187","https://openalex.org/W3170094116","https://openalex.org/W4386462264","https://openalex.org/W3107602296","https://openalex.org/W4364306694","https://openalex.org/W4312192474"],"abstract_inverted_index":{"The":[0,118],"discourse-level":[1],"structure":[2,85,88],"of":[3,14,31,43,56,89,112,125,136,139],"a":[4,62,70,75,95],"document":[5,58,145],"can":[6,48],"be":[7],"captured":[8],"through":[9,74],"learning":[10,55,81],"the":[11,41,54,57,83,101,110,113,130,134],"rhetorical":[12,29,37,84,116,137],"functions":[13,30,138],"sentences":[15,32,107,140],"in":[16,144],"that":[17,66,129],"document.":[18],"Existing":[19],"supervised":[20],"methods":[21],"based":[22],"on":[23,35,121],"pre-trained":[24],"language":[25,72],"models":[26],"for":[27,52,80],"classifying":[28],"usually":[33],"focus":[34],"utilizing":[36],"words":[38,47,104],"but":[39],"ignore":[40],"topics":[42],"sentences.":[44],"Since":[45],"topic":[46,64,87,96,103],"provide":[49],"additional":[50],"information":[51],"enhancing":[53],"structure,":[59],"we":[60,93],"present":[61],"neural":[63],"model":[65,73,132],"is":[67,142],"integrated":[68],"with":[69],"BERT-based":[71],"unified":[76],"probabilistic":[77],"generative":[78],"process":[79],"both":[82],"and":[86,141,147],"documents.":[90],"For":[91],"inference,":[92],"design":[94],"attention":[97],"mechanism":[98],"to":[99,108],"utilize":[100],"learned":[102],"from":[105],"previous":[106],"improve":[109],"prediction":[111],"current":[114],"sentence\u2019s":[115],"label.":[117],"extensive":[119],"experiments":[120],"four":[122],"real-world":[123],"datasets":[124],"different":[126],"domains":[127],"show":[128],"proposed":[131],"improves":[133],"detection":[135],"effective":[143],"modeling":[146],"extracting":[148],"coherent":[149],"topics.":[150]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
