{"id":"https://openalex.org/W2751200649","doi":"https://doi.org/10.1587/transinf.2017edp7043","title":"Modeling Content Structures of Domain-Specific Texts with RUP-HDP-HSMM and Its Applications","display_name":"Modeling Content Structures of Domain-Specific Texts with RUP-HDP-HSMM and Its Applications","publication_year":2017,"publication_date":"2017-01-01","ids":{"openalex":"https://openalex.org/W2751200649","doi":"https://doi.org/10.1587/transinf.2017edp7043","mag":"2751200649"},"language":"en","primary_location":{"id":"doi:10.1587/transinf.2017edp7043","is_oa":true,"landing_page_url":"https://doi.org/10.1587/transinf.2017edp7043","pdf_url":"https://www.jstage.jst.go.jp/article/transinf/E100.D/9/E100.D_2017EDP7043/_pdf","source":{"id":"https://openalex.org/S2486202937","display_name":"IEICE Transactions on Information and Systems","issn_l":"0916-8532","issn":["0916-8532","1745-1361"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4320800604","host_organization_name":"Institute of Electronics, Information and Communication Engineers","host_organization_lineage":["https://openalex.org/P4320800604"],"host_organization_lineage_names":["Institute of Electronics, Information and Communication Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEICE Transactions on Information and Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://www.jstage.jst.go.jp/article/transinf/E100.D/9/E100.D_2017EDP7043/_pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5109377230","display_name":"Youwei Lu","orcid":null},"institutions":[{"id":"https://openalex.org/I114531698","display_name":"Tokyo Institute of Technology","ror":"https://ror.org/0112mx960","country_code":"JP","type":"education","lineage":["https://openalex.org/I114531698"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Youwei LU","raw_affiliation_strings":["Department of Computational Intelligence and Systems Science, Tokyo Institute of Technology"],"affiliations":[{"raw_affiliation_string":"Department of Computational Intelligence and Systems Science, Tokyo Institute of Technology","institution_ids":["https://openalex.org/I114531698"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080920610","display_name":"Shogo Okada","orcid":"https://orcid.org/0000-0002-9260-0403"},"institutions":[{"id":"https://openalex.org/I177738480","display_name":"Japan Advanced Institute of Science and Technology","ror":"https://ror.org/03frj4r98","country_code":"JP","type":"education","lineage":["https://openalex.org/I177738480"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Shogo OKADA","raw_affiliation_strings":["School of Information Science, Japan Advanced Institute of Science and Technology"],"affiliations":[{"raw_affiliation_string":"School of Information Science, Japan Advanced Institute of Science and Technology","institution_ids":["https://openalex.org/I177738480"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5109912424","display_name":"Katsumi Nitta","orcid":"https://orcid.org/0000-0002-9018-8603"},"institutions":[{"id":"https://openalex.org/I114531698","display_name":"Tokyo Institute of Technology","ror":"https://ror.org/0112mx960","country_code":"JP","type":"education","lineage":["https://openalex.org/I114531698"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Katsumi NITTA","raw_affiliation_strings":["School of Computing, Tokyo Institute of Technology"],"affiliations":[{"raw_affiliation_string":"School of Computing, Tokyo Institute of Technology","institution_ids":["https://openalex.org/I114531698"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5109377230"],"corresponding_institution_ids":["https://openalex.org/I114531698"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.1126533,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"E100.D","issue":"9","first_page":"2126","last_page":"2137"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9882000088691711,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7232098579406738},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.5994711518287659},{"id":"https://openalex.org/keywords/content","display_name":"Content (measure theory)","score":0.5983149409294128},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.06942570209503174}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7232098579406738},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.5994711518287659},{"id":"https://openalex.org/C2778152352","wikidata":"https://www.wikidata.org/wiki/Q5165061","display_name":"Content (measure theory)","level":2,"score":0.5983149409294128},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.06942570209503174},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1587/transinf.2017edp7043","is_oa":true,"landing_page_url":"https://doi.org/10.1587/transinf.2017edp7043","pdf_url":"https://www.jstage.jst.go.jp/article/transinf/E100.D/9/E100.D_2017EDP7043/_pdf","source":{"id":"https://openalex.org/S2486202937","display_name":"IEICE Transactions on Information and Systems","issn_l":"0916-8532","issn":["0916-8532","1745-1361"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4320800604","host_organization_name":"Institute of Electronics, Information and Communication Engineers","host_organization_lineage":["https://openalex.org/P4320800604"],"host_organization_lineage_names":["Institute of Electronics, Information and Communication Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEICE Transactions on Information and Systems","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1587/transinf.2017edp7043","is_oa":true,"landing_page_url":"https://doi.org/10.1587/transinf.2017edp7043","pdf_url":"https://www.jstage.jst.go.jp/article/transinf/E100.D/9/E100.D_2017EDP7043/_pdf","source":{"id":"https://openalex.org/S2486202937","display_name":"IEICE Transactions on Information and Systems","issn_l":"0916-8532","issn":["0916-8532","1745-1361"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4320800604","host_organization_name":"Institute of Electronics, Information and Communication Engineers","host_organization_lineage":["https://openalex.org/P4320800604"],"host_organization_lineage_names":["Institute of Electronics, Information and Communication Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEICE Transactions on Information and Systems","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2751200649.pdf","grobid_xml":"https://content.openalex.org/works/W2751200649.grobid-xml"},"referenced_works_count":20,"referenced_works":["https://openalex.org/W1502101714","https://openalex.org/W1532325895","https://openalex.org/W1578979740","https://openalex.org/W1614151208","https://openalex.org/W1880262756","https://openalex.org/W2011760672","https://openalex.org/W2053569739","https://openalex.org/W2076618452","https://openalex.org/W2096110600","https://openalex.org/W2118370253","https://openalex.org/W2124585778","https://openalex.org/W2128709346","https://openalex.org/W2132991226","https://openalex.org/W2133227439","https://openalex.org/W2136019741","https://openalex.org/W2151967501","https://openalex.org/W2158266063","https://openalex.org/W2882319491","https://openalex.org/W3104490327","https://openalex.org/W4213009331"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W2382290278","https://openalex.org/W2478288626","https://openalex.org/W4391913857","https://openalex.org/W2350741829","https://openalex.org/W2530322880"],"abstract_inverted_index":{"We":[0,73],"propose":[1],"a":[2,59,63,142,156,161],"novel":[3],"method,":[4],"built":[5],"upon":[6],"the":[7,16,52,55,76,86,147,165],"hierarchical":[8],"Dirichlet":[9],"process":[10,61],"hidden":[11,90],"semi-Markov":[12],"model,":[13],"to":[14,115,152],"reveal":[15],"content":[17,24],"structures":[18,25],"of":[19,26,29,48,54,100,136,144],"unstructured":[20],"domain-specific":[21,137],"texts.":[22,138],"The":[23,45],"texts":[27],"consisting":[28],"sequential":[30],"local":[31,148],"contexts":[32,149],"are":[33],"useful":[34],"for":[35,113,154],"tasks,":[36],"such":[37],"as":[38,160],"text":[39,43,105,122,157],"retrieval,":[40],"classification,":[41],"and":[42,108],"mining.":[44],"prominent":[46],"feature":[47],"our":[49,93,104,121,130],"model":[50],"is":[51,158],"use":[53],"recursive":[56,77],"uniform":[57,78],"partitioning,":[58],"stochastic":[60],"taking":[62],"view":[64],"different":[65],"from":[66],"existing":[67],"HSMMs":[68],"in":[69,84,98,103,120,164],"modeling":[70],"state":[71],"duration.":[72],"show":[74],"that":[75,129,150],"partitioning":[79],"plays":[80],"an":[81],"important":[82],"role":[83],"avoiding":[85],"rapid":[87],"switching":[88],"between":[89],"states.":[91],"Remarkably,":[92],"method":[94,131,143],"greatly":[95],"outperforms":[96],"others":[97],"terms":[99],"ranking":[101],"performance":[102],"retrieval":[106],"experiments,":[107],"provides":[109],"more":[110],"accurate":[111],"features":[112],"SVM":[114],"achieve":[116],"higher":[117],"F1":[118],"scores":[119],"classification":[123],"experiments.":[124],"These":[125],"experiment":[126],"results":[127],"suggest":[128],"can":[132],"yield":[133],"improved":[134],"representations":[135],"Furthermore,":[139],"we":[140],"present":[141],"automatically":[145],"discovering":[146],"serve":[151],"account":[153],"why":[155],"classified":[159],"positive":[162],"instance,":[163],"supervised":[166],"learning":[167],"settings.":[168]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
