{"id":"https://openalex.org/W2024809659","doi":"https://doi.org/10.3115/1117794.1117815","title":"Reducing parsing complexity by intra-sentence segmentation based on maximum entropy model","display_name":"Reducing parsing complexity by intra-sentence segmentation based on maximum entropy model","publication_year":2000,"publication_date":"2000-01-01","ids":{"openalex":"https://openalex.org/W2024809659","doi":"https://doi.org/10.3115/1117794.1117815","mag":"2024809659"},"language":"en","primary_location":{"id":"doi:10.3115/1117794.1117815","is_oa":true,"landing_page_url":"https://doi.org/10.3115/1117794.1117815","pdf_url":"https://dl.acm.org/doi/pdf/10.3115/1117794.1117815","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2000 Joint SIGDAT conference on Empirical methods in natural language processing and very large corpora held in conjunction with the 38th Annual Meeting of the Association for Computational Linguistics -","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.3115/1117794.1117815","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5013474750","display_name":"Sung\u2010Dong Kim","orcid":"https://orcid.org/0000-0002-8436-5722"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Sung Dong Kim","raw_affiliation_strings":["Seoul National University, Korea","Seoul National University (Korea)"],"affiliations":[{"raw_affiliation_string":"Seoul National University, Korea","institution_ids":["https://openalex.org/I139264467"]},{"raw_affiliation_string":"Seoul National University (Korea)","institution_ids":["https://openalex.org/I139264467"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107826037","display_name":"Byoung\u2010Tak Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Byoung-Tak Zhang","raw_affiliation_strings":["Seoul National University, Korea","Seoul National University (Korea)"],"affiliations":[{"raw_affiliation_string":"Seoul National University, Korea","institution_ids":["https://openalex.org/I139264467"]},{"raw_affiliation_string":"Seoul National University (Korea)","institution_ids":["https://openalex.org/I139264467"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5089859598","display_name":"Yung Taek Kim","orcid":null},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Yung Taek Kim","raw_affiliation_strings":["Seoul National University, Korea","Seoul National University (Korea)"],"affiliations":[{"raw_affiliation_string":"Seoul National University, Korea","institution_ids":["https://openalex.org/I139264467"]},{"raw_affiliation_string":"Seoul National University (Korea)","institution_ids":["https://openalex.org/I139264467"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5013474750"],"corresponding_institution_ids":["https://openalex.org/I139264467"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":3,"citation_normalized_percentile":{"value":0.11415804,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"13","issue":null,"first_page":"164","last_page":"171"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9922999739646912,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/parsing","display_name":"Parsing","score":0.8637642860412598},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.8366724252700806},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7515602111816406},{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.726290225982666},{"id":"https://openalex.org/keywords/principle-of-maximum-entropy","display_name":"Principle of maximum entropy","score":0.6599817276000977},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6584125757217407},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4887573719024658},{"id":"https://openalex.org/keywords/entropy","display_name":"Entropy (arrow of time)","score":0.4457905888557434},{"id":"https://openalex.org/keywords/computational-complexity-theory","display_name":"Computational complexity theory","score":0.4319227635860443},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.33967769145965576},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.23925769329071045}],"concepts":[{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.8637642860412598},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.8366724252700806},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7515602111816406},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.726290225982666},{"id":"https://openalex.org/C9679016","wikidata":"https://www.wikidata.org/wiki/Q1417473","display_name":"Principle of maximum entropy","level":2,"score":0.6599817276000977},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6584125757217407},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4887573719024658},{"id":"https://openalex.org/C106301342","wikidata":"https://www.wikidata.org/wiki/Q4117933","display_name":"Entropy (arrow of time)","level":2,"score":0.4457905888557434},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.4319227635860443},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.33967769145965576},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.23925769329071045},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.3115/1117794.1117815","is_oa":true,"landing_page_url":"https://doi.org/10.3115/1117794.1117815","pdf_url":"https://dl.acm.org/doi/pdf/10.3115/1117794.1117815","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2000 Joint SIGDAT conference on Empirical methods in natural language processing and very large corpora held in conjunction with the 38th Annual Meeting of the Association for Computational Linguistics -","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.12.7166","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.12.7166","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://acl.ldc.upenn.edu/W/W00/W00-1321.pdf","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.21.493","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.21.493","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://bi.snu.ac.kr/Publications/Conferences/International/EMNLP2000.pdf","raw_type":"text"}],"best_oa_location":{"id":"doi:10.3115/1117794.1117815","is_oa":true,"landing_page_url":"https://doi.org/10.3115/1117794.1117815","pdf_url":"https://dl.acm.org/doi/pdf/10.3115/1117794.1117815","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2000 Joint SIGDAT conference on Empirical methods in natural language processing and very large corpora held in conjunction with the 38th Annual Meeting of the Association for Computational Linguistics -","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2024809659.pdf","grobid_xml":"https://content.openalex.org/works/W2024809659.grobid-xml"},"referenced_works_count":13,"referenced_works":["https://openalex.org/W132450547","https://openalex.org/W1490831147","https://openalex.org/W1495949396","https://openalex.org/W1549123485","https://openalex.org/W1550597138","https://openalex.org/W1572970401","https://openalex.org/W1605351056","https://openalex.org/W1966032129","https://openalex.org/W2001792610","https://openalex.org/W2018560257","https://openalex.org/W2032558547","https://openalex.org/W2059230065","https://openalex.org/W2137813774"],"related_works":["https://openalex.org/W579810227","https://openalex.org/W2142145894","https://openalex.org/W2952780262","https://openalex.org/W2375873920","https://openalex.org/W2979495269","https://openalex.org/W2392917763","https://openalex.org/W2146114872","https://openalex.org/W3041490575","https://openalex.org/W2970690932","https://openalex.org/W2110715801"],"abstract_inverted_index":{"Long":[0],"sentence":[1],"analysis":[2],"has":[3],"been":[4],"a":[5,41],"critical":[6],"problem":[7],"because":[8],"of":[9,17,37,51],"high":[10],"complexity.":[11],"This":[12],"paper":[13],"addresses":[14],"the":[15,52],"reduction":[16],"parsing":[18,61],"complexity":[19],"by":[20,65],"intra-sentence":[21],"segmentation,":[22],"and":[23,49,57,69],"presents":[24],"maximum":[25],"entropy":[26],"model":[27,33],"for":[28],"determining":[29],"segmentation":[30,38],"positions.":[31],"The":[32,60],"features":[34],"lexical":[35],"contexts":[36],"positions,":[39],"giving":[40],"probability":[42],"to":[43],"each":[44],"potential":[45],"position.":[46],"Segmentation":[47],"coverage":[48],"accuracy":[50],"proposed":[53],"method":[54],"are":[55],"96%":[56],"88%":[58],"respectively.":[59],"efficiency":[62],"is":[63],"improved":[64],"77%":[66],"in":[67,71],"time":[68],"71%":[70],"space.":[72]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
