{"id":"https://openalex.org/W2051721519","doi":"https://doi.org/10.3115/1117794.1117803","title":"Error-driven HMM-based chunk tagger with context-dependent lexicon","display_name":"Error-driven HMM-based chunk tagger with context-dependent lexicon","publication_year":2000,"publication_date":"2000-01-01","ids":{"openalex":"https://openalex.org/W2051721519","doi":"https://doi.org/10.3115/1117794.1117803","mag":"2051721519"},"language":"en","primary_location":{"id":"doi:10.3115/1117794.1117803","is_oa":true,"landing_page_url":"https://doi.org/10.3115/1117794.1117803","pdf_url":"https://dl.acm.org/doi/pdf/10.3115/1117794.1117803","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2000 Joint SIGDAT conference on Empirical methods in natural language processing and very large corpora held in conjunction with the 38th Annual Meeting of the Association for Computational Linguistics -","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.3115/1117794.1117803","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5012794465","display_name":"Guodong Zhou","orcid":"https://orcid.org/0000-0002-7887-5099"},"institutions":[{"id":"https://openalex.org/I4210108443","display_name":"Advanced Digital Sciences Center","ror":"https://ror.org/01xaqx887","country_code":"SG","type":"facility","lineage":["https://openalex.org/I4210108443"]}],"countries":["SG"],"is_corresponding":true,"raw_author_name":"GuoDong Zhou","raw_affiliation_strings":["Kent Ridge Digital Labs, Singapore","Kent Ridge Digital Labs, Singapore#TAB#"],"affiliations":[{"raw_affiliation_string":"Kent Ridge Digital Labs, Singapore","institution_ids":["https://openalex.org/I4210108443"]},{"raw_affiliation_string":"Kent Ridge Digital Labs, Singapore#TAB#","institution_ids":["https://openalex.org/I4210108443"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101860993","display_name":"Jian Su","orcid":"https://orcid.org/0009-0001-9484-5885"},"institutions":[{"id":"https://openalex.org/I4210108443","display_name":"Advanced Digital Sciences Center","ror":"https://ror.org/01xaqx887","country_code":"SG","type":"facility","lineage":["https://openalex.org/I4210108443"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Jian Su","raw_affiliation_strings":["Kent Ridge Digital Labs, Singapore","Kent Ridge Digital Labs, Singapore#TAB#"],"affiliations":[{"raw_affiliation_string":"Kent Ridge Digital Labs, Singapore","institution_ids":["https://openalex.org/I4210108443"]},{"raw_affiliation_string":"Kent Ridge Digital Labs, Singapore#TAB#","institution_ids":["https://openalex.org/I4210108443"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5012794465"],"corresponding_institution_ids":["https://openalex.org/I4210108443"],"apc_list":null,"apc_paid":null,"fwci":3.7132,"has_fulltext":true,"cited_by_count":30,"citation_normalized_percentile":{"value":0.93313735,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"13","issue":null,"first_page":"71","last_page":"79"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9951000213623047,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/treebank","display_name":"Treebank","score":0.9134090542793274},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7931721210479736},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.736741304397583},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7311177849769592},{"id":"https://openalex.org/keywords/hidden-markov-model","display_name":"Hidden Markov model","score":0.718834400177002},{"id":"https://openalex.org/keywords/noun","display_name":"Noun","score":0.6246973872184753},{"id":"https://openalex.org/keywords/lexicon","display_name":"Lexicon","score":0.6009156107902527},{"id":"https://openalex.org/keywords/verb","display_name":"Verb","score":0.5571990013122559},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5501469373703003},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5154970288276672},{"id":"https://openalex.org/keywords/precision-and-recall","display_name":"Precision and recall","score":0.4952358305454254},{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.41744381189346313},{"id":"https://openalex.org/keywords/parsing","display_name":"Parsing","score":0.36191076040267944}],"concepts":[{"id":"https://openalex.org/C206134035","wikidata":"https://www.wikidata.org/wiki/Q811525","display_name":"Treebank","level":3,"score":0.9134090542793274},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7931721210479736},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.736741304397583},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7311177849769592},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.718834400177002},{"id":"https://openalex.org/C121934690","wikidata":"https://www.wikidata.org/wiki/Q1084","display_name":"Noun","level":2,"score":0.6246973872184753},{"id":"https://openalex.org/C2778121359","wikidata":"https://www.wikidata.org/wiki/Q8096","display_name":"Lexicon","level":2,"score":0.6009156107902527},{"id":"https://openalex.org/C2776397901","wikidata":"https://www.wikidata.org/wiki/Q24905","display_name":"Verb","level":2,"score":0.5571990013122559},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5501469373703003},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5154970288276672},{"id":"https://openalex.org/C81669768","wikidata":"https://www.wikidata.org/wiki/Q2359161","display_name":"Precision and recall","level":2,"score":0.4952358305454254},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.41744381189346313},{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.36191076040267944},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.3115/1117794.1117803","is_oa":true,"landing_page_url":"https://doi.org/10.3115/1117794.1117803","pdf_url":"https://dl.acm.org/doi/pdf/10.3115/1117794.1117803","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2000 Joint SIGDAT conference on Empirical methods in natural language processing and very large corpora held in conjunction with the 38th Annual Meeting of the Association for Computational Linguistics -","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.12.5401","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.12.5401","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://acl.ldc.upenn.edu/W/W00/W00-1309.pdf","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.20.7864","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.20.7864","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://textmining.krdl.org.sg/docs/emnlpvlc2000.pdf","raw_type":"text"}],"best_oa_location":{"id":"doi:10.3115/1117794.1117803","is_oa":true,"landing_page_url":"https://doi.org/10.3115/1117794.1117803","pdf_url":"https://dl.acm.org/doi/pdf/10.3115/1117794.1117803","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2000 Joint SIGDAT conference on Empirical methods in natural language processing and very large corpora held in conjunction with the 38th Annual Meeting of the Association for Computational Linguistics -","raw_type":"proceedings-article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.6399999856948853,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2051721519.pdf","grobid_xml":"https://content.openalex.org/works/W2051721519.grobid-xml"},"referenced_works_count":24,"referenced_works":["https://openalex.org/W1489594794","https://openalex.org/W1544752668","https://openalex.org/W1551773846","https://openalex.org/W1554031433","https://openalex.org/W1571453868","https://openalex.org/W1589411737","https://openalex.org/W1612238087","https://openalex.org/W1632114991","https://openalex.org/W2061271742","https://openalex.org/W2074870484","https://openalex.org/W2097125878","https://openalex.org/W2099247782","https://openalex.org/W2116266212","https://openalex.org/W2123282296","https://openalex.org/W2125838338","https://openalex.org/W2155063582","https://openalex.org/W2162539697","https://openalex.org/W2170909726","https://openalex.org/W2951200021","https://openalex.org/W2951956562","https://openalex.org/W2952115222","https://openalex.org/W4253573210","https://openalex.org/W6633995852","https://openalex.org/W6636573309"],"related_works":["https://openalex.org/W1043255351","https://openalex.org/W2135057643","https://openalex.org/W2109902858","https://openalex.org/W1533278948","https://openalex.org/W1781980207","https://openalex.org/W2951759144","https://openalex.org/W28706907","https://openalex.org/W2949524199","https://openalex.org/W2575884139","https://openalex.org/W2017946383"],"abstract_inverted_index":{"This":[0],"paper":[1],"proposes":[2],"a":[3,21,33],"new":[4,22],"error-driven":[5,38],"HMM-based":[6,16],"text":[7],"chunk":[8,82,130],"tagger":[9,19],"with":[10,14],"context-dependent":[11,62],"lexicon.":[12],"Compared":[13],"standard":[15],"tagger,":[17],"this":[18,68],"uses":[20],"Hidden":[23],"Markov":[24],"Modelling":[25],"approach":[26,40],"which":[27],"incorporates":[28],"more":[29,61],"contextual":[30],"information":[31],"into":[32],"lexical":[34,52,63],"entry.":[35],"Moreover,":[36],"an":[37],"learning":[39],"is":[41],"adopted":[42],"to":[43,58],"decrease":[44],"the":[45],"memory":[46],"requirement":[47],"by":[48],"keeping":[49],"only":[50],"positive":[51],"entries":[53],"and":[54,73,78,85,90,92,105,121,126,133,138,140],"makes":[55],"it":[56],"possible":[57],"further":[59],"incorporate":[60],"entries.":[64],"Experiments":[65],"show":[66,118],"that":[67],"technique":[69],"achieves":[70],"overall":[71,119],"precision":[72,120],"recall":[74,122],"rates":[75,123],"of":[76,114,124],"93.40%":[77],"93.95%":[79],"for":[80,87,94,128,135,142],"all":[81,129],"types,":[83,131],"93.60%":[84],"94.64%":[86,91],"noun":[88,136],"phrases,":[89,137],"94.75%":[93],"verb":[95,143],"phrases":[96],"when":[97],"trained":[98],"on":[99,107],"PENN":[100,115],"WSJ":[101,116],"TreeBank":[102,117],"section":[103,108],"00-19":[104],"tested":[106],"20-24,":[109],"while":[110],"25-fold":[111],"validation":[112],"experiments":[113],"96.40%":[125],"96.47%":[127],"96.49%":[132],"96.99%":[134],"97.13%":[139],"97.36%":[141],"phrases.":[144]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2013,"cited_by_count":2},{"year":2012,"cited_by_count":4}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
