{"id":"https://openalex.org/W2116632765","doi":"https://doi.org/10.3115/1073012.1073081","title":"Text chunking using regularized Winnow","display_name":"Text chunking using regularized Winnow","publication_year":2001,"publication_date":"2001-01-01","ids":{"openalex":"https://openalex.org/W2116632765","doi":"https://doi.org/10.3115/1073012.1073081","mag":"2116632765"},"language":"en","primary_location":{"id":"doi:10.3115/1073012.1073081","is_oa":true,"landing_page_url":"https://doi.org/10.3115/1073012.1073081","pdf_url":"https://dl.acm.org/doi/pdf/10.3115/1073012.1073081","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 39th Annual Meeting on Association for Computational Linguistics  - ACL '01","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.3115/1073012.1073081","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100378800","display_name":"Tong Zhang","orcid":"https://orcid.org/0000-0002-7025-6365"},"institutions":[{"id":"https://openalex.org/I1341412227","display_name":"IBM (United States)","ror":"https://ror.org/05hh8d621","country_code":"US","type":"company","lineage":["https://openalex.org/I1341412227"]},{"id":"https://openalex.org/I4210114115","display_name":"IBM Research - Thomas J. Watson Research Center","ror":"https://ror.org/0265w5591","country_code":"US","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Tong Zhang","raw_affiliation_strings":["IBM T.J. Watson Research Center, Yorktown Heights, New York","[IBM T.J. Watson Research Center, Yorktown Heights, New York]"],"affiliations":[{"raw_affiliation_string":"IBM T.J. Watson Research Center, Yorktown Heights, New York","institution_ids":["https://openalex.org/I4210114115"]},{"raw_affiliation_string":"[IBM T.J. Watson Research Center, Yorktown Heights, New York]","institution_ids":["https://openalex.org/I1341412227"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056772857","display_name":"Fred J. Damerau","orcid":null},"institutions":[{"id":"https://openalex.org/I1341412227","display_name":"IBM (United States)","ror":"https://ror.org/05hh8d621","country_code":"US","type":"company","lineage":["https://openalex.org/I1341412227"]},{"id":"https://openalex.org/I4210114115","display_name":"IBM Research - Thomas J. Watson Research Center","ror":"https://ror.org/0265w5591","country_code":"US","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Fred Damerau","raw_affiliation_strings":["IBM T.J. Watson Research Center, Yorktown Heights, New York","[IBM T.J. Watson Research Center, Yorktown Heights, New York]"],"affiliations":[{"raw_affiliation_string":"IBM T.J. Watson Research Center, Yorktown Heights, New York","institution_ids":["https://openalex.org/I4210114115"]},{"raw_affiliation_string":"[IBM T.J. Watson Research Center, Yorktown Heights, New York]","institution_ids":["https://openalex.org/I1341412227"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101586727","display_name":"David E. Johnson","orcid":"https://orcid.org/0000-0001-8793-8736"},"institutions":[{"id":"https://openalex.org/I1341412227","display_name":"IBM (United States)","ror":"https://ror.org/05hh8d621","country_code":"US","type":"company","lineage":["https://openalex.org/I1341412227"]},{"id":"https://openalex.org/I4210114115","display_name":"IBM Research - Thomas J. Watson Research Center","ror":"https://ror.org/0265w5591","country_code":"US","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"David Johnson","raw_affiliation_strings":["IBM T.J. Watson Research Center, Yorktown Heights, New York","[IBM T.J. Watson Research Center, Yorktown Heights, New York]"],"affiliations":[{"raw_affiliation_string":"IBM T.J. Watson Research Center, Yorktown Heights, New York","institution_ids":["https://openalex.org/I4210114115"]},{"raw_affiliation_string":"[IBM T.J. Watson Research Center, Yorktown Heights, New York]","institution_ids":["https://openalex.org/I1341412227"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100378800"],"corresponding_institution_ids":["https://openalex.org/I1341412227","https://openalex.org/I4210114115"],"apc_list":null,"apc_paid":null,"fwci":4.218,"has_fulltext":true,"cited_by_count":45,"citation_normalized_percentile":{"value":0.94170993,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"539","last_page":"546"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/chunking","display_name":"Chunking (psychology)","score":0.8464609980583191},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8268752694129944},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.6772069931030273},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.5977143049240112},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5960522890090942},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4512549638748169},{"id":"https://openalex.org/keywords/separable-space","display_name":"Separable space","score":0.4363935589790344},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3899040222167969},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.30620646476745605},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.10684826970100403}],"concepts":[{"id":"https://openalex.org/C203357204","wikidata":"https://www.wikidata.org/wiki/Q1089605","display_name":"Chunking (psychology)","level":2,"score":0.8464609980583191},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8268752694129944},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.6772069931030273},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.5977143049240112},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5960522890090942},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4512549638748169},{"id":"https://openalex.org/C70710897","wikidata":"https://www.wikidata.org/wiki/Q680081","display_name":"Separable space","level":2,"score":0.4363935589790344},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3899040222167969},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.30620646476745605},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.10684826970100403},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.3115/1073012.1073081","is_oa":true,"landing_page_url":"https://doi.org/10.3115/1073012.1073081","pdf_url":"https://dl.acm.org/doi/pdf/10.3115/1073012.1073081","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 39th Annual Meeting on Association for Computational Linguistics  - ACL '01","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.20.62","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.20.62","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://acl.ldc.upenn.edu/P/P01/P01-1069.pdf","raw_type":"text"},{"id":"pmh:oai:repository.hkust.edu.hk:1783.1-98643","is_oa":false,"landing_page_url":"http://repository.hkust.edu.hk/ir/Record/1783.1-98643","pdf_url":null,"source":{"id":"https://openalex.org/S4306401796","display_name":"Rare & Special e-Zone (The Hong Kong University of Science and Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I200769079","host_organization_name":"Hong Kong University of Science and Technology","host_organization_lineage":["https://openalex.org/I200769079"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Conference paper"},{"id":"pmh:oai:repository.ust.hk:1783.1-98643","is_oa":false,"landing_page_url":"http://repository.ust.hk/ir/Record/1783.1-98643","pdf_url":null,"source":{"id":"https://openalex.org/S4306401796","display_name":"Rare & Special e-Zone (The Hong Kong University of Science and Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I200769079","host_organization_name":"Hong Kong University of Science and Technology","host_organization_lineage":["https://openalex.org/I200769079"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Conference paper"}],"best_oa_location":{"id":"doi:10.3115/1073012.1073081","is_oa":true,"landing_page_url":"https://doi.org/10.3115/1073012.1073081","pdf_url":"https://dl.acm.org/doi/pdf/10.3115/1073012.1073081","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 39th Annual Meeting on Association for Computational Linguistics  - ACL '01","raw_type":"proceedings-article"},"sustainable_development_goals":[{"score":0.7900000214576721,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2116632765.pdf","grobid_xml":"https://content.openalex.org/works/W2116632765.grobid-xml"},"referenced_works_count":16,"referenced_works":["https://openalex.org/W10972377","https://openalex.org/W1560621288","https://openalex.org/W1570127741","https://openalex.org/W1589153833","https://openalex.org/W1813610639","https://openalex.org/W2040909025","https://openalex.org/W2097125878","https://openalex.org/W2098921539","https://openalex.org/W2129113961","https://openalex.org/W2143773250","https://openalex.org/W2150067374","https://openalex.org/W2161290181","https://openalex.org/W2163046677","https://openalex.org/W2949108231","https://openalex.org/W2949995692","https://openalex.org/W4246994868"],"related_works":["https://openalex.org/W2384729545","https://openalex.org/W2198395236","https://openalex.org/W2800417007","https://openalex.org/W147604216","https://openalex.org/W2161080928","https://openalex.org/W2118525872","https://openalex.org/W2279104074","https://openalex.org/W4245487161","https://openalex.org/W2090755435","https://openalex.org/W2039036070"],"abstract_inverted_index":{"Many":[0],"machine":[1],"learning":[2],"methods":[3],"have":[4],"recently":[5],"been":[6,19,55],"applied":[7],"to":[8,21,29,32,65],"natural":[9],"language":[10],"processing":[11],"tasks.":[12],"Among":[13],"them,":[14],"the":[15,76],"Winnow":[16,38,53],"algorithm":[17],"has":[18,54],"argued":[20],"be":[22],"particularly":[23],"suitable":[24],"for":[25,42],"NLP":[26],"problems,":[27],"due":[28],"its":[30],"robustness":[31],"irrelevant":[33],"features.":[34],"However":[35],"in":[36],"theory,":[37],"may":[39],"not":[40],"converge":[41],"non-separable":[43],"data.":[44],"To":[45],"remedy":[46],"this":[47,58,62,71],"problem,":[48],"a":[49],"modification":[50],"called":[51],"regularized":[52],"proposed.":[56],"In":[57],"paper,":[59],"we":[60],"apply":[61],"new":[63],"method":[64,72],"text":[66],"chunking.":[67],"We":[68],"show":[69],"that":[70],"achieves":[73],"state":[74],"of":[75],"art":[77],"performance":[78],"with":[79],"significantly":[80],"less":[81],"computation":[82],"than":[83],"previous":[84],"approaches.":[85]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2017,"cited_by_count":1},{"year":2014,"cited_by_count":1},{"year":2013,"cited_by_count":1},{"year":2012,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
