{"id":"https://openalex.org/W2120006020","doi":"https://doi.org/10.1017/s1351324903003097","title":"Application of finite-state transducers to the acquisition of verb subcategorization information","display_name":"Application of finite-state transducers to the acquisition of verb subcategorization information","publication_year":2003,"publication_date":"2003-03-01","ids":{"openalex":"https://openalex.org/W2120006020","doi":"https://doi.org/10.1017/s1351324903003097","mag":"2120006020"},"language":"en","primary_location":{"id":"doi:10.1017/s1351324903003097","is_oa":false,"landing_page_url":"https://doi.org/10.1017/s1351324903003097","pdf_url":null,"source":{"id":"https://openalex.org/S18088403","display_name":"Natural Language Engineering","issn_l":"1351-3249","issn":["1351-3249","1469-8110"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311721","host_organization_name":"Cambridge University Press","host_organization_lineage":["https://openalex.org/P4310311721","https://openalex.org/P4310311702"],"host_organization_lineage_names":["Cambridge University Press","University of Cambridge"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Natural Language Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5085496182","display_name":"Izaskun Aldezabal","orcid":"https://orcid.org/0000-0001-7630-1406"},"institutions":[{"id":"https://openalex.org/I169108374","display_name":"University of the Basque Country","ror":"https://ror.org/000xsnr85","country_code":"ES","type":"education","lineage":["https://openalex.org/I169108374"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"I. ALDEZABAL","raw_affiliation_strings":["IXA group, Department of Computer Languages and Systems, University of the Basque Country, 649 P.K., 20080-Donostia, Spain e-mail:","IXA group, Department of Computer Languages and Systems, University of the Basque Country, 649 P.K., 20080-Donostia, Spain e-mail: jibalroi@si.ehu.es"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IXA group, Department of Computer Languages and Systems, University of the Basque Country, 649 P.K., 20080-Donostia, Spain e-mail:","institution_ids":["https://openalex.org/I169108374"]},{"raw_affiliation_string":"IXA group, Department of Computer Languages and Systems, University of the Basque Country, 649 P.K., 20080-Donostia, Spain e-mail: jibalroi@si.ehu.es","institution_ids":["https://openalex.org/I169108374"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100657245","display_name":"Mar\u00eda Jes\u00fas Aranzabe","orcid":"https://orcid.org/0000-0002-0401-1087"},"institutions":[{"id":"https://openalex.org/I169108374","display_name":"University of the Basque Country","ror":"https://ror.org/000xsnr85","country_code":"ES","type":"education","lineage":["https://openalex.org/I169108374"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"M. ARANZABE","raw_affiliation_strings":["IXA group, Department of Computer Languages and Systems, University of the Basque Country, 649 P.K., 20080-Donostia, Spain e-mail:","IXA group, Department of Computer Languages and Systems, University of the Basque Country, 649 P.K., 20080-Donostia, Spain e-mail: jibarurm@si.ehu.es"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IXA group, Department of Computer Languages and Systems, University of the Basque Country, 649 P.K., 20080-Donostia, Spain e-mail:","institution_ids":["https://openalex.org/I169108374"]},{"raw_affiliation_string":"IXA group, Department of Computer Languages and Systems, University of the Basque Country, 649 P.K., 20080-Donostia, Spain e-mail: jibarurm@si.ehu.es","institution_ids":["https://openalex.org/I169108374"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030328561","display_name":"Koldo Gojenola","orcid":"https://orcid.org/0000-0002-2116-6611"},"institutions":[{"id":"https://openalex.org/I169108374","display_name":"University of the Basque Country","ror":"https://ror.org/000xsnr85","country_code":"ES","type":"education","lineage":["https://openalex.org/I169108374"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"K. GOJENOLA","raw_affiliation_strings":["IXA group, Department of Computer Languages and Systems, University of the Basque Country, 649 P.K., 20080-Donostia, Spain e-mail:","IXA group, Department of Computer Languages and Systems, University of the Basque Country, 649 P.K., 20080-Donostia, Spain e-mail: jipgogak@si.ehu.es"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IXA group, Department of Computer Languages and Systems, University of the Basque Country, 649 P.K., 20080-Donostia, Spain e-mail:","institution_ids":["https://openalex.org/I169108374"]},{"raw_affiliation_string":"IXA group, Department of Computer Languages and Systems, University of the Basque Country, 649 P.K., 20080-Donostia, Spain e-mail: jipgogak@si.ehu.es","institution_ids":["https://openalex.org/I169108374"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017928422","display_name":"Maite Oronoz","orcid":"https://orcid.org/0000-0001-9097-6047"},"institutions":[{"id":"https://openalex.org/I169108374","display_name":"University of the Basque Country","ror":"https://ror.org/000xsnr85","country_code":"ES","type":"education","lineage":["https://openalex.org/I169108374"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"M. ORONOZ","raw_affiliation_strings":["IXA group, Department of Computer Languages and Systems, University of the Basque Country, 649 P.K., 20080-Donostia, Spain e-mail:","IXA group, Department of Computer Languages and Systems, University of the Basque Country, 649 P.K., 20080-Donostia, Spain e-mail: jiboranm@si.ehu.es#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IXA group, Department of Computer Languages and Systems, University of the Basque Country, 649 P.K., 20080-Donostia, Spain e-mail:","institution_ids":["https://openalex.org/I169108374"]},{"raw_affiliation_string":"IXA group, Department of Computer Languages and Systems, University of the Basque Country, 649 P.K., 20080-Donostia, Spain e-mail: jiboranm@si.ehu.es#TAB#","institution_ids":["https://openalex.org/I169108374"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070002404","display_name":"Kepa Sarasola","orcid":"https://orcid.org/0000-0003-4349-6088"},"institutions":[{"id":"https://openalex.org/I169108374","display_name":"University of the Basque Country","ror":"https://ror.org/000xsnr85","country_code":"ES","type":"education","lineage":["https://openalex.org/I169108374"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"K. SARASOLA","raw_affiliation_strings":["IXA group, Department of Computer Languages and Systems, University of the Basque Country, 649 P.K., 20080-Donostia, Spain e-mail:","IXA group, Department of Computer Languages and Systems, University of the Basque Country, 649 P.K., 20080-Donostia, Spain e-mail: jipsagak@si.ehu.es#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IXA group, Department of Computer Languages and Systems, University of the Basque Country, 649 P.K., 20080-Donostia, Spain e-mail:","institution_ids":["https://openalex.org/I169108374"]},{"raw_affiliation_string":"IXA group, Department of Computer Languages and Systems, University of the Basque Country, 649 P.K., 20080-Donostia, Spain e-mail: jipsagak@si.ehu.es#TAB#","institution_ids":["https://openalex.org/I169108374"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5005074637","display_name":"Aitziber Atutxa","orcid":"https://orcid.org/0000-0003-4512-8633"},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"A. ATUTXA","raw_affiliation_strings":["Department of Linguistics, University of Maryland, College Park, MD 20742, USA e-mail:","Department of Linguistics, University of Maryland, College Park, MD 20742, USA e-mail: sener@wam.umd.edu#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Linguistics, University of Maryland, College Park, MD 20742, USA e-mail:","institution_ids":["https://openalex.org/I66946132"]},{"raw_affiliation_string":"Department of Linguistics, University of Maryland, College Park, MD 20742, USA e-mail: sener@wam.umd.edu#TAB#","institution_ids":["https://openalex.org/I66946132"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.3442,"has_fulltext":false,"cited_by_count":9,"citation_normalized_percentile":{"value":0.90018546,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":null,"biblio":{"volume":"9","issue":"1","first_page":"39","last_page":"48"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9882000088691711,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.9833999872207642,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/subcategorization","display_name":"Subcategorization","score":0.9113556146621704},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8648040294647217},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.7338653802871704},{"id":"https://openalex.org/keywords/verb","display_name":"Verb","score":0.7284075021743774},{"id":"https://openalex.org/keywords/parsing","display_name":"Parsing","score":0.6612966060638428},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6454652547836304},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5056211948394775},{"id":"https://openalex.org/keywords/finite-state","display_name":"Finite state","score":0.4791276156902313},{"id":"https://openalex.org/keywords/noun","display_name":"Noun","score":0.4503372013568878},{"id":"https://openalex.org/keywords/grammar","display_name":"Grammar","score":0.4220025837421417},{"id":"https://openalex.org/keywords/noun-phrase","display_name":"Noun phrase","score":0.4111669957637787},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.39810407161712646},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.15432608127593994},{"id":"https://openalex.org/keywords/markov-chain","display_name":"Markov chain","score":0.0966101884841919}],"concepts":[{"id":"https://openalex.org/C70845037","wikidata":"https://www.wikidata.org/wiki/Q6980760","display_name":"Subcategorization","level":3,"score":0.9113556146621704},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8648040294647217},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.7338653802871704},{"id":"https://openalex.org/C2776397901","wikidata":"https://www.wikidata.org/wiki/Q24905","display_name":"Verb","level":2,"score":0.7284075021743774},{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.6612966060638428},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6454652547836304},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5056211948394775},{"id":"https://openalex.org/C2983497884","wikidata":"https://www.wikidata.org/wiki/Q176452","display_name":"Finite state","level":3,"score":0.4791276156902313},{"id":"https://openalex.org/C121934690","wikidata":"https://www.wikidata.org/wiki/Q1084","display_name":"Noun","level":2,"score":0.4503372013568878},{"id":"https://openalex.org/C26022165","wikidata":"https://www.wikidata.org/wiki/Q8091","display_name":"Grammar","level":2,"score":0.4220025837421417},{"id":"https://openalex.org/C153962237","wikidata":"https://www.wikidata.org/wiki/Q1401131","display_name":"Noun phrase","level":3,"score":0.4111669957637787},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.39810407161712646},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.15432608127593994},{"id":"https://openalex.org/C98763669","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov chain","level":2,"score":0.0966101884841919},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1017/s1351324903003097","is_oa":false,"landing_page_url":"https://doi.org/10.1017/s1351324903003097","pdf_url":null,"source":{"id":"https://openalex.org/S18088403","display_name":"Natural Language Engineering","issn_l":"1351-3249","issn":["1351-3249","1469-8110"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311721","host_organization_name":"Cambridge University Press","host_organization_lineage":["https://openalex.org/P4310311721","https://openalex.org/P4310311702"],"host_organization_lineage_names":["Cambridge University Press","University of Cambridge"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Natural Language Engineering","raw_type":"journal-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.20.9116","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.20.9116","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://ixa.si.ehu.es/dokument/Artikulu/01ESSLLI.pdf","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.7.8225","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.7.8225","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://ixa.si.ehu.es/Ixa/Argitalpenak/Artikuluak/1055319279/publikoak/nle-argitaratua.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.6299999952316284,"display_name":"Quality Education"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320323737","display_name":"Ministerio de Ciencia y Tecnolog\u00eda","ror":"https://ror.org/034900433"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W1499641710","https://openalex.org/W1527398610","https://openalex.org/W1588265531","https://openalex.org/W1589269291","https://openalex.org/W1904428263","https://openalex.org/W1980907635","https://openalex.org/W1991923024","https://openalex.org/W2008172256","https://openalex.org/W2088198454","https://openalex.org/W2093476618","https://openalex.org/W2096369514","https://openalex.org/W2108455276","https://openalex.org/W2122978558","https://openalex.org/W2127349157","https://openalex.org/W2157439354","https://openalex.org/W2295375623","https://openalex.org/W2951085107","https://openalex.org/W2951151097","https://openalex.org/W2951837407"],"related_works":["https://openalex.org/W2400253058","https://openalex.org/W2354679542","https://openalex.org/W2250921869","https://openalex.org/W2250526231","https://openalex.org/W2388592016","https://openalex.org/W4300910997","https://openalex.org/W1575587935","https://openalex.org/W2025590371","https://openalex.org/W2375184316","https://openalex.org/W2137478468"],"abstract_inverted_index":{"This":[0],"paper":[1],"presents":[2],"the":[3,19,62],"design":[4],"and":[5,46,59],"implementation":[6],"of":[7,12,21,56,61,83],"a":[8,32,49,68],"finite-state":[9,50],"syntactic":[10,38,53,75],"grammar":[11],"Basque":[13],"that":[14,94],"has":[15,35],"been":[16],"used":[17],"with":[18,72],"objective":[20],"extracting":[22],"information":[23],"about":[24],"verb":[25,69,87],"subcategorization":[26],"instances":[27],"from":[28,97],"newspaper":[29],"texts.":[30],"After":[31],"partial":[33],"parser":[34,51],"built":[36],"basic":[37],"units":[39],"such":[40],"as":[41],"noun":[42],"phrases,":[43,45],"prepositional":[44],"sentential":[47],"complements,":[48],"performs":[52],"disambiguation,":[54],"determination":[55],"clause":[57],"boundaries":[58],"filtering":[60],"results,":[63],"in":[64],"order":[65],"to":[66],"obtain":[67],"occurrence":[70],"together":[71],"its":[73],"associated":[74],"components,":[76],"either":[77],"complements":[78],"or":[79],"adjuncts.":[80,98],"The":[81],"set":[82],"occurrences":[84],"for":[85],"each":[86],"is":[88],"then":[89],"filtered":[90],"by":[91],"statistical":[92],"measures":[93],"distinguish":[95],"arguments":[96]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
