{"id":"https://openalex.org/W2143954309","doi":"https://doi.org/10.1017/s1351324905003840","title":"Bootstrapping parsers via syntactic projection across parallel texts","display_name":"Bootstrapping parsers via syntactic projection across parallel texts","publication_year":2005,"publication_date":"2005-09-01","ids":{"openalex":"https://openalex.org/W2143954309","doi":"https://doi.org/10.1017/s1351324905003840","mag":"2143954309"},"language":"en","primary_location":{"id":"doi:10.1017/s1351324905003840","is_oa":false,"landing_page_url":"https://doi.org/10.1017/s1351324905003840","pdf_url":null,"source":{"id":"https://openalex.org/S18088403","display_name":"Natural Language Engineering","issn_l":"1351-3249","issn":["1351-3249","1469-8110"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311721","host_organization_name":"Cambridge University Press","host_organization_lineage":["https://openalex.org/P4310311721","https://openalex.org/P4310311702"],"host_organization_lineage_names":["Cambridge University Press","University of Cambridge"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Natural Language Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5070135550","display_name":"Rebecca Hwa","orcid":"https://orcid.org/0000-0003-1158-7014"},"institutions":[{"id":"https://openalex.org/I170201317","display_name":"University of Pittsburgh","ror":"https://ror.org/01an3r305","country_code":"US","type":"education","lineage":["https://openalex.org/I170201317"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"REBECCA HWA","raw_affiliation_strings":["Department of Computer Science, University of Pittsburgh, PA 15260, USA e-mail:","Department of Computer Science, University of Pittsburgh, PA 15260, USA e-mail: [email\u00a0protected]#TAB#"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Pittsburgh, PA 15260, USA e-mail:","institution_ids":["https://openalex.org/I170201317"]},{"raw_affiliation_string":"Department of Computer Science, University of Pittsburgh, PA 15260, USA e-mail: [email\u00a0protected]#TAB#","institution_ids":["https://openalex.org/I170201317"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059946729","display_name":"Philip Resnik","orcid":"https://orcid.org/0000-0002-6130-8602"},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"PHILIP RESNIK","raw_affiliation_strings":["Institute for Advanced Computer Studies and Department of Linguistics, University of Maryland, College Park, MD USA 20742, USA e-mail:","Institute for Advanced Computer Studies and Department of Linguistics, University of Maryland, College Park, MD USA 20742, USA e-mail: resnik@umiacs.umd.edu, weinberg@umiacs.umd.edu, clarac@umiacs "],"affiliations":[{"raw_affiliation_string":"Institute for Advanced Computer Studies and Department of Linguistics, University of Maryland, College Park, MD USA 20742, USA e-mail:","institution_ids":["https://openalex.org/I66946132"]},{"raw_affiliation_string":"Institute for Advanced Computer Studies and Department of Linguistics, University of Maryland, College Park, MD USA 20742, USA e-mail: resnik@umiacs.umd.edu, weinberg@umiacs.umd.edu, clarac@umiacs ","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110392663","display_name":"Amy Weinberg","orcid":null},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"AMY WEINBERG","raw_affiliation_strings":["Institute for Advanced Computer Studies and Department of Linguistics, University of Maryland, College Park, MD USA 20742, USA e-mail:","Institute for Advanced Computer Studies and Department of Linguistics, University of Maryland, College Park, MD USA 20742, USA e-mail: resnik@umiacs.umd.edu, weinberg@umiacs.umd.edu, clarac@umiacs "],"affiliations":[{"raw_affiliation_string":"Institute for Advanced Computer Studies and Department of Linguistics, University of Maryland, College Park, MD USA 20742, USA e-mail:","institution_ids":["https://openalex.org/I66946132"]},{"raw_affiliation_string":"Institute for Advanced Computer Studies and Department of Linguistics, University of Maryland, College Park, MD USA 20742, USA e-mail: resnik@umiacs.umd.edu, weinberg@umiacs.umd.edu, clarac@umiacs ","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043720664","display_name":"Clara I. Cabezas","orcid":null},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"CLARA CABEZAS","raw_affiliation_strings":["Institute for Advanced Computer Studies and Department of Linguistics, University of Maryland, College Park, MD USA 20742, USA e-mail:","Institute for Advanced Computer Studies and Department of Linguistics, University of Maryland, College Park, MD USA 20742, USA e-mail: resnik@umiacs.umd.edu, weinberg@umiacs.umd.edu, clarac@umiacs "],"affiliations":[{"raw_affiliation_string":"Institute for Advanced Computer Studies and Department of Linguistics, University of Maryland, College Park, MD USA 20742, USA e-mail:","institution_ids":["https://openalex.org/I66946132"]},{"raw_affiliation_string":"Institute for Advanced Computer Studies and Department of Linguistics, University of Maryland, College Park, MD USA 20742, USA e-mail: resnik@umiacs.umd.edu, weinberg@umiacs.umd.edu, clarac@umiacs ","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5074899580","display_name":"Okan Kolak","orcid":null},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"OKAN KOLAK","raw_affiliation_strings":["Department of Computer Science, University of Maryland, College Park, MD 20742, USA e-mail:","Department of Computer Science, University of Maryland, College Park, MD 20742, USA e-mail: okan@umiacs.umd.edu"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Maryland, College Park, MD 20742, USA e-mail:","institution_ids":["https://openalex.org/I66946132"]},{"raw_affiliation_string":"Department of Computer Science, University of Maryland, College Park, MD 20742, USA e-mail: okan@umiacs.umd.edu","institution_ids":["https://openalex.org/I66946132"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5070135550"],"corresponding_institution_ids":["https://openalex.org/I170201317"],"apc_list":null,"apc_paid":null,"fwci":15.5276,"has_fulltext":false,"cited_by_count":340,"citation_normalized_percentile":{"value":0.99013018,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":100},"biblio":{"volume":"11","issue":"3","first_page":"311","last_page":"325"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9908000230789185,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.9297066926956177},{"id":"https://openalex.org/keywords/parsing","display_name":"Parsing","score":0.7885681986808777},{"id":"https://openalex.org/keywords/bootstrapping","display_name":"Bootstrapping (finance)","score":0.7847989201545715},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.7339444756507874},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6780019998550415},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6265219449996948},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.4580823481082916},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.44986462593078613},{"id":"https://openalex.org/keywords/projection","display_name":"Projection (relational algebra)","score":0.42459186911582947},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.21480754017829895},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.14897048473358154}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.9297066926956177},{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.7885681986808777},{"id":"https://openalex.org/C207609745","wikidata":"https://www.wikidata.org/wiki/Q4944086","display_name":"Bootstrapping (finance)","level":2,"score":0.7847989201545715},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.7339444756507874},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6780019998550415},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6265219449996948},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.4580823481082916},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.44986462593078613},{"id":"https://openalex.org/C57493831","wikidata":"https://www.wikidata.org/wiki/Q3134666","display_name":"Projection (relational algebra)","level":2,"score":0.42459186911582947},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.21480754017829895},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.14897048473358154},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C106159729","wikidata":"https://www.wikidata.org/wiki/Q2294553","display_name":"Financial economics","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1017/s1351324905003840","is_oa":false,"landing_page_url":"https://doi.org/10.1017/s1351324905003840","pdf_url":null,"source":{"id":"https://openalex.org/S18088403","display_name":"Natural Language Engineering","issn_l":"1351-3249","issn":["1351-3249","1469-8110"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311721","host_organization_name":"Cambridge University Press","host_organization_lineage":["https://openalex.org/P4310311721","https://openalex.org/P4310311702"],"host_organization_lineage_names":["Cambridge University Press","University of Cambridge"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Natural Language Engineering","raw_type":"journal-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.80.4033","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.80.4033","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.cs.pitt.edu/~hwa/nle04draft.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":41,"referenced_works":["https://openalex.org/W73274768","https://openalex.org/W74075037","https://openalex.org/W89239156","https://openalex.org/W568341626","https://openalex.org/W1535015163","https://openalex.org/W1607229519","https://openalex.org/W1632114991","https://openalex.org/W1924403233","https://openalex.org/W1953828586","https://openalex.org/W1972542019","https://openalex.org/W1986543644","https://openalex.org/W2000566875","https://openalex.org/W2002586403","https://openalex.org/W2010588484","https://openalex.org/W2016630033","https://openalex.org/W2046592963","https://openalex.org/W2073955506","https://openalex.org/W2076083849","https://openalex.org/W2079442239","https://openalex.org/W2097333193","https://openalex.org/W2110607519","https://openalex.org/W2114858359","https://openalex.org/W2116316001","https://openalex.org/W2117475509","https://openalex.org/W2118686841","https://openalex.org/W2124262992","https://openalex.org/W2130330688","https://openalex.org/W2137806537","https://openalex.org/W2137854946","https://openalex.org/W2142708806","https://openalex.org/W2143008661","https://openalex.org/W2155693943","https://openalex.org/W2156985047","https://openalex.org/W2158388102","https://openalex.org/W2159705183","https://openalex.org/W2160382364","https://openalex.org/W2166451556","https://openalex.org/W2168822971","https://openalex.org/W2949237929","https://openalex.org/W3021713638","https://openalex.org/W3104029765"],"related_works":["https://openalex.org/W1534274833","https://openalex.org/W3117246195","https://openalex.org/W2081850291","https://openalex.org/W2361861616","https://openalex.org/W156620619","https://openalex.org/W3046984657","https://openalex.org/W2053943328","https://openalex.org/W4381248170","https://openalex.org/W2817971408","https://openalex.org/W3189621521"],"abstract_inverted_index":{"Broad":[0],"coverage,":[1],"high":[2],"quality":[3],"parsers":[4,19,133],"are":[5,134],"available":[6],"for":[7,15,20],"only":[8],"a":[9,41,89,102],"handful":[10],"of":[11,26,72,88,122],"languages.":[12,78],"A":[13],"prerequisite":[14],"developing":[16],"broad":[17],"coverage":[18],"more":[21,77],"languages":[22],"is":[23,40,49,82],"the":[24,29,70,85,93,96,106,120],"annotation":[25,39,75],"text":[27,55,66],"with":[28,136],"desired":[30],"linguistic":[31],"representations":[32],"(also":[33],"known":[34],"as":[35],"\u201ctreebanking\u201d).":[36],"However,":[37],"syntactic":[38,74,123],"labor":[42],"intensive":[43],"and":[44,47,99,125],"time-consuming":[45],"process,":[46],"it":[48],"difficult":[50],"to":[51,67,83,95],"find":[52],"linguistically":[53],"annotated":[54],"in":[56,76,130],"sufficient":[57],"quantities.":[58],"In":[59],"this":[60],"article,":[61],"we":[62],"explore":[63],"using":[64],"parallel":[65,90],"help":[68],"solving":[69],"problem":[71],"creating":[73],"The":[79],"central":[80],"idea":[81],"annotate":[84],"English":[86],"side":[87],"corpus,":[91],"project":[92],"analysis":[94],"second":[97],"language,":[98],"then":[100,126],"train":[101],"stochastic":[103,132],"analyzer":[104],"on":[105,119],"resulting":[107],"noisy":[108],"annotations.":[109],"We":[110],"discuss":[111],"our":[112],"background":[113],"assumptions,":[114],"describe":[115],"an":[116],"initial":[117],"study":[118],"\u201cprojectability\u201d":[121],"relations,":[124],"present":[127],"two":[128],"experiments":[129],"which":[131],"developed":[135],"minimal":[137],"human":[138],"intervention":[139],"via":[140],"projection":[141],"from":[142],"English.":[143]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":6},{"year":2021,"cited_by_count":12},{"year":2020,"cited_by_count":16},{"year":2019,"cited_by_count":31},{"year":2018,"cited_by_count":13},{"year":2017,"cited_by_count":28},{"year":2016,"cited_by_count":32},{"year":2015,"cited_by_count":34},{"year":2014,"cited_by_count":29},{"year":2013,"cited_by_count":14},{"year":2012,"cited_by_count":22}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
