{"id":"https://openalex.org/W2593007760","doi":"https://doi.org/10.1162/tacl_a_00066","title":"Unsupervised Learning of Morphological Forests","display_name":"Unsupervised Learning of Morphological Forests","publication_year":2017,"publication_date":"2017-12-01","ids":{"openalex":"https://openalex.org/W2593007760","doi":"https://doi.org/10.1162/tacl_a_00066","mag":"2593007760"},"language":"en","primary_location":{"id":"doi:10.1162/tacl_a_00066","is_oa":true,"landing_page_url":"https://doi.org/10.1162/tacl_a_00066","pdf_url":"http://www.mitpressjournals.org/doi/pdf/10.1162/tacl_a_00066","source":{"id":"https://openalex.org/S2729999759","display_name":"Transactions of the Association for Computational Linguistics","issn_l":"2307-387X","issn":["2307-387X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Transactions of the Association for Computational Linguistics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"http://www.mitpressjournals.org/doi/pdf/10.1162/tacl_a_00066","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5029740891","display_name":"Jiaming Luo","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Jiaming Luo","raw_affiliation_strings":["CSAIL, MIT,"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"CSAIL, MIT,","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025205227","display_name":"Karthik Narasimhan","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Karthik Narasimhan","raw_affiliation_strings":["CSAIL, MIT,"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"CSAIL, MIT,","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5010124873","display_name":"Regina Barzilay","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Regina Barzilay","raw_affiliation_strings":["CSAIL, MIT,"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"CSAIL, MIT,","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5010124873","https://openalex.org/A5025205227","https://openalex.org/A5029740891"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.6645,"has_fulltext":true,"cited_by_count":11,"citation_normalized_percentile":{"value":0.87742297,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":97},"biblio":{"volume":"5","issue":null,"first_page":"353","last_page":"364"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7771216630935669},{"id":"https://openalex.org/keywords/affix","display_name":"Affix","score":0.6980840563774109},{"id":"https://openalex.org/keywords/integer-programming","display_name":"Integer programming","score":0.6045557856559753},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.5822011232376099},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5821820497512817},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5813446044921875},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.5577787160873413},{"id":"https://openalex.org/keywords/enhanced-data-rates-for-gsm-evolution","display_name":"Enhanced Data Rates for GSM Evolution","score":0.4955381155014038},{"id":"https://openalex.org/keywords/vocabulary","display_name":"Vocabulary","score":0.4911046028137207},{"id":"https://openalex.org/keywords/integer","display_name":"Integer (computer science)","score":0.454406201839447},{"id":"https://openalex.org/keywords/unsupervised-learning","display_name":"Unsupervised learning","score":0.4436720013618469},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4279051423072815},{"id":"https://openalex.org/keywords/root","display_name":"Root (linguistics)","score":0.4258171617984772},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.40525129437446594},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.2432040572166443}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7771216630935669},{"id":"https://openalex.org/C2778428490","wikidata":"https://www.wikidata.org/wiki/Q62155","display_name":"Affix","level":2,"score":0.6980840563774109},{"id":"https://openalex.org/C56086750","wikidata":"https://www.wikidata.org/wiki/Q6042592","display_name":"Integer programming","level":2,"score":0.6045557856559753},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.5822011232376099},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5821820497512817},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5813446044921875},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.5577787160873413},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.4955381155014038},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.4911046028137207},{"id":"https://openalex.org/C97137487","wikidata":"https://www.wikidata.org/wiki/Q729138","display_name":"Integer (computer science)","level":2,"score":0.454406201839447},{"id":"https://openalex.org/C8038995","wikidata":"https://www.wikidata.org/wiki/Q1152135","display_name":"Unsupervised learning","level":2,"score":0.4436720013618469},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4279051423072815},{"id":"https://openalex.org/C171078966","wikidata":"https://www.wikidata.org/wiki/Q111029","display_name":"Root (linguistics)","level":2,"score":0.4258171617984772},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.40525129437446594},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2432040572166443},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1162/tacl_a_00066","is_oa":true,"landing_page_url":"https://doi.org/10.1162/tacl_a_00066","pdf_url":"http://www.mitpressjournals.org/doi/pdf/10.1162/tacl_a_00066","source":{"id":"https://openalex.org/S2729999759","display_name":"Transactions of the Association for Computational Linguistics","issn_l":"2307-387X","issn":["2307-387X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Transactions of the Association for Computational Linguistics","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:bc003db1657d44ceb5f8c503354b40d6","is_oa":false,"landing_page_url":"https://doaj.org/article/bc003db1657d44ceb5f8c503354b40d6","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Transactions of the Association for Computational Linguistics, Vol 5 (2021)","raw_type":"article"},{"id":"pmh:oai:dspace.mit.edu:1721.1/111923","is_oa":true,"landing_page_url":"http://hdl.handle.net/1721.1/111923","pdf_url":null,"source":{"id":"https://openalex.org/S4306400425","display_name":"DSpace@MIT (Massachusetts Institute of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I63966007","host_organization_name":"Massachusetts Institute of Technology","host_organization_lineage":["https://openalex.org/I63966007"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Thesis"},{"id":"pmh:oai:dspace.mit.edu:1721.1/135066","is_oa":true,"landing_page_url":"https://hdl.handle.net/1721.1/135066","pdf_url":null,"source":{"id":"https://openalex.org/S4306400425","display_name":"DSpace@MIT (Massachusetts Institute of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I63966007","host_organization_name":"Massachusetts Institute of Technology","host_organization_lineage":["https://openalex.org/I63966007"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"MIT Press","raw_type":"http://purl.org/eprint/type/ConferencePaper"}],"best_oa_location":{"id":"doi:10.1162/tacl_a_00066","is_oa":true,"landing_page_url":"https://doi.org/10.1162/tacl_a_00066","pdf_url":"http://www.mitpressjournals.org/doi/pdf/10.1162/tacl_a_00066","source":{"id":"https://openalex.org/S2729999759","display_name":"Transactions of the Association for Computational Linguistics","issn_l":"2307-387X","issn":["2307-387X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Transactions of the Association for Computational Linguistics","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.6000000238418579,"display_name":"Life in Land","id":"https://metadata.un.org/sdg/15"}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2593007760.pdf","grobid_xml":"https://content.openalex.org/works/W2593007760.grobid-xml"},"referenced_works_count":29,"referenced_works":["https://openalex.org/W201532657","https://openalex.org/W309335912","https://openalex.org/W1518332699","https://openalex.org/W1582588624","https://openalex.org/W1839584883","https://openalex.org/W1975638594","https://openalex.org/W1999121513","https://openalex.org/W2053306448","https://openalex.org/W2097532276","https://openalex.org/W2103729963","https://openalex.org/W2115322217","https://openalex.org/W2116211107","https://openalex.org/W2123641849","https://openalex.org/W2126377586","https://openalex.org/W2130935327","https://openalex.org/W2137807925","https://openalex.org/W2155925463","https://openalex.org/W2172709584","https://openalex.org/W2179974023","https://openalex.org/W2211744643","https://openalex.org/W2251565024","https://openalex.org/W2252037542","https://openalex.org/W2294970769","https://openalex.org/W2295551984","https://openalex.org/W2736397884","https://openalex.org/W2950577311","https://openalex.org/W2963216505","https://openalex.org/W2964121744","https://openalex.org/W4246185962"],"related_works":["https://openalex.org/W2167062050","https://openalex.org/W1925942709","https://openalex.org/W4382645103","https://openalex.org/W2137383100","https://openalex.org/W2047683846","https://openalex.org/W2044902158","https://openalex.org/W1567360509","https://openalex.org/W2082154838","https://openalex.org/W2109912052","https://openalex.org/W1711527768"],"abstract_inverted_index":{"This":[0,17],"paper":[1],"focuses":[2],"on":[3,90],"unsupervised":[4],"modeling":[5],"of":[6,34,44,51,96],"morphological":[7,27,53,97],"families,":[8,98],"collectively":[9],"comprising":[10],"a":[11],"forest":[12],"over":[13],"the":[14,35,42,45,71,77,82,116],"language":[15],"vocabulary.":[16],"formulation":[18],"enables":[19],"us":[20],"to":[21],"capture":[22],"edge-wise":[23],"properties":[24,33,40],"reflecting":[25],"single-step":[26],"derivations,":[28],"along":[29],"with":[30,66,115],"global":[31,39,83],"distributional":[32],"entire":[36],"forest.":[37],"These":[38],"constrain":[41],"size":[43],"affix":[46],"set":[47],"and":[48,81,99],"encourage":[49],"formation":[50],"tight":[52],"families.":[54],"The":[55],"resulting":[56],"objective":[57],"is":[58],"solved":[59],"using":[60],"Integer":[61],"Linear":[62],"Programming":[63],"(ILP)":[64],"paired":[65],"contrastive":[67],"estimation.":[68],"We":[69,86],"train":[70],"model":[72,80,106],"by":[73],"alternating":[74],"between":[75],"optimizing":[76],"local":[78],"log-linear":[79],"ILP":[84],"objective.":[85],"evaluate":[87],"our":[88,105],"system":[89],"three":[91,112],"tasks:":[92],"root":[93],"detection,":[94],"clustering":[95],"segmentation.":[100],"Our":[101],"experiments":[102],"demonstrate":[103],"that":[104],"yields":[107],"consistent":[108],"gains":[109],"in":[110],"all":[111],"tasks":[113],"compared":[114],"best":[117],"published":[118],"results.":[119]},"counts_by_year":[{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":3}],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2025-10-10T00:00:00"}
