{"id":"https://openalex.org/W2894088664","doi":"https://doi.org/10.18653/v1/k18-1001","title":"Embedded-State Latent Conditional Random Fields for Sequence Labeling","display_name":"Embedded-State Latent Conditional Random Fields for Sequence Labeling","publication_year":2018,"publication_date":"2018-01-01","ids":{"openalex":"https://openalex.org/W2894088664","doi":"https://doi.org/10.18653/v1/k18-1001","mag":"2894088664"},"language":"en","primary_location":{"id":"doi:10.18653/v1/k18-1001","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/k18-1001","pdf_url":"https://www.aclweb.org/anthology/K18-1001.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 22nd Conference on Computational Natural Language Learning","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.aclweb.org/anthology/K18-1001.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5041743374","display_name":"Dung Thai","orcid":null},"institutions":[{"id":"https://openalex.org/I24603500","display_name":"University of Massachusetts Amherst","ror":"https://ror.org/0072zz521","country_code":"US","type":"education","lineage":["https://openalex.org/I24603500"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Dung Thai","raw_affiliation_strings":["College of Information and Computer Sciences University of Massachusetts Amherst","University of Massachusetts Amherst, Amherst Center, United States"],"affiliations":[{"raw_affiliation_string":"College of Information and Computer Sciences University of Massachusetts Amherst","institution_ids":["https://openalex.org/I24603500"]},{"raw_affiliation_string":"University of Massachusetts Amherst, Amherst Center, United States","institution_ids":["https://openalex.org/I24603500"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078996717","display_name":"Sree Harsha Ramesh","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sree Harsha Ramesh","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054587391","display_name":"Shikhar Murty","orcid":null},"institutions":[{"id":"https://openalex.org/I64295750","display_name":"Indian Institute of Technology Indore","ror":"https://ror.org/01hhf7w52","country_code":"IN","type":"education","lineage":["https://openalex.org/I64295750"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Shikhar Murty","raw_affiliation_strings":["Indian Institute of Technology Indore, Indore, India"],"affiliations":[{"raw_affiliation_string":"Indian Institute of Technology Indore, Indore, India","institution_ids":["https://openalex.org/I64295750"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016501970","display_name":"Luke Vilnis","orcid":null},"institutions":[{"id":"https://openalex.org/I24603500","display_name":"University of Massachusetts Amherst","ror":"https://ror.org/0072zz521","country_code":"US","type":"education","lineage":["https://openalex.org/I24603500"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Luke Vilnis","raw_affiliation_strings":["College of Information and Computer Sciences University of Massachusetts Amherst","University of Massachusetts Amherst, Amherst Center, United States"],"affiliations":[{"raw_affiliation_string":"College of Information and Computer Sciences University of Massachusetts Amherst","institution_ids":["https://openalex.org/I24603500"]},{"raw_affiliation_string":"University of Massachusetts Amherst, Amherst Center, United States","institution_ids":["https://openalex.org/I24603500"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5107835063","display_name":"Andrew McCallum","orcid":null},"institutions":[{"id":"https://openalex.org/I24603500","display_name":"University of Massachusetts Amherst","ror":"https://ror.org/0072zz521","country_code":"US","type":"education","lineage":["https://openalex.org/I24603500"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Andrew McCallum","raw_affiliation_strings":["College of Information and Computer Sciences University of Massachusetts Amherst","University of Massachusetts Amherst, Amherst Center, United States"],"affiliations":[{"raw_affiliation_string":"College of Information and Computer Sciences University of Massachusetts Amherst","institution_ids":["https://openalex.org/I24603500"]},{"raw_affiliation_string":"University of Massachusetts Amherst, Amherst Center, United States","institution_ids":["https://openalex.org/I24603500"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5041743374"],"corresponding_institution_ids":["https://openalex.org/I24603500"],"apc_list":null,"apc_paid":null,"fwci":0.39712492,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.67849856,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"10"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9945999979972839,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.7160613536834717},{"id":"https://openalex.org/keywords/conditional-random-field","display_name":"Conditional random field","score":0.687480628490448},{"id":"https://openalex.org/keywords/graphical-model","display_name":"Graphical model","score":0.6351439952850342},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5960226058959961},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5538769364356995},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.5386815667152405},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.5358847975730896},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.5339995622634888},{"id":"https://openalex.org/keywords/sequence-labeling","display_name":"Sequence labeling","score":0.5283278226852417},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5238480567932129},{"id":"https://openalex.org/keywords/markov-chain","display_name":"Markov chain","score":0.4501972198486328},{"id":"https://openalex.org/keywords/recurrent-neural-network","display_name":"Recurrent neural network","score":0.4480217695236206},{"id":"https://openalex.org/keywords/rank","display_name":"Rank (graph theory)","score":0.4380667209625244},{"id":"https://openalex.org/keywords/structured-prediction","display_name":"Structured prediction","score":0.4294532239437103},{"id":"https://openalex.org/keywords/approximate-inference","display_name":"Approximate inference","score":0.42866310477256775},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.42844706773757935},{"id":"https://openalex.org/keywords/simple","display_name":"Simple (philosophy)","score":0.4280407726764679},{"id":"https://openalex.org/keywords/hidden-markov-model","display_name":"Hidden Markov model","score":0.41510629653930664},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.37657076120376587},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3048381805419922},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.25016841292381287},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.21766218543052673}],"concepts":[{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.7160613536834717},{"id":"https://openalex.org/C152565575","wikidata":"https://www.wikidata.org/wiki/Q1124538","display_name":"Conditional random field","level":2,"score":0.687480628490448},{"id":"https://openalex.org/C155846161","wikidata":"https://www.wikidata.org/wiki/Q1143367","display_name":"Graphical model","level":2,"score":0.6351439952850342},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5960226058959961},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5538769364356995},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.5386815667152405},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.5358847975730896},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.5339995622634888},{"id":"https://openalex.org/C35639132","wikidata":"https://www.wikidata.org/wiki/Q7452468","display_name":"Sequence labeling","level":3,"score":0.5283278226852417},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5238480567932129},{"id":"https://openalex.org/C98763669","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov chain","level":2,"score":0.4501972198486328},{"id":"https://openalex.org/C147168706","wikidata":"https://www.wikidata.org/wiki/Q1457734","display_name":"Recurrent neural network","level":3,"score":0.4480217695236206},{"id":"https://openalex.org/C164226766","wikidata":"https://www.wikidata.org/wiki/Q7293202","display_name":"Rank (graph theory)","level":2,"score":0.4380667209625244},{"id":"https://openalex.org/C22367795","wikidata":"https://www.wikidata.org/wiki/Q7625208","display_name":"Structured prediction","level":2,"score":0.4294532239437103},{"id":"https://openalex.org/C2777472644","wikidata":"https://www.wikidata.org/wiki/Q16968992","display_name":"Approximate inference","level":3,"score":0.42866310477256775},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.42844706773757935},{"id":"https://openalex.org/C2780586882","wikidata":"https://www.wikidata.org/wiki/Q7520643","display_name":"Simple (philosophy)","level":2,"score":0.4280407726764679},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.41510629653930664},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.37657076120376587},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3048381805419922},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.25016841292381287},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.21766218543052673},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.18653/v1/k18-1001","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/k18-1001","pdf_url":"https://www.aclweb.org/anthology/K18-1001.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 22nd Conference on Computational Natural Language Learning","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:1809.10835","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1809.10835","pdf_url":"https://arxiv.org/pdf/1809.10835","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"mag:2894088664","is_oa":true,"landing_page_url":"https://arxiv.org/pdf/1809.10835.pdf","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"doi:10.48550/arxiv.1809.10835","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.1809.10835","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.18653/v1/k18-1001","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/k18-1001","pdf_url":"https://www.aclweb.org/anthology/K18-1001.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 22nd Conference on Computational Natural Language Learning","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2894088664.pdf","grobid_xml":"https://content.openalex.org/works/W2894088664.grobid-xml"},"referenced_works_count":23,"referenced_works":["https://openalex.org/W1481355931","https://openalex.org/W1903393809","https://openalex.org/W2086161653","https://openalex.org/W2109651326","https://openalex.org/W2117497855","https://openalex.org/W2132678463","https://openalex.org/W2133510715","https://openalex.org/W2147196093","https://openalex.org/W2158823144","https://openalex.org/W2160815625","https://openalex.org/W2161236525","https://openalex.org/W2172099713","https://openalex.org/W2250539671","https://openalex.org/W2251830157","https://openalex.org/W2296283641","https://openalex.org/W2412782625","https://openalex.org/W2625885504","https://openalex.org/W2899771611","https://openalex.org/W2952230511","https://openalex.org/W2964076774","https://openalex.org/W2964121744","https://openalex.org/W2964205912","https://openalex.org/W2964308564"],"related_works":["https://openalex.org/W2963744612","https://openalex.org/W2948166700","https://openalex.org/W1706732857","https://openalex.org/W3167569698","https://openalex.org/W2766236296","https://openalex.org/W2834136616","https://openalex.org/W3186814551","https://openalex.org/W3171932471","https://openalex.org/W2769275980","https://openalex.org/W2979915069","https://openalex.org/W3166703191","https://openalex.org/W1826694107","https://openalex.org/W2464714129","https://openalex.org/W3034097097","https://openalex.org/W2248934801","https://openalex.org/W2994486311","https://openalex.org/W2796075534","https://openalex.org/W2397771106","https://openalex.org/W3114760901","https://openalex.org/W2986440166"],"abstract_inverted_index":{"Complex":[0],"textual":[1],"information":[2],"extraction":[3],"tasks":[4],"are":[5,16,216],"often":[6,77],"posed":[7],"as":[8,52,89],"sequence":[9,118],"labeling":[10],"or":[11,101],"\\emph{shallow":[12],"parsing},":[13],"where":[14],"fields":[15],"extracted":[17,46],"using":[18,43],"local":[19,115],"labels":[20],"made":[21],"consistent":[22,56],"through":[23,58],"probabilistic":[24],"inference":[25,177,191],"in":[26,102,134],"a":[27,59,90,96,127],"graphical":[28,72,129],"model":[29,73,130,139,207],"with":[30,126,159,200],"constrained":[31],"transitions.":[32],"Recently,":[33],"it":[34],"has":[35],"become":[36],"common":[37],"to":[38,123,146],"locally":[39],"parametrize":[40],"these":[41],"models":[42,211],"rich":[44,181],"features":[45,116],"by":[47],"recurrent":[48],"neural":[49],"networks":[50],"(such":[51],"LSTM),":[53],"while":[54],"enforcing":[55],"outputs":[57],"simple":[60,71],"linear-chain":[61],"model,":[62],"representing":[63],"Markovian":[64],"dependencies":[65],"between":[66,81],"successive":[67],"labels.":[68,83],"However,":[69],"the":[70,76,103,135,142,180,185,206,222],"structure":[74],"belies":[75],"complex":[78],"non-local":[79,195],"constraints":[80,215],"output":[82,136,152,196,214],"For":[84],"example,":[85],"many":[86],"fields,":[87],"such":[88],"first":[91],"name,":[92],"can":[93],"only":[94],"occur":[95],"fixed":[97],"number":[98],"of":[99,105,131,176,184],"times,":[100],"presence":[104],"other":[106],"fields.":[107],"While":[108],"RNNs":[109],"have":[110,121],"provided":[111],"increasingly":[112],"powerful":[113],"context-aware":[114],"for":[117,169],"tagging,":[119],"they":[120],"yet":[122],"be":[124],"integrated":[125],"global":[128,190,213],"similar":[132],"expressivity":[133],"distribution.":[137],"Our":[138],"goes":[140],"beyond":[141],"linear":[143],"chain":[144],"CRF":[145],"incorporate":[147],"multiple":[148],"hidden":[149,170],"states":[150],"per":[151],"label,":[153],"but":[154],"parametrizes":[155],"their":[156],"transitions":[157],"parsimoniously":[158],"low-rank":[160],"log-potential":[161],"scoring":[162],"matrices,":[163],"effectively":[164],"learning":[165],"an":[166],"embedding":[167],"space":[168,175],"states.":[171],"This":[172],"augmented":[173],"latent":[174,224],"variables":[178],"complements":[179],"feature":[182],"representation":[183],"RNN,":[186],"and":[187,203,220],"allows":[188],"exact":[189],"obeying":[192],"complex,":[193],"learned":[194],"constraints.":[197],"We":[198],"experiment":[199],"several":[201],"datasets":[202],"show":[204],"that":[205],"outperforms":[208],"baseline":[209],"CRF+RNN":[210],"when":[212],"necessary":[217],"at":[218],"inference-time,":[219],"explore":[221],"interpretable":[223],"structure.":[225]},"counts_by_year":[{"year":2020,"cited_by_count":2}],"updated_date":"2026-02-09T09:26:11.010843","created_date":"2025-10-10T00:00:00"}
