{"id":"https://openalex.org/W6922228622","doi":"https://doi.org/10.1184/r1/21699629.v1","title":"Knowledge-Aware Natural Language Understanding","display_name":"Knowledge-Aware Natural Language Understanding","publication_year":2022,"publication_date":"2022-01-01","ids":{"openalex":"https://openalex.org/W6922228622","doi":"https://doi.org/10.1184/r1/21699629.v1"},"language":"en","primary_location":{"id":"pmh:oai:figshare.com:article/21699629","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4377196282","display_name":"Figshare","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210132348","host_organization_name":"Figshare (United Kingdom)","host_organization_lineage":["https://openalex.org/I4210132348"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Text"},"type":"article","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Dasigi, Pradeep","orcid":null},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Dasigi, Pradeep","raw_affiliation_strings":["Carnegie Mellon University"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University","institution_ids":["https://openalex.org/I74973139"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I74973139"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.26485976,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.3353999853134155,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.3353999853134155,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.24719999730587006,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.1412000060081482,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.7669000029563904},{"id":"https://openalex.org/keywords/wordnet","display_name":"WordNet","score":0.6255000233650208},{"id":"https://openalex.org/keywords/natural-language-understanding","display_name":"Natural language understanding","score":0.5403000116348267},{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.5001999735832214},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.48410001397132874},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.4699000120162964},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.45080000162124634},{"id":"https://openalex.org/keywords/meaning","display_name":"Meaning (existential)","score":0.41830000281333923},{"id":"https://openalex.org/keywords/commonsense-knowledge","display_name":"Commonsense knowledge","score":0.39010000228881836}],"concepts":[{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.7669000029563904},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7318000197410583},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6299999952316284},{"id":"https://openalex.org/C157659113","wikidata":"https://www.wikidata.org/wiki/Q533822","display_name":"WordNet","level":2,"score":0.6255000233650208},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5715000033378601},{"id":"https://openalex.org/C2779439875","wikidata":"https://www.wikidata.org/wiki/Q1078276","display_name":"Natural language understanding","level":3,"score":0.5403000116348267},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.5001999735832214},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.48410001397132874},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.4699000120162964},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.45080000162124634},{"id":"https://openalex.org/C2780876879","wikidata":"https://www.wikidata.org/wiki/Q3054749","display_name":"Meaning (existential)","level":2,"score":0.41830000281333923},{"id":"https://openalex.org/C30542707","wikidata":"https://www.wikidata.org/wiki/Q1603203","display_name":"Commonsense knowledge","level":3,"score":0.39010000228881836},{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.3849000036716461},{"id":"https://openalex.org/C28076734","wikidata":"https://www.wikidata.org/wiki/Q63087","display_name":"Coreference","level":3,"score":0.384799987077713},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.3734999895095825},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.36910000443458557},{"id":"https://openalex.org/C2776224158","wikidata":"https://www.wikidata.org/wiki/Q187931","display_name":"Phrase","level":2,"score":0.35190001130104065},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.3434999883174896},{"id":"https://openalex.org/C2777532361","wikidata":"https://www.wikidata.org/wiki/Q687185","display_name":"Lexicalization","level":2,"score":0.31220000982284546},{"id":"https://openalex.org/C189950617","wikidata":"https://www.wikidata.org/wiki/Q937228","display_name":"Property (philosophy)","level":2,"score":0.31130000948905945},{"id":"https://openalex.org/C153962237","wikidata":"https://www.wikidata.org/wiki/Q1401131","display_name":"Noun phrase","level":3,"score":0.29339998960494995},{"id":"https://openalex.org/C67277372","wikidata":"https://www.wikidata.org/wiki/Q7449085","display_name":"Semantic role labeling","level":3,"score":0.2888999879360199},{"id":"https://openalex.org/C2776608160","wikidata":"https://www.wikidata.org/wiki/Q4785462","display_name":"Natural (archaeology)","level":2,"score":0.2784999907016754},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.2770000100135803},{"id":"https://openalex.org/C126706616","wikidata":"https://www.wikidata.org/wiki/Q2944660","display_name":"Lexical item","level":2,"score":0.2750000059604645},{"id":"https://openalex.org/C98954769","wikidata":"https://www.wikidata.org/wiki/Q1759657","display_name":"Lexical semantics","level":3,"score":0.2743000090122223},{"id":"https://openalex.org/C25810664","wikidata":"https://www.wikidata.org/wiki/Q44325","display_name":"Ontology","level":2,"score":0.26579999923706055},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.26249998807907104},{"id":"https://openalex.org/C2983448237","wikidata":"https://www.wikidata.org/wiki/Q1078276","display_name":"Language understanding","level":2,"score":0.25519999861717224},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.251800000667572}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:figshare.com:article/21699629","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4377196282","display_name":"Figshare","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210132348","host_organization_name":"Figshare (United Kingdom)","host_organization_lineage":["https://openalex.org/I4210132348"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Text"},{"id":"doi:10.1184/r1/21699629.v1","is_oa":true,"landing_page_url":"https://doi.org/10.1184/r1/21699629.v1","pdf_url":null,"source":{"id":"https://openalex.org/S7407050927","display_name":"KiltHub Repository","issn_l":null,"issn":[],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article-journal"}],"best_oa_location":{"id":"pmh:oai:figshare.com:article/21699629","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4377196282","display_name":"Figshare","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210132348","host_organization_name":"Figshare (United Kingdom)","host_organization_lineage":["https://openalex.org/I4210132348"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Text"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.7172660231590271,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Natural":[0],"Language":[1],"Understanding":[2],"(NLU)":[3],"systems":[4,116],"need":[5,560],"to":[6,62,97,112,155,177,225,281,291,406,421,429,463,535],"encode":[7,118,207,292],"human":[8,188],"generated":[9],"text":[10],"(or":[11,38,354],"speech)":[12],"and":[13,68,89,103,125,210,253,294,342,370,432,446,479,503,510,541,546,564],"reason":[14,63,126],"over":[15,64,387],"it":[16,384],"at":[17,248,259,301,324],"a":[18,60,404,417,434,496],"deep":[19],"semantic":[20,278,339,374,413,473],"level.":[21],"Any":[22],"NLU":[23,115,500,573],"system":[24],"typically":[25],"involves":[26,385],"two":[27,91,212,484,507],"main":[28],"components:":[29],"The":[30,106,135,313,549],"first":[31,136],"is":[32,111,184,191],"an":[33,388],"<strong>encoder</strong>,":[34],"which":[35,50,183],"composes":[36],"words":[37,159],"other":[39,164,572],"basic":[40],"linguistic":[41],"units)":[42],"within":[43],"the":[44,57,65,70,76,83,99,130,139,196,204,262,343,350,365,408,412,423,448,451,457,506,518,537,553,559],"input":[45,430],"utterances":[46,77],"compute":[47],"encoded":[48,66],"representations,":[49],"are":[51,163,169,175,299,524],"then":[52],"used":[53,154],"as":[54,333,505,533],"features":[55],"in":[56,129,160,195,304,358,489,521,544],"second":[58,314],"component,":[59],"<strong>predictor</strong>,":[61],"inputs":[67,119],"produce":[69],"desired":[71],"output.":[72],"We":[73,198,232,270,287,322,361,467],"argue":[74],"that":[75,117,168,296,439,475],"themselves":[78],"do":[79,362],"not":[80,192,363],"contain":[81],"all":[82],"information":[84,182],"needed":[85,96],"for":[86,149,214,443,472,499,552,558,561,566,571],"understanding":[87,527],"them":[88,128],"identify":[90],"kinds":[92],"of":[93,108,132,138,158,166,171,186,230,335,352,367,392,411,425,450,539],"additional":[94,512,562],"knowledge":[95,189,222,265,458,513,543],"fill":[98],"gaps:":[100],"<strong>background":[101],"knowledge</strong>":[102],"<strong>contextual":[104],"knowledge</strong>.":[105],"goal":[107],"this":[109,200,289,493,522],"thesis":[110,140,494,523],"build":[113,371,468],"end-to-end":[114],"along":[120],"with":[121,142,283,319,380,397,501],"relevant":[122],"background":[123,144,208,264,540],"knowledge,":[124,209,563],"about":[127],"presence":[131],"contextual":[133,320,542],"knowledge.":[134,145,321],"part":[137,185,315],"deals":[141],"encoding":[143,150,502,545],"While":[146,517],"distributional":[147],"methods":[148],"sentences":[151],"have":[152],"been":[153],"represent":[156],"meaning":[157],"context,":[161],"there":[162],"aspects":[165],"semantics":[167],"out":[170],"their":[172,277],"reach.":[173],"These":[174],"related":[176],"commonsense":[178],"or":[179],"real":[180],"world":[181],"shared":[187],"but":[190],"explicitly":[193],"present":[194,211],"input.":[197],"address":[199],"limitation":[201],"by":[202,311,348],"having":[203],"encoders":[205],"also":[206,531],"approaches":[213],"doing":[215],"so.":[216],"First,":[217],"we":[218,257,400],"leverage":[219],"explicit":[220],"symbolic":[221],"from":[223,459],"WordNet":[224],"learn":[226],"ontology-grounded":[227],"token-level":[228],"representations":[229,240,298,309],"words.":[231],"show":[233,295,480],"sentence":[234,308],"encodings":[235],"based":[236,243],"on":[237,244,276,317,483],"our":[238],"token":[239],"outperform":[241],"those":[242],"off-the-shelf":[245],"word":[246],"embeddings":[247],"predicting":[249],"prepositional":[250],"phrase":[251],"attachment":[252],"textual":[254],"entailment.":[255],"Second,":[256],"look":[258,323],"cases":[260],"where":[261,328],"required":[263],"cannot":[266],"be":[267,331,346],"stated":[268],"symbolically.":[269],"model":[271,290],"selectional":[272],"restrictions":[273],"verbs":[274],"place":[275],"role":[279,538],"fillers":[280],"deal":[282,396],"one":[284],"such":[285],"case.":[286],"use":[288,476],"events,":[293],"these":[297,398,477],"better":[300],"detecting":[302],"anomalies":[303],"newswire":[305],"texts":[306],"than":[307],"produced":[310,426],"LSTMs.":[312],"focuses":[316],"reasoning":[318,329,504,547],"Question-Answering":[325],"(QA)":[326],"tasks":[327,487,519,554],"can":[330,345,514],"expressed":[332],"sequences":[334],"discrete":[336],"operations,":[337],"(i.e.":[338],"parsing":[340,474],"problems),":[341],"answer":[344],"obtained":[347],"executing":[349],"sequence":[351],"operations":[353],"logical":[355,368,393,427,444,461],"form)":[356],"grounded":[357,488],"some":[359],"context.":[360],"assume":[364],"availability":[366],"forms,":[369,445],"weakly":[372],"supervised":[373],"parsers.":[375],"This":[376],"training":[377,437],"setup":[378],"comes":[379],"significant":[381],"challenges":[382,528],"since":[383],"searching":[386,442],"exponentially":[389],"large":[390],"space":[391,410],"forms.":[394],"To":[395],"challenges,":[399],"propose":[401],"1)":[402],"using":[403],"grammar":[405],"constrain":[407],"output":[409],"parser;":[414],"2)":[415],"leveraging":[416],"lexical":[418],"coverage":[419],"measure":[420],"ensure":[422],"relevance":[424],"forms":[428,462],"utterances;":[431],"3)":[433],"novel":[435],"iterative":[436],"scheme":[438],"alternates":[440],"between":[441],"maximizing":[447],"likelihood":[449],"retrieved":[452],"ones,":[453],"thus":[454],"effectively":[455],"transferring":[456],"simpler":[460],"more":[464],"complex":[465,485],"ones.":[466],"neural":[469],"encoder-decoder":[470],"models":[471,550,570],"techniques,":[478],"state-of-the-art":[481],"results":[482],"QA":[486],"structured":[490],"contexts":[491],"Overall,":[492],"presents":[495],"general":[497],"framework":[498],"core":[508],"components,":[509],"how":[511],"augment":[515],"them.":[516],"presented":[520],"hard":[525],"language":[526],"themselves,":[529],"they":[530],"serve":[532],"examples":[534],"highlight":[536],"components.":[548],"built":[551],"provide":[555],"empirical":[556],"evidence":[557],"pointers":[565],"building":[567],"effective":[568],"knowledge-aware":[569],"tasks.":[574]},"counts_by_year":[],"updated_date":"2026-02-12T00:53:03.260389","created_date":"2025-10-10T00:00:00"}
