{"id":"https://openalex.org/W2763322166","doi":"https://doi.org/10.1145/3132847.3133023","title":"Unsupervised Concept Categorization and Extraction from Scientific Document Titles","display_name":"Unsupervised Concept Categorization and Extraction from Scientific Document Titles","publication_year":2017,"publication_date":"2017-11-06","ids":{"openalex":"https://openalex.org/W2763322166","doi":"https://doi.org/10.1145/3132847.3133023","mag":"2763322166"},"language":"en","primary_location":{"id":"doi:10.1145/3132847.3133023","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3132847.3133023","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2017 ACM on Conference on Information and Knowledge Management","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/1710.02271.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5110529898","display_name":"Adit Krishnan","orcid":null},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Adit Krishnan","raw_affiliation_strings":["University of Illinois at Urbana-Champaign, Urbana-Champaign, IL, USA","University of Illinois at Urbana\u2013Champaign, Urbana, Champaign, IL, USA"],"affiliations":[{"raw_affiliation_string":"University of Illinois at Urbana-Champaign, Urbana-Champaign, IL, USA","institution_ids":["https://openalex.org/I157725225"]},{"raw_affiliation_string":"University of Illinois at Urbana\u2013Champaign, Urbana, Champaign, IL, USA","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103854691","display_name":"Aravind Sankar","orcid":null},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Aravind Sankar","raw_affiliation_strings":["University of Illinois at Urbana-Champaign, Urbana-Champaign, IL, USA","University of Illinois at Urbana\u2013Champaign, Urbana, Champaign, IL, USA"],"affiliations":[{"raw_affiliation_string":"University of Illinois at Urbana-Champaign, Urbana-Champaign, IL, USA","institution_ids":["https://openalex.org/I157725225"]},{"raw_affiliation_string":"University of Illinois at Urbana\u2013Champaign, Urbana, Champaign, IL, USA","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077700761","display_name":"Shi Zhi","orcid":null},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shi Zhi","raw_affiliation_strings":["University of Illinois at Urbana-Champaign, Urbana-Champaign, IL, USA","University of Illinois at Urbana\u2013Champaign, Urbana, Champaign, IL, USA"],"affiliations":[{"raw_affiliation_string":"University of Illinois at Urbana-Champaign, Urbana-Champaign, IL, USA","institution_ids":["https://openalex.org/I157725225"]},{"raw_affiliation_string":"University of Illinois at Urbana\u2013Champaign, Urbana, Champaign, IL, USA","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5019539533","display_name":"Jiawei Han","orcid":"https://orcid.org/0000-0002-3629-2696"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jiawei Han","raw_affiliation_strings":["University of Illinois at Urbana-Champaign, Urbana-Champaign, IL, USA","University of Illinois at Urbana\u2013Champaign, Urbana, Champaign, IL, USA"],"affiliations":[{"raw_affiliation_string":"University of Illinois at Urbana-Champaign, Urbana-Champaign, IL, USA","institution_ids":["https://openalex.org/I157725225"]},{"raw_affiliation_string":"University of Illinois at Urbana\u2013Champaign, Urbana, Champaign, IL, USA","institution_ids":["https://openalex.org/I157725225"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5110529898"],"corresponding_institution_ids":["https://openalex.org/I157725225"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.13690163,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1339","last_page":"1348"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9925000071525574,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8247514367103577},{"id":"https://openalex.org/keywords/categorization","display_name":"Categorization","score":0.7440774440765381},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.5688628554344177},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.567842960357666},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5251787900924683},{"id":"https://openalex.org/keywords/information-extraction","display_name":"Information extraction","score":0.5078290104866028},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.48102647066116333},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4742816090583801},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.47232574224472046},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.436636358499527},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.4210784435272217},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.41332268714904785},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4040152430534363},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.35012710094451904}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8247514367103577},{"id":"https://openalex.org/C94124525","wikidata":"https://www.wikidata.org/wiki/Q912550","display_name":"Categorization","level":2,"score":0.7440774440765381},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.5688628554344177},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.567842960357666},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5251787900924683},{"id":"https://openalex.org/C195807954","wikidata":"https://www.wikidata.org/wiki/Q1662562","display_name":"Information extraction","level":2,"score":0.5078290104866028},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.48102647066116333},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4742816090583801},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.47232574224472046},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.436636358499527},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.4210784435272217},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.41332268714904785},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4040152430534363},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.35012710094451904},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3132847.3133023","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3132847.3133023","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2017 ACM on Conference on Information and Knowledge Management","raw_type":"proceedings-article"},{"id":"mag:2763322166","is_oa":true,"landing_page_url":"https://arxiv.org/pdf/1710.02271.pdf","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null}],"best_oa_location":{"id":"mag:2763322166","is_oa":true,"landing_page_url":"https://arxiv.org/pdf/1710.02271.pdf","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},"sustainable_development_goals":[{"score":0.5799999833106995,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":12,"referenced_works":["https://openalex.org/W2061922307","https://openalex.org/W2101964309","https://openalex.org/W2133108446","https://openalex.org/W2133580306","https://openalex.org/W2134368421","https://openalex.org/W2150815390","https://openalex.org/W2178628967","https://openalex.org/W2223881431","https://openalex.org/W2325923789","https://openalex.org/W2336224400","https://openalex.org/W2339514589","https://openalex.org/W2538360111"],"related_works":["https://openalex.org/W2962809787","https://openalex.org/W3099330776","https://openalex.org/W2557826550","https://openalex.org/W2782221572","https://openalex.org/W2402743087","https://openalex.org/W3128068256","https://openalex.org/W3176396223","https://openalex.org/W2189067371","https://openalex.org/W2467816047","https://openalex.org/W2989102449","https://openalex.org/W1984865283","https://openalex.org/W2251841523","https://openalex.org/W142048424","https://openalex.org/W2034056228","https://openalex.org/W2508644674","https://openalex.org/W3141012936","https://openalex.org/W3020880053","https://openalex.org/W3152908328","https://openalex.org/W2294607801","https://openalex.org/W1865748020"],"abstract_inverted_index":{"This":[0],"paper":[1],"studies":[2],"the":[3,29,64,109,117,135,139,180],"automated":[4],"categorization":[5],"and":[6,27,44,50,80,101,164],"extraction":[7,171],"of":[8,13,23,31,57,67,179],"scientific":[9,14,162],"concepts":[10],"from":[11,134,160],"titles":[12],"articles,":[15],"in":[16,105,148],"order":[17],"to":[18,48,84,96,128,157],"gain":[19],"a":[20,32,72,149,176],"deeper":[21],"understanding":[22],"their":[24],"key":[25,52],"contributions":[26],"facilitate":[28],"construction":[30],"generic":[33],"academic":[34,103],"knowledgebase.":[35],"Towards":[36],"this":[37,94],"goal,":[38],"we":[39,70,120],"propose":[40,121],"an":[41,122],"unsupervised,":[42],"domain-independent,":[43],"scalable":[45],"two-phase":[46],"algorithm":[47,69],"type":[49],"extract":[51,129],"concept":[53,132,170],"mentions":[54,133],"into":[55,89],"aspects":[56],"interest":[58],"(e.g.,":[59],"Techniques,":[60],"Applications,":[61],"etc.).":[62],"In":[63,116],"first":[65],"phase":[66],"our":[68,155],"proposePhraseType,":[71],"probabilistic":[73],"generative":[74],"model":[75,95],"which":[76],"exploits":[77],"textual":[78],"features":[79,100],"limited":[81],"POS":[82],"tags":[83],"broadly":[85],"segment":[86],"text":[87],"snippets":[88],"aspect-typed":[90,136],"phrases.":[91],"We":[92,153,173],"extend":[93],"simultaneously":[97],"learn":[98],"aspect-specific":[99],"identify":[102],"domains":[104,163],"multi-domain":[106],"corpora,":[107],"since":[108],"two":[110],"tasks":[111],"mutually":[112],"enhance":[113],"each":[114],"other.":[115],"second":[118],"phase,":[119],"approach":[123],"based":[124],"on":[125],"adaptor":[126],"grammars":[127],"fine":[130],"grained":[131],"phrases":[137],"without":[138],"need":[140],"for":[141],"any":[142],"external":[143],"resources":[144],"or":[145],"human":[146],"effort,":[147],"purely":[150],"data-driven":[151],"manner.":[152],"apply":[154],"technique":[156],"study":[158],"literature":[159],"diverse":[161],"show":[165],"significant":[166],"gains":[167],"over":[168],"state-of-the-art":[169],"techniques.":[172],"also":[174],"present":[175],"qualitative":[177],"analysis":[178],"results":[181],"obtained.":[182]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
