{"id":"https://openalex.org/W2964864162","doi":"https://doi.org/10.1021/acs.jcim.9b00470","title":"Named Entity Recognition and Normalization Applied to Large-Scale Information Extraction from the Materials Science Literature","display_name":"Named Entity Recognition and Normalization Applied to Large-Scale Information Extraction from the Materials Science Literature","publication_year":2019,"publication_date":"2019-07-30","ids":{"openalex":"https://openalex.org/W2964864162","doi":"https://doi.org/10.1021/acs.jcim.9b00470","mag":"2964864162","pmid":"https://pubmed.ncbi.nlm.nih.gov/31361962"},"language":"en","primary_location":{"id":"doi:10.1021/acs.jcim.9b00470","is_oa":false,"landing_page_url":"https://doi.org/10.1021/acs.jcim.9b00470","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://www.osti.gov/servlets/purl/1581363","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5051902238","display_name":"Leigh Weston","orcid":"https://orcid.org/0000-0002-3973-0161"},"institutions":[{"id":"https://openalex.org/I148283060","display_name":"Lawrence Berkeley National Laboratory","ror":"https://ror.org/02jbv0t02","country_code":"US","type":"facility","lineage":["https://openalex.org/I1330989302","https://openalex.org/I148283060","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"L. Weston","raw_affiliation_strings":["Energy Technologies Area and Lawrence Berkeley National Laboratory, 1 Cyclotron Road, Berkeley, California 94720, United States"],"affiliations":[{"raw_affiliation_string":"Energy Technologies Area and Lawrence Berkeley National Laboratory, 1 Cyclotron Road, Berkeley, California 94720, United States","institution_ids":["https://openalex.org/I148283060"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016150069","display_name":"Vahe Tshitoyan","orcid":"https://orcid.org/0000-0003-4518-2314"},"institutions":[{"id":"https://openalex.org/I148283060","display_name":"Lawrence Berkeley National Laboratory","ror":"https://ror.org/02jbv0t02","country_code":"US","type":"facility","lineage":["https://openalex.org/I1330989302","https://openalex.org/I148283060","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"V. Tshitoyan","raw_affiliation_strings":["Materials Science Division and Lawrence Berkeley National Laboratory, 1 Cyclotron Road, Berkeley, California 94720, United States"],"affiliations":[{"raw_affiliation_string":"Materials Science Division and Lawrence Berkeley National Laboratory, 1 Cyclotron Road, Berkeley, California 94720, United States","institution_ids":["https://openalex.org/I148283060"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024396096","display_name":"John Dagdelen","orcid":"https://orcid.org/0000-0003-2181-4815"},"institutions":[{"id":"https://openalex.org/I148283060","display_name":"Lawrence Berkeley National Laboratory","ror":"https://ror.org/02jbv0t02","country_code":"US","type":"facility","lineage":["https://openalex.org/I1330989302","https://openalex.org/I148283060","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"J. Dagdelen","raw_affiliation_strings":["Energy Technologies Area and Lawrence Berkeley National Laboratory, 1 Cyclotron Road, Berkeley, California 94720, United States"],"affiliations":[{"raw_affiliation_string":"Energy Technologies Area and Lawrence Berkeley National Laboratory, 1 Cyclotron Road, Berkeley, California 94720, United States","institution_ids":["https://openalex.org/I148283060"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046633150","display_name":"Olga Kononova","orcid":"https://orcid.org/0000-0001-9267-312X"},"institutions":[{"id":"https://openalex.org/I148283060","display_name":"Lawrence Berkeley National Laboratory","ror":"https://ror.org/02jbv0t02","country_code":"US","type":"facility","lineage":["https://openalex.org/I1330989302","https://openalex.org/I148283060","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"O. Kononova","raw_affiliation_strings":["Materials Science Division and Lawrence Berkeley National Laboratory, 1 Cyclotron Road, Berkeley, California 94720, United States"],"affiliations":[{"raw_affiliation_string":"Materials Science Division and Lawrence Berkeley National Laboratory, 1 Cyclotron Road, Berkeley, California 94720, United States","institution_ids":["https://openalex.org/I148283060"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006018763","display_name":"Amalie Trewartha","orcid":"https://orcid.org/0000-0001-6095-8032"},"institutions":[{"id":"https://openalex.org/I148283060","display_name":"Lawrence Berkeley National Laboratory","ror":"https://ror.org/02jbv0t02","country_code":"US","type":"facility","lineage":["https://openalex.org/I1330989302","https://openalex.org/I148283060","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"A. Trewartha","raw_affiliation_strings":["Materials Science Division and Lawrence Berkeley National Laboratory, 1 Cyclotron Road, Berkeley, California 94720, United States"],"affiliations":[{"raw_affiliation_string":"Materials Science Division and Lawrence Berkeley National Laboratory, 1 Cyclotron Road, Berkeley, California 94720, United States","institution_ids":["https://openalex.org/I148283060"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037535334","display_name":"Kristin A. Persson","orcid":"https://orcid.org/0000-0003-2495-5509"},"institutions":[{"id":"https://openalex.org/I148283060","display_name":"Lawrence Berkeley National Laboratory","ror":"https://ror.org/02jbv0t02","country_code":"US","type":"facility","lineage":["https://openalex.org/I1330989302","https://openalex.org/I148283060","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"K. A. Persson","raw_affiliation_strings":["Energy Technologies Area and Lawrence Berkeley National Laboratory, 1 Cyclotron Road, Berkeley, California 94720, United States"],"affiliations":[{"raw_affiliation_string":"Energy Technologies Area and Lawrence Berkeley National Laboratory, 1 Cyclotron Road, Berkeley, California 94720, United States","institution_ids":["https://openalex.org/I148283060"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014983956","display_name":"Gerbrand Ceder","orcid":"https://orcid.org/0000-0001-9275-3605"},"institutions":[{"id":"https://openalex.org/I148283060","display_name":"Lawrence Berkeley National Laboratory","ror":"https://ror.org/02jbv0t02","country_code":"US","type":"facility","lineage":["https://openalex.org/I1330989302","https://openalex.org/I148283060","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"G. Ceder","raw_affiliation_strings":["Materials Science Division and Lawrence Berkeley National Laboratory, 1 Cyclotron Road, Berkeley, California 94720, United States"],"affiliations":[{"raw_affiliation_string":"Materials Science Division and Lawrence Berkeley National Laboratory, 1 Cyclotron Road, Berkeley, California 94720, United States","institution_ids":["https://openalex.org/I148283060"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5003640520","display_name":"Anubhav Jain","orcid":"https://orcid.org/0000-0001-5893-9967"},"institutions":[{"id":"https://openalex.org/I148283060","display_name":"Lawrence Berkeley National Laboratory","ror":"https://ror.org/02jbv0t02","country_code":"US","type":"facility","lineage":["https://openalex.org/I1330989302","https://openalex.org/I148283060","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"A. Jain","raw_affiliation_strings":["Energy Technologies Area and Lawrence Berkeley National Laboratory, 1 Cyclotron Road, Berkeley, California 94720, United States"],"affiliations":[{"raw_affiliation_string":"Energy Technologies Area and Lawrence Berkeley National Laboratory, 1 Cyclotron Road, Berkeley, California 94720, United States","institution_ids":["https://openalex.org/I148283060"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5003640520"],"corresponding_institution_ids":["https://openalex.org/I148283060"],"apc_list":null,"apc_paid":null,"fwci":8.4402,"has_fulltext":true,"cited_by_count":273,"citation_normalized_percentile":{"value":0.98678188,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":"59","issue":"9","first_page":"3692","last_page":"3702"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9897000193595886,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7727732062339783},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.7373304963111877},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.6321848034858704},{"id":"https://openalex.org/keywords/named-entity-recognition","display_name":"Named-entity recognition","score":0.5998244285583496},{"id":"https://openalex.org/keywords/normalization","display_name":"Normalization (sociology)","score":0.49610933661460876},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.4940932095050812},{"id":"https://openalex.org/keywords/information-extraction","display_name":"Information extraction","score":0.47988927364349365},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.43222159147262573},{"id":"https://openalex.org/keywords/pace","display_name":"Pace","score":0.41438984870910645},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.3713456392288208},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.32556790113449097},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2651142477989197},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.16226515173912048}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7727732062339783},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.7373304963111877},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.6321848034858704},{"id":"https://openalex.org/C2779135771","wikidata":"https://www.wikidata.org/wiki/Q403574","display_name":"Named-entity recognition","level":3,"score":0.5998244285583496},{"id":"https://openalex.org/C136886441","wikidata":"https://www.wikidata.org/wiki/Q926129","display_name":"Normalization (sociology)","level":2,"score":0.49610933661460876},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.4940932095050812},{"id":"https://openalex.org/C195807954","wikidata":"https://www.wikidata.org/wiki/Q1662562","display_name":"Information extraction","level":2,"score":0.47988927364349365},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.43222159147262573},{"id":"https://openalex.org/C2777526511","wikidata":"https://www.wikidata.org/wiki/Q691543","display_name":"Pace","level":2,"score":0.41438984870910645},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3713456392288208},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.32556790113449097},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2651142477989197},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.16226515173912048},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C19165224","wikidata":"https://www.wikidata.org/wiki/Q23404","display_name":"Anthropology","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D000074266","descriptor_name":"Materials Science","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D000074266","descriptor_name":"Materials Science","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D000074266","descriptor_name":"Materials Science","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D000080911","descriptor_name":"Cheminformatics","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D000080911","descriptor_name":"Cheminformatics","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D000080911","descriptor_name":"Cheminformatics","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D012984","descriptor_name":"Software","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012984","descriptor_name":"Software","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012984","descriptor_name":"Software","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D057225","descriptor_name":"Data Mining","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D057225","descriptor_name":"Data Mining","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D057225","descriptor_name":"Data Mining","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false}],"locations_count":5,"locations":[{"id":"doi:10.1021/acs.jcim.9b00470","is_oa":false,"landing_page_url":"https://doi.org/10.1021/acs.jcim.9b00470","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},{"id":"pmid:31361962","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/31361962","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of chemical information and modeling","raw_type":null},{"id":"pmh:oai:osti.gov:1581363","is_oa":true,"landing_page_url":"https://www.osti.gov/biblio/1581363","pdf_url":"https://www.osti.gov/servlets/purl/1581363","source":{"id":"https://openalex.org/S4306402487","display_name":"OSTI OAI (U.S. Department of Energy Office of Scientific and Technical Information)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I139351228","host_organization_name":"Office of Scientific and Technical Information","host_organization_lineage":["https://openalex.org/I139351228"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":null},{"id":"pmh:ark:/13030/qt7r45h4mf","is_oa":false,"landing_page_url":null,"pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":null},{"id":"pmh:oai:escholarship.org/ark:/13030/qt7r45h4mf","is_oa":false,"landing_page_url":"https://escholarship.org/uc/item/7r45h4mf","pdf_url":null,"source":{"id":"https://openalex.org/S4306400115","display_name":"eScholarship (California Digital Library)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I2801248553","host_organization_name":"California Digital Library","host_organization_lineage":["https://openalex.org/I2801248553"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Journal of chemical information and modeling, vol 59, iss 9","raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:osti.gov:1581363","is_oa":true,"landing_page_url":"https://www.osti.gov/biblio/1581363","pdf_url":"https://www.osti.gov/servlets/purl/1581363","source":{"id":"https://openalex.org/S4306402487","display_name":"OSTI OAI (U.S. Department of Energy Office of Scientific and Technical Information)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I139351228","host_organization_name":"Office of Scientific and Technical Information","host_organization_lineage":["https://openalex.org/I139351228"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":null},"sustainable_development_goals":[{"score":0.75,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320315934","display_name":"Toyota Research Institute","ror":null}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W2964864162.pdf"},"referenced_works_count":52,"referenced_works":["https://openalex.org/W1623072288","https://openalex.org/W1673310716","https://openalex.org/W1880262756","https://openalex.org/W1940872118","https://openalex.org/W1977781223","https://openalex.org/W1990719174","https://openalex.org/W1994957358","https://openalex.org/W2014362743","https://openalex.org/W2015197254","https://openalex.org/W2020278455","https://openalex.org/W2022298832","https://openalex.org/W2053673723","https://openalex.org/W2059811790","https://openalex.org/W2064675550","https://openalex.org/W2101234009","https://openalex.org/W2101553882","https://openalex.org/W2123554644","https://openalex.org/W2130156865","https://openalex.org/W2144578941","https://openalex.org/W2148488766","https://openalex.org/W2156997379","https://openalex.org/W2166468803","https://openalex.org/W2169491861","https://openalex.org/W2177317049","https://openalex.org/W2187089797","https://openalex.org/W2270423142","https://openalex.org/W2296283641","https://openalex.org/W2313966941","https://openalex.org/W2315433270","https://openalex.org/W2479958290","https://openalex.org/W2498119267","https://openalex.org/W2523785361","https://openalex.org/W2594692737","https://openalex.org/W2610394652","https://openalex.org/W2620846205","https://openalex.org/W2755202310","https://openalex.org/W2766033547","https://openalex.org/W2766362701","https://openalex.org/W2770164889","https://openalex.org/W2770778462","https://openalex.org/W2784133128","https://openalex.org/W2808304511","https://openalex.org/W2950577311","https://openalex.org/W2953384591","https://openalex.org/W2953641512","https://openalex.org/W2974675506","https://openalex.org/W3020786614","https://openalex.org/W3098281808","https://openalex.org/W4298082496","https://openalex.org/W4394307009","https://openalex.org/W4394452526","https://openalex.org/W4394515759"],"related_works":["https://openalex.org/W2793132289","https://openalex.org/W2334378031","https://openalex.org/W2916255597","https://openalex.org/W2999302224","https://openalex.org/W3091569222","https://openalex.org/W4241018868","https://openalex.org/W1495833002","https://openalex.org/W4289715253","https://openalex.org/W2964631078","https://openalex.org/W2075635421"],"abstract_inverted_index":{"The":[0,81],"number":[1],"of":[2,47,121,147,173,189,219],"published":[3,48,77,175],"materials":[4,21,78,91,132,221],"science":[5,79,92,133,222],"articles":[6,49],"has":[7,194],"increased":[8],"manyfold":[9],"over":[10],"the":[11,20,30,43,76,145,174,217],"past":[12],"few":[13],"decades.":[14],"Now,":[15],"a":[16,153,157],"major":[17],"bottleneck":[18],"in":[19,25,156],"discovery":[22],"pipeline":[23],"arises":[24],"connecting":[26],"new":[27],"results":[28,214],"with":[29,66],"previously":[31,180],"established":[32],"literature.":[33,80],"A":[34],"potential":[35],"solution":[36],"to":[37,41,86,126,169,186,215],"this":[38,60],"problem":[39],"is":[40,84,124,150],"map":[42],"unstructured":[44],"raw":[45],"text":[46,64],"onto":[50],"structured":[51,158],"database":[52,154,164],"entries":[53],"that":[54,162,177],"allow":[55],"for":[56,71],"programmatic":[57],"querying.":[58],"To":[59],"end,":[61],"we":[62,211],"apply":[63],"mining":[65],"named":[67,142],"entity":[68],"recognition":[69],"(NER)":[70],"large-scale":[72],"information":[73,89,127],"extraction":[74,128],"from":[75,90,129],"NER":[82],"model":[83],"trained":[85],"extract":[87,136],"summary-level":[88],"documents,":[93],"including":[94],"inorganic":[95],"material":[96,102],"mentions,":[97],"sample":[98],"descriptors,":[99],"phase":[100],"labels,":[101],"properties":[103],"and":[104,111,123,144,192,205,210],"applications,":[105],"as":[106,108,152],"well":[107],"any":[109],"synthesis":[110],"characterization":[112],"methods":[113],"used.":[114],"Our":[115],"classifier":[116],"achieves":[117],"an":[118],"accuracy":[119],"(<i>f</i><sub>1</sub>)":[120],"87%,":[122],"applied":[125],"3.27":[130],"million":[131,140],"abstracts.":[134],"We":[135,160],"more":[137],"than":[138],"80":[139],"materials-science-related":[141],"entities,":[143],"content":[146],"each":[148],"abstract":[149],"represented":[151],"entry":[155],"format.":[159],"demonstrate":[161],"simple":[163],"queries":[165],"can":[166],"be":[167],"used":[168],"answer":[170],"complex":[171],"\"meta-questions\"":[172],"literature":[176,184],"would":[178],"have":[179],"required":[181],"laborious,":[182],"manual":[183],"searches":[185],"answer.":[187],"All":[188],"our":[190,200],"data":[191],"functionality":[193],"been":[195],"made":[196],"freely":[197],"available":[198],"on":[199],"Github":[201],"(":[202,207],"https://github.com/materialsintelligence/matscholar":[203],")":[204],"website":[206],"http://matscholar.com":[208],"),":[209],"expect":[212],"these":[213],"accelerate":[216],"pace":[218],"future":[220],"discovery.":[223]},"counts_by_year":[{"year":2026,"cited_by_count":13},{"year":2025,"cited_by_count":51},{"year":2024,"cited_by_count":65},{"year":2023,"cited_by_count":51},{"year":2022,"cited_by_count":37},{"year":2021,"cited_by_count":35},{"year":2020,"cited_by_count":19},{"year":2019,"cited_by_count":1},{"year":2012,"cited_by_count":1}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
