{"id":"https://openalex.org/W4384201826","doi":"https://doi.org/10.1007/s11192-023-04667-9","title":"Discovery and recognition of formula concepts using machine learning","display_name":"Discovery and recognition of formula concepts using machine learning","publication_year":2023,"publication_date":"2023-07-13","ids":{"openalex":"https://openalex.org/W4384201826","doi":"https://doi.org/10.1007/s11192-023-04667-9"},"language":"en","primary_location":{"id":"doi:10.1007/s11192-023-04667-9","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s11192-023-04667-9","pdf_url":"https://link.springer.com/content/pdf/10.1007/s11192-023-04667-9.pdf","source":{"id":"https://openalex.org/S148561398","display_name":"Scientometrics","issn_l":"0138-9130","issn":["0138-9130","1588-2861"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320108","host_organization_name":"Springer Nature (Netherlands)","host_organization_lineage":["https://openalex.org/P4310320108","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature (Netherlands)","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Scientometrics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s11192-023-04667-9.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5069041521","display_name":"Philipp Scharpf","orcid":"https://orcid.org/0000-0002-4212-0508"},"institutions":[{"id":"https://openalex.org/I189712700","display_name":"University of Konstanz","ror":"https://ror.org/0546hnb39","country_code":"DE","type":"education","lineage":["https://openalex.org/I189712700"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Philipp Scharpf","raw_affiliation_strings":["University of Konstanz, Konstanz, Germany"],"raw_orcid":"https://orcid.org/0000-0002-4212-0508","affiliations":[{"raw_affiliation_string":"University of Konstanz, Konstanz, Germany","institution_ids":["https://openalex.org/I189712700"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038664667","display_name":"Moritz Schubotz","orcid":"https://orcid.org/0000-0001-7141-4997"},"institutions":[{"id":"https://openalex.org/I158675288","display_name":"FIZ Karlsruhe \u2013 Leibniz Institute for Information Infrastructure","ror":"https://ror.org/0387prb75","country_code":"DE","type":"nonprofit","lineage":["https://openalex.org/I158675288","https://openalex.org/I315704651"]},{"id":"https://openalex.org/I167360494","display_name":"University of Wuppertal","ror":"https://ror.org/00613ak93","country_code":"DE","type":"education","lineage":["https://openalex.org/I167360494"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Moritz Schubotz","raw_affiliation_strings":["University of Wuppertal and FIZ Karlsruhe \u2013 Leibniz Institute for Information Infrastructure, Berlin, Germany"],"raw_orcid":"https://orcid.org/0000-0001-7141-4997","affiliations":[{"raw_affiliation_string":"University of Wuppertal and FIZ Karlsruhe \u2013 Leibniz Institute for Information Infrastructure, Berlin, Germany","institution_ids":["https://openalex.org/I158675288","https://openalex.org/I167360494"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075372847","display_name":"Howard S. Cohl","orcid":"https://orcid.org/0000-0002-9398-455X"},"institutions":[{"id":"https://openalex.org/I1321296531","display_name":"National Institute of Standards and Technology","ror":"https://ror.org/05xpvk416","country_code":"US","type":"funder","lineage":["https://openalex.org/I1321296531","https://openalex.org/I1343035065"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Howard S. Cohl","raw_affiliation_strings":["Applied and Computational Mathematics Division, National Institute of Standards and Technology, Gaithersburg, Maryland, USA"],"raw_orcid":"https://orcid.org/0000-0002-9398-455X","affiliations":[{"raw_affiliation_string":"Applied and Computational Mathematics Division, National Institute of Standards and Technology, Gaithersburg, Maryland, USA","institution_ids":["https://openalex.org/I1321296531"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013617539","display_name":"Corinna Breitinger","orcid":"https://orcid.org/0000-0001-6586-0392"},"institutions":[{"id":"https://openalex.org/I74656192","display_name":"University of G\u00f6ttingen","ror":"https://ror.org/01y9bpm73","country_code":"DE","type":"education","lineage":["https://openalex.org/I74656192"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Corinna Breitinger","raw_affiliation_strings":["University of G\u00f6ttingen, G\u00f6ttingen, Germany"],"raw_orcid":"https://orcid.org/0000-0001-6586-0392","affiliations":[{"raw_affiliation_string":"University of G\u00f6ttingen, G\u00f6ttingen, Germany","institution_ids":["https://openalex.org/I74656192"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5058837356","display_name":"B\u00e9la Gipp","orcid":"https://orcid.org/0000-0001-6522-3019"},"institutions":[{"id":"https://openalex.org/I74656192","display_name":"University of G\u00f6ttingen","ror":"https://ror.org/01y9bpm73","country_code":"DE","type":"education","lineage":["https://openalex.org/I74656192"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Bela Gipp","raw_affiliation_strings":["University of G\u00f6ttingen, G\u00f6ttingen, Germany"],"raw_orcid":"https://orcid.org/0000-0001-6522-3019","affiliations":[{"raw_affiliation_string":"University of G\u00f6ttingen, G\u00f6ttingen, Germany","institution_ids":["https://openalex.org/I74656192"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5058837356"],"corresponding_institution_ids":["https://openalex.org/I74656192"],"apc_list":{"value":2290,"currency":"EUR","value_usd":2890},"apc_paid":{"value":2290,"currency":"EUR","value_usd":2890},"fwci":0.7435,"has_fulltext":true,"cited_by_count":4,"citation_normalized_percentile":{"value":0.74936743,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"128","issue":"9","first_page":"4971","last_page":"5025"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13523","display_name":"Mathematics, Computing, and Information Processing","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13523","display_name":"Mathematics, Computing, and Information Processing","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9502999782562256,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9420999884605408,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7456659078598022},{"id":"https://openalex.org/keywords/citation","display_name":"Citation","score":0.6242669224739075},{"id":"https://openalex.org/keywords/notation","display_name":"Notation","score":0.5780913829803467},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.5529739856719971},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5495012998580933},{"id":"https://openalex.org/keywords/mathematical-notation","display_name":"Mathematical notation","score":0.5141618251800537},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5043898820877075},{"id":"https://openalex.org/keywords/identifier","display_name":"Identifier","score":0.4474678337574005},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.40236207842826843},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.18678435683250427},{"id":"https://openalex.org/keywords/arithmetic","display_name":"Arithmetic","score":0.13250598311424255},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.09383028745651245}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7456659078598022},{"id":"https://openalex.org/C2778805511","wikidata":"https://www.wikidata.org/wiki/Q1713","display_name":"Citation","level":2,"score":0.6242669224739075},{"id":"https://openalex.org/C45357846","wikidata":"https://www.wikidata.org/wiki/Q2001982","display_name":"Notation","level":2,"score":0.5780913829803467},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.5529739856719971},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5495012998580933},{"id":"https://openalex.org/C24457124","wikidata":"https://www.wikidata.org/wiki/Q1140046","display_name":"Mathematical notation","level":3,"score":0.5141618251800537},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5043898820877075},{"id":"https://openalex.org/C154504017","wikidata":"https://www.wikidata.org/wiki/Q853614","display_name":"Identifier","level":2,"score":0.4474678337574005},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.40236207842826843},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.18678435683250427},{"id":"https://openalex.org/C94375191","wikidata":"https://www.wikidata.org/wiki/Q11205","display_name":"Arithmetic","level":1,"score":0.13250598311424255},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.09383028745651245},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1007/s11192-023-04667-9","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s11192-023-04667-9","pdf_url":"https://link.springer.com/content/pdf/10.1007/s11192-023-04667-9.pdf","source":{"id":"https://openalex.org/S148561398","display_name":"Scientometrics","issn_l":"0138-9130","issn":["0138-9130","1588-2861"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320108","host_organization_name":"Springer Nature (Netherlands)","host_organization_lineage":["https://openalex.org/P4310320108","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature (Netherlands)","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Scientometrics","raw_type":"journal-article"},{"id":"pmh:oai:RePEc:spr:scient:v:128:y:2023:i:9:d:10.1007_s11192-023-04667-9","is_oa":false,"landing_page_url":"http://link.springer.com/10.1007/s11192-023-04667-9","pdf_url":null,"source":{"id":"https://openalex.org/S4306401271","display_name":"RePEc: Research Papers in Economics","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I77793887","host_organization_name":"Federal Reserve Bank of St. Louis","host_organization_lineage":["https://openalex.org/I77793887"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},{"id":"pmh:oai:kops.uni-konstanz.de:123456789/72154","is_oa":true,"landing_page_url":"http://nbn-resolving.de/urn:nbn:de:bsz:352-2-ff4tuct3qxt3","pdf_url":null,"source":{"id":"https://openalex.org/S4306401487","display_name":"KOPS (University of Konstanz)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I189712700","host_organization_name":"University of Konstanz","host_organization_lineage":["https://openalex.org/I189712700"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Scientometrics. Springer. 2023, 128(9), S. 4971-5025. ISSN 0138-9130. eISSN 1588-2861. Verf\u00fcgbar unter: doi: 10.1007/s11192-023-04667-9","raw_type":"doc-type:Text"},{"id":"pmh:oai:publications.goettingen-research-online.de:2/132247","is_oa":true,"landing_page_url":"https://resolver.sub.uni-goettingen.de/purl?gro-2/132247","pdf_url":null,"source":{"id":"https://openalex.org/S4306401634","display_name":"GoeScholar  The Publication Server of the Georg-August-Universit\u00e4t G\u00f6ttingen (Georg-August-Universit\u00e4t G\u00f6ttingen)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210122495","host_organization_name":"Asklepios Klinik St. Georg","host_organization_lineage":["https://openalex.org/I4210122495"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"yes"}],"best_oa_location":{"id":"doi:10.1007/s11192-023-04667-9","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s11192-023-04667-9","pdf_url":"https://link.springer.com/content/pdf/10.1007/s11192-023-04667-9.pdf","source":{"id":"https://openalex.org/S148561398","display_name":"Scientometrics","issn_l":"0138-9130","issn":["0138-9130","1588-2861"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320108","host_organization_name":"Springer Nature (Netherlands)","host_organization_lineage":["https://openalex.org/P4310320108","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature (Netherlands)","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Scientometrics","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.8399999737739563,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[{"id":"https://openalex.org/G4964679585","display_name":null,"funder_award_id":"437179652","funder_id":"https://openalex.org/F4320320879","funder_display_name":"Deutsche Forschungsgemeinschaft"},{"id":"https://openalex.org/G5414194935","display_name":null,"funder_award_id":"350192710","funder_id":"https://openalex.org/F4320320879","funder_display_name":"Deutsche Forschungsgemeinschaft"}],"funders":[{"id":"https://openalex.org/F4320313139","display_name":"Nieders\u00e4chsische Ministerium f\u00fcr Wissenschaft und Kultur","ror":"https://ror.org/0116z8r77"},{"id":"https://openalex.org/F4320320879","display_name":"Deutsche Forschungsgemeinschaft","ror":"https://ror.org/018mejw64"},{"id":"https://openalex.org/F4320320882","display_name":"Volkswagen Foundation","ror":"https://ror.org/03bsmfz84"},{"id":"https://openalex.org/F4320321870","display_name":"Georg-August-Universit\u00e4t G\u00f6ttingen","ror":"https://ror.org/01y9bpm73"},{"id":"https://openalex.org/F4320326493","display_name":"Nieders\u00e4chsisches Ministerium f\u00fcr Wissenschaft und Kultur","ror":null}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4384201826.pdf"},"referenced_works_count":60,"referenced_works":["https://openalex.org/W1494975459","https://openalex.org/W1505494854","https://openalex.org/W1593320022","https://openalex.org/W1888893865","https://openalex.org/W1980404452","https://openalex.org/W1987490028","https://openalex.org/W1988322580","https://openalex.org/W2009957709","https://openalex.org/W2047210446","https://openalex.org/W2066636486","https://openalex.org/W2080133951","https://openalex.org/W2091095871","https://openalex.org/W2122081959","https://openalex.org/W2127589108","https://openalex.org/W2131744502","https://openalex.org/W2137079713","https://openalex.org/W2139685094","https://openalex.org/W2170544604","https://openalex.org/W2182868890","https://openalex.org/W2337021505","https://openalex.org/W2522880372","https://openalex.org/W2556128865","https://openalex.org/W2569480976","https://openalex.org/W2617469434","https://openalex.org/W2770920320","https://openalex.org/W2797867514","https://openalex.org/W2883885170","https://openalex.org/W2887888371","https://openalex.org/W2902254442","https://openalex.org/W2907090821","https://openalex.org/W2965221296","https://openalex.org/W2972393600","https://openalex.org/W3004742727","https://openalex.org/W3028148433","https://openalex.org/W3028529056","https://openalex.org/W3040999115","https://openalex.org/W3043441534","https://openalex.org/W3098678576","https://openalex.org/W3099633411","https://openalex.org/W3101340675","https://openalex.org/W3101645173","https://openalex.org/W3125340959","https://openalex.org/W3164439416","https://openalex.org/W4232315234","https://openalex.org/W4251572646","https://openalex.org/W4281622223","https://openalex.org/W4289535737","https://openalex.org/W4309217187","https://openalex.org/W4375843291","https://openalex.org/W4403252750","https://openalex.org/W6631501603","https://openalex.org/W6636892783","https://openalex.org/W6672077861","https://openalex.org/W6673039648","https://openalex.org/W6675354045","https://openalex.org/W6696853935","https://openalex.org/W6713259660","https://openalex.org/W6785069526","https://openalex.org/W6803544816","https://openalex.org/W6980547258"],"related_works":["https://openalex.org/W2390777183","https://openalex.org/W1882848237","https://openalex.org/W4252772812","https://openalex.org/W2316776327","https://openalex.org/W2328387788","https://openalex.org/W2911510094","https://openalex.org/W4247174507","https://openalex.org/W4386351071","https://openalex.org/W1992321925","https://openalex.org/W2357241418"],"abstract_inverted_index":{"Abstract":[0],"Citation-based":[1],"Information":[2],"Retrieval":[3,86],"(IR)":[4],"methods":[5,57],"for":[6,12,169,181,214],"scientific":[7],"documents":[8,200],"have":[9],"proven":[10],"effective":[11],"IR":[13,56],"applications,":[14],"such":[15],"as":[16,208,210],"Plagiarism":[17],"Detection":[18],"or":[19,217],"Literature":[20],"Recommender":[21],"Systems":[22],"in":[23],"academic":[24],"disciplines":[25],"that":[26,112],"use":[27],"many":[28],"references.":[29],"In":[30,70],"science,":[31],"technology,":[32],"engineering,":[33],"and":[34,58,67,81,95,106,145,176,191,201,205],"mathematics,":[35],"researchers":[36],"often":[37],"employ":[38],"mathematical":[39,68,76,133,199],"concepts":[40],"through":[41],"formula":[42,127,184],"notation":[43],"to":[44,46,53,63,123,128,141],"refer":[45],"prior":[47,130],"knowledge.":[48],"Our":[49,161],"long-term":[50],"goal":[51],"is":[52,121],"generalize":[54],"citation-based":[55],"apply":[59],"this":[60,71],"generalized":[61],"method":[62],"both":[64],"classical":[65],"references":[66],"concepts.":[69],"paper,":[72],"we":[73],"suggest":[74],"how":[75],"formulas":[77,175,197],"could":[78],"be":[79],"cited":[80],"define":[82],"a":[83,109,118,125,129,154,165,177],"Formula":[84,91,96],"Concept":[85,92,97],"task":[87],"with":[88],"two":[89],"subtasks:":[90],"Discovery":[93],"(FCD)":[94],"Recognition":[98],"(FCR).":[99],"While":[100],"FCD":[101,144,162,190],"aims":[102],"at":[103],"the":[104,143,183,187,194],"definition":[105],"exploration":[107],"of":[108,117,167,173,179,196],"\u2018Formula":[110],"Concept\u2019":[111],"names":[113],"bundled":[114],"equivalent":[115,171],"representations":[116,172],"formula,":[119],"FCR":[120,146,192],"designed":[122],"match":[124],"given":[126],"assigned":[131],"unique":[132],"concept":[134],"identifier.":[135],"We":[136,148],"present":[137],"machine":[138],"learning-based":[139],"approaches":[140,152],"address":[142],"tasks.":[147],"then":[149],"evaluate":[150],"these":[151],"on":[153],"standardized":[155],"test":[156],"collection":[157],"(NTCIR":[158],"arXiv":[159],"dataset).":[160],"approach":[163],"yields":[164],"precision":[166],"68%":[168],"retrieving":[170],"frequent":[174],"recall":[178],"72%":[180],"extracting":[182],"name":[185],"from":[186],"surrounding":[188],"text.":[189],"enable":[193],"citation":[195],"within":[198],"facilitate":[202],"semantic":[203],"search":[204],"question":[206],"answering,":[207],"well":[209],"document":[211],"similarity":[212],"assessments":[213],"plagiarism":[215],"detection":[216],"recommender":[218],"systems.":[219]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2024,"cited_by_count":2}],"updated_date":"2026-06-14T07:44:22.658603","created_date":"2025-10-10T00:00:00"}
