{"id":"https://openalex.org/W2165671627","doi":"https://doi.org/10.1186/1758-2946-3-41","title":"OSCAR4: a flexible architecture for chemical text-mining","display_name":"OSCAR4: a flexible architecture for chemical text-mining","publication_year":2011,"publication_date":"2011-10-14","ids":{"openalex":"https://openalex.org/W2165671627","doi":"https://doi.org/10.1186/1758-2946-3-41","mag":"2165671627","pmid":"https://pubmed.ncbi.nlm.nih.gov/21999457"},"language":"en","primary_location":{"id":"doi:10.1186/1758-2946-3-41","is_oa":true,"landing_page_url":"https://doi.org/10.1186/1758-2946-3-41","pdf_url":"https://jcheminf.biomedcentral.com/counter/pdf/10.1186/1758-2946-3-41","source":{"id":"https://openalex.org/S180838163","display_name":"Journal of Cheminformatics","issn_l":"1758-2946","issn":["1758-2946"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Cheminformatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://jcheminf.biomedcentral.com/counter/pdf/10.1186/1758-2946-3-41","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5028799902","display_name":"David Jessop","orcid":"https://orcid.org/0009-0004-1712-5245"},"institutions":[{"id":"https://openalex.org/I1342131907","display_name":"Unilever (United Kingdom)","ror":"https://ror.org/05n8ah907","country_code":"GB","type":"company","lineage":["https://openalex.org/I1342131907"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"David M Jessop","raw_affiliation_strings":["Unilever Centre for Molecular Science Informatics, Department of Chemistry, Lensfield Road, Cambridge CB2 1EW, UK. pm286@cam.ac.uk","Department of Chemistry, Unilever Centre for Molecular Science Informatics, Lensfield Road, Cambridge, CB2 1EW, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Unilever Centre for Molecular Science Informatics, Department of Chemistry, Lensfield Road, Cambridge CB2 1EW, UK. pm286@cam.ac.uk","institution_ids":["https://openalex.org/I1342131907"]},{"raw_affiliation_string":"Department of Chemistry, Unilever Centre for Molecular Science Informatics, Lensfield Road, Cambridge, CB2 1EW, UK","institution_ids":["https://openalex.org/I1342131907"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048250757","display_name":"Sam Adams","orcid":"https://orcid.org/0000-0001-7141-0400"},"institutions":[{"id":"https://openalex.org/I1342131907","display_name":"Unilever (United Kingdom)","ror":"https://ror.org/05n8ah907","country_code":"GB","type":"company","lineage":["https://openalex.org/I1342131907"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Sam E Adams","raw_affiliation_strings":["Department of Chemistry, Unilever Centre for Molecular Science Informatics, Lensfield Road, Cambridge, CB2 1EW, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Chemistry, Unilever Centre for Molecular Science Informatics, Lensfield Road, Cambridge, CB2 1EW, UK","institution_ids":["https://openalex.org/I1342131907"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060194743","display_name":"Egon Willighagen","orcid":"https://orcid.org/0000-0001-7542-0286"},"institutions":[{"id":"https://openalex.org/I1342131907","display_name":"Unilever (United Kingdom)","ror":"https://ror.org/05n8ah907","country_code":"GB","type":"company","lineage":["https://openalex.org/I1342131907"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Egon L Willighagen","raw_affiliation_strings":["Department of Chemistry, Unilever Centre for Molecular Science Informatics, Lensfield Road, Cambridge, CB2 1EW, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Chemistry, Unilever Centre for Molecular Science Informatics, Lensfield Road, Cambridge, CB2 1EW, UK","institution_ids":["https://openalex.org/I1342131907"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012357306","display_name":"Lezan Hawizy","orcid":"https://orcid.org/0000-0002-0932-3135"},"institutions":[{"id":"https://openalex.org/I1342131907","display_name":"Unilever (United Kingdom)","ror":"https://ror.org/05n8ah907","country_code":"GB","type":"company","lineage":["https://openalex.org/I1342131907"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Lezan Hawizy","raw_affiliation_strings":["Department of Chemistry, Unilever Centre for Molecular Science Informatics, Lensfield Road, Cambridge, CB2 1EW, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Chemistry, Unilever Centre for Molecular Science Informatics, Lensfield Road, Cambridge, CB2 1EW, UK","institution_ids":["https://openalex.org/I1342131907"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5041092827","display_name":"Peter Murray\u2010Rust","orcid":"https://orcid.org/0000-0003-3386-3972"},"institutions":[{"id":"https://openalex.org/I1342131907","display_name":"Unilever (United Kingdom)","ror":"https://ror.org/05n8ah907","country_code":"GB","type":"company","lineage":["https://openalex.org/I1342131907"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Peter Murray-Rust","raw_affiliation_strings":["Department of Chemistry, Unilever Centre for Molecular Science Informatics, Lensfield Road, Cambridge, CB2 1EW, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Chemistry, Unilever Centre for Molecular Science Informatics, Lensfield Road, Cambridge, CB2 1EW, UK","institution_ids":["https://openalex.org/I1342131907"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":{"value":1290,"currency":"GBP","value_usd":1582},"apc_paid":{"value":1290,"currency":"GBP","value_usd":1582},"fwci":6.121,"has_fulltext":true,"cited_by_count":222,"citation_normalized_percentile":{"value":0.97359538,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"3","issue":"1","first_page":"41","last_page":"41"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9764000177383423,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8032577633857727},{"id":"https://openalex.org/keywords/modular-design","display_name":"Modular design","score":0.6079075336456299},{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.5063232183456421},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.476046085357666},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.47064393758773804},{"id":"https://openalex.org/keywords/software-engineering","display_name":"Software engineering","score":0.40361738204956055},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.16017374396324158}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8032577633857727},{"id":"https://openalex.org/C101468663","wikidata":"https://www.wikidata.org/wiki/Q1620158","display_name":"Modular design","level":2,"score":0.6079075336456299},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.5063232183456421},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.476046085357666},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.47064393758773804},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.40361738204956055},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.16017374396324158},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C153349607","wikidata":"https://www.wikidata.org/wiki/Q36649","display_name":"Visual arts","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":7,"locations":[{"id":"doi:10.1186/1758-2946-3-41","is_oa":true,"landing_page_url":"https://doi.org/10.1186/1758-2946-3-41","pdf_url":"https://jcheminf.biomedcentral.com/counter/pdf/10.1186/1758-2946-3-41","source":{"id":"https://openalex.org/S180838163","display_name":"Journal of Cheminformatics","issn_l":"1758-2946","issn":["1758-2946"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Cheminformatics","raw_type":"journal-article"},{"id":"pmid:21999457","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/21999457","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of cheminformatics","raw_type":null},{"id":"pmh:oai:cris.maastrichtuniversity.nl:openaire/1caa0bcd-c702-44fb-8038-ef39c3e2ad56","is_oa":true,"landing_page_url":"https://cris.maastrichtuniversity.nl/en/publications/1caa0bcd-c702-44fb-8038-ef39c3e2ad56","pdf_url":null,"source":{"id":"https://openalex.org/S4306402616","display_name":"Research Publications (Maastricht University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I34352273","host_organization_name":"Maastricht University","host_organization_lineage":["https://openalex.org/I34352273"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Jessop, D M, Adams, S E, Willighagen, E L, Hawizy, L & Murray-rust, P 2011, 'OSCAR4: a flexible architecture for chemical text-mining', Journal of Cheminformatics, vol. 3, no. 1. https://doi.org/10.1186/1758-2946-3-41","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:oai:doaj.org/article:e6cc79f7c4094bd195125539a02d23bf","is_oa":true,"landing_page_url":"https://doaj.org/article/e6cc79f7c4094bd195125539a02d23bf","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Journal of Cheminformatics, Vol 3, Iss 1, p 41 (2011)","raw_type":"article"},{"id":"pmh:oai:pubmedcentral.nih.gov:3205045","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/3205045","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"J Cheminform","raw_type":"Text"},{"id":"pmh:oai:www.repository.cam.ac.uk:1810/238388","is_oa":true,"landing_page_url":"http://www.dspace.cam.ac.uk/handle/1810/238388","pdf_url":null,"source":{"id":"https://openalex.org/S4306401777","display_name":"Apollo (University of Cambridge)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I241749","host_organization_name":"University of Cambridge","host_organization_lineage":["https://openalex.org/I241749"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"pmh:oai:www.repository.cam.ac.uk:1810/239919","is_oa":true,"landing_page_url":"http://www.dspace.cam.ac.uk/handle/1810/239919","pdf_url":null,"source":{"id":"https://openalex.org/S4306401777","display_name":"Apollo (University of Cambridge)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I241749","host_organization_name":"University of Cambridge","host_organization_lineage":["https://openalex.org/I241749"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"}],"best_oa_location":{"id":"doi:10.1186/1758-2946-3-41","is_oa":true,"landing_page_url":"https://doi.org/10.1186/1758-2946-3-41","pdf_url":"https://jcheminf.biomedcentral.com/counter/pdf/10.1186/1758-2946-3-41","source":{"id":"https://openalex.org/S180838163","display_name":"Journal of Cheminformatics","issn_l":"1758-2946","issn":["1758-2946"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Cheminformatics","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.5299999713897705,"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320320309","display_name":"Joint Information Systems Committee","ror":"https://ror.org/01rv9gx86"},{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2165671627.pdf","grobid_xml":"https://content.openalex.org/works/W2165671627.grobid-xml"},"referenced_works_count":37,"referenced_works":["https://openalex.org/W77347155","https://openalex.org/W104426851","https://openalex.org/W1490056294","https://openalex.org/W1497319365","https://openalex.org/W1508604947","https://openalex.org/W1524134026","https://openalex.org/W1541135842","https://openalex.org/W1548027170","https://openalex.org/W1626162317","https://openalex.org/W1975147762","https://openalex.org/W1977289091","https://openalex.org/W2009556891","https://openalex.org/W2028578434","https://openalex.org/W2033377040","https://openalex.org/W2034354062","https://openalex.org/W2038702914","https://openalex.org/W2045155277","https://openalex.org/W2047600440","https://openalex.org/W2049240985","https://openalex.org/W2058673890","https://openalex.org/W2068737686","https://openalex.org/W2070217628","https://openalex.org/W2079248317","https://openalex.org/W2095596879","https://openalex.org/W2098889731","https://openalex.org/W2111044246","https://openalex.org/W2115964835","https://openalex.org/W2121244856","https://openalex.org/W2125552472","https://openalex.org/W2125904022","https://openalex.org/W2127239015","https://openalex.org/W2133208308","https://openalex.org/W2148797284","https://openalex.org/W2170876339","https://openalex.org/W2315533568","https://openalex.org/W2526887497","https://openalex.org/W4233602311"],"related_works":["https://openalex.org/W2378076731","https://openalex.org/W4286888643","https://openalex.org/W3210795196","https://openalex.org/W2088988140","https://openalex.org/W2803103875","https://openalex.org/W2103019253","https://openalex.org/W2951529875","https://openalex.org/W2391453316","https://openalex.org/W2297768894","https://openalex.org/W1988064119"],"abstract_inverted_index":{"The":[0],"Open-Source":[1],"Chemistry":[2],"Analysis":[3],"Routines":[4],"(OSCAR)":[5],"software,":[6],"a":[7,47,69],"toolkit":[8],"for":[9],"the":[10,30,33,41],"recognition":[11],"of":[12,32,53],"named":[13],"entities":[14],"and":[15,37,81,84],"data":[16],"in":[17,29],"chemistry":[18,74],"publications,":[19],"has":[20,27],"been":[21],"developed":[22],"since":[23],"2002.":[24],"Recent":[25],"work":[26],"resulted":[28],"separation":[31],"core":[34],"OSCAR":[35],"functionality":[36],"its":[38,82],"release":[39],"as":[40],"OSCAR4":[42,67],"library.":[43],"This":[44],"library":[45],"features":[46],"modular":[48],"API":[49],"(based":[50],"on":[51],"reduction":[52],"surface":[54],"coupling)":[55],"that":[56],"permits":[57],"client":[58],"programmers":[59],"to":[60],"easily":[61],"incorporate":[62],"it":[63],"into":[64],"external":[65],"applications.":[66],"offers":[68],"domain-independent":[70],"architecture":[71],"upon":[72],"which":[73],"specific":[75],"text-mining":[76],"tools":[77],"can":[78],"be":[79],"built,":[80],"development":[83],"usage":[85],"are":[86],"discussed.":[87]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":20},{"year":2024,"cited_by_count":13},{"year":2023,"cited_by_count":15},{"year":2022,"cited_by_count":21},{"year":2021,"cited_by_count":21},{"year":2020,"cited_by_count":12},{"year":2019,"cited_by_count":11},{"year":2018,"cited_by_count":7},{"year":2017,"cited_by_count":10},{"year":2016,"cited_by_count":22},{"year":2015,"cited_by_count":20},{"year":2014,"cited_by_count":14},{"year":2013,"cited_by_count":14},{"year":2012,"cited_by_count":13}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
