{"id":"https://openalex.org/W1535228720","doi":"https://doi.org/10.1109/icdm.2003.1250900","title":"Frequent sub-structure-based approaches for classifying chemical compounds","display_name":"Frequent sub-structure-based approaches for classifying chemical compounds","publication_year":2004,"publication_date":"2004-03-30","ids":{"openalex":"https://openalex.org/W1535228720","doi":"https://doi.org/10.1109/icdm.2003.1250900","mag":"1535228720"},"language":"en","primary_location":{"id":"doi:10.1109/icdm.2003.1250900","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icdm.2003.1250900","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Third IEEE International Conference on Data Mining","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://conservancy.umn.edu/bitstreams/674df573-96da-490d-b7df-0725934f1697/download","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5112711159","display_name":"Mukund Deshpande","orcid":null},"institutions":[{"id":"https://openalex.org/I130238516","display_name":"University of Minnesota","ror":"https://ror.org/017zqws13","country_code":"US","type":"education","lineage":["https://openalex.org/I130238516"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mukund Deshpande","raw_affiliation_strings":["Department of Computer Science/Army HPC Research Center, University of Minnesota, Minneapolis, MN, USA","Dept. of Comput. Sci., Minnesota Univ., Minneapolis, MN, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science/Army HPC Research Center, University of Minnesota, Minneapolis, MN, USA","institution_ids":["https://openalex.org/I130238516"]},{"raw_affiliation_string":"Dept. of Comput. Sci., Minnesota Univ., Minneapolis, MN, USA","institution_ids":["https://openalex.org/I130238516"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062191522","display_name":"M. Kuramochi","orcid":"https://orcid.org/0009-0002-3845-0077"},"institutions":[{"id":"https://openalex.org/I130238516","display_name":"University of Minnesota","ror":"https://ror.org/017zqws13","country_code":"US","type":"education","lineage":["https://openalex.org/I130238516"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"M. Kuramochi","raw_affiliation_strings":["Department of Computer Science/Army HPC Research Center, University of Minnesota, Minneapolis, MN, USA","Dept. of Comput. Sci., Minnesota Univ., Minneapolis, MN, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science/Army HPC Research Center, University of Minnesota, Minneapolis, MN, USA","institution_ids":["https://openalex.org/I130238516"]},{"raw_affiliation_string":"Dept. of Comput. Sci., Minnesota Univ., Minneapolis, MN, USA","institution_ids":["https://openalex.org/I130238516"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5082384108","display_name":"George Karypis","orcid":"https://orcid.org/0000-0003-2753-1437"},"institutions":[{"id":"https://openalex.org/I130238516","display_name":"University of Minnesota","ror":"https://ror.org/017zqws13","country_code":"US","type":"education","lineage":["https://openalex.org/I130238516"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"G. Karypis","raw_affiliation_strings":["Department of Computer Science/Army HPC Research Center, University of Minnesota, Minneapolis, MN, USA","Dept. of Comput. Sci., Minnesota Univ., Minneapolis, MN, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science/Army HPC Research Center, University of Minnesota, Minneapolis, MN, USA","institution_ids":["https://openalex.org/I130238516"]},{"raw_affiliation_string":"Dept. of Comput. Sci., Minnesota Univ., Minneapolis, MN, USA","institution_ids":["https://openalex.org/I130238516"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":16.6136,"has_fulltext":true,"cited_by_count":154,"citation_normalized_percentile":{"value":0.99498814,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"35","last_page":"42"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10908","display_name":"Analytical Chemistry and Chromatography","score":0.9585999846458435,"subfield":{"id":"https://openalex.org/subfields/1607","display_name":"Spectroscopy"},"field":{"id":"https://openalex.org/fields/16","display_name":"Chemistry"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10640","display_name":"Spectroscopy and Chemometric Analyses","score":0.940500020980835,"subfield":{"id":"https://openalex.org/subfields/1602","display_name":"Analytical Chemistry"},"field":{"id":"https://openalex.org/fields/16","display_name":"Chemistry"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6168591976165771},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4291520416736603}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6168591976165771},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4291520416736603}],"mesh":[],"locations_count":5,"locations":[{"id":"doi:10.1109/icdm.2003.1250900","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icdm.2003.1250900","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Third IEEE International Conference on Data Mining","raw_type":"proceedings-article"},{"id":"pmh:oai:conservancy.umn.edu:11299/215559","is_oa":true,"landing_page_url":"http://hdl.handle.net/11299/215559","pdf_url":"https://conservancy.umn.edu/bitstreams/674df573-96da-490d-b7df-0725934f1697/download","source":{"id":"https://openalex.org/S4306402521","display_name":"University of Minnesota Digital Conservancy (University of Minnesota)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I130238516","host_organization_name":"University of Minnesota","host_organization_lineage":["https://openalex.org/I130238516"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Report"},{"id":"pmh:ADA439580","is_oa":false,"landing_page_url":"http://oai.dtic.mil/oai/oai?&amp;verb=getRecord&amp;metadataPrefix=html&amp;identifier=ADA439580","pdf_url":null,"source":{"id":"https://openalex.org/S4406923043","display_name":"Defense Technical Information Center (DTIC)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"DTIC AND NTIS","raw_type":"Text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.12.4863","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.12.4863","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www-users.cs.umn.edu/~karypis/publications/Papers/PDF/chemclassify.pdf","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.12.6330","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.12.6330","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www-users.cs.umn.edu/~karypis/publications/Papers/Postscript/chemclassify.ps","raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:conservancy.umn.edu:11299/215559","is_oa":true,"landing_page_url":"http://hdl.handle.net/11299/215559","pdf_url":"https://conservancy.umn.edu/bitstreams/674df573-96da-490d-b7df-0725934f1697/download","source":{"id":"https://openalex.org/S4306402521","display_name":"University of Minnesota Digital Conservancy (University of Minnesota)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I130238516","host_organization_name":"University of Minnesota","host_organization_lineage":["https://openalex.org/I130238516"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Report"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","score":0.75,"display_name":"Reduced inequalities"}],"awards":[{"id":"https://openalex.org/G2991020469","display_name":"Multi-Constraint, Multi-Objective Graph Partitioning","funder_award_id":"9972519","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G4968282825","display_name":"CAREER: Scalable Algorithms for Knowledge Discovery in Scientific Data Sets","funder_award_id":"0133464","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G8609813352","display_name":"Dynamic Feature Extraction and Data Mining for the Analysis of Turbulent Flows","funder_award_id":"9982274","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G8804007457","display_name":"CISE Research Instrumentation: Cluster Computing for Knowledge Discovery in Diverse Data Sets","funder_award_id":"9986042","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W1535228720.pdf","grobid_xml":"https://content.openalex.org/works/W1535228720.grobid-xml"},"referenced_works_count":93,"referenced_works":["https://openalex.org/W4909282","https://openalex.org/W22405845","https://openalex.org/W107234074","https://openalex.org/W113396932","https://openalex.org/W590490886","https://openalex.org/W592696926","https://openalex.org/W655356045","https://openalex.org/W1497782867","https://openalex.org/W1504694836","https://openalex.org/W1544481768","https://openalex.org/W1547701650","https://openalex.org/W1549439022","https://openalex.org/W1560182410","https://openalex.org/W1565236324","https://openalex.org/W1581588296","https://openalex.org/W1604938182","https://openalex.org/W1606992230","https://openalex.org/W1619260253","https://openalex.org/W1641749581","https://openalex.org/W1919031954","https://openalex.org/W1967436230","https://openalex.org/W1970202530","https://openalex.org/W1970259423","https://openalex.org/W1970651561","https://openalex.org/W1972156862","https://openalex.org/W1975147762","https://openalex.org/W1976683819","https://openalex.org/W1985104873","https://openalex.org/W1987902506","https://openalex.org/W1989141250","https://openalex.org/W1991286793","https://openalex.org/W1994126845","https://openalex.org/W1996249351","https://openalex.org/W2003932717","https://openalex.org/W2014123957","https://openalex.org/W2014728572","https://openalex.org/W2015422283","https://openalex.org/W2016979469","https://openalex.org/W2017398555","https://openalex.org/W2018590585","https://openalex.org/W2021748110","https://openalex.org/W2023532185","https://openalex.org/W2026909852","https://openalex.org/W2029883642","https://openalex.org/W2034411740","https://openalex.org/W2051589410","https://openalex.org/W2059556517","https://openalex.org/W2060531713","https://openalex.org/W2061111857","https://openalex.org/W2062097402","https://openalex.org/W2071744657","https://openalex.org/W2079775628","https://openalex.org/W2080632942","https://openalex.org/W2081050523","https://openalex.org/W2083534494","https://openalex.org/W2095175954","https://openalex.org/W2096729078","https://openalex.org/W2096942889","https://openalex.org/W2099404336","https://openalex.org/W2101649019","https://openalex.org/W2116296021","https://openalex.org/W2118349699","https://openalex.org/W2119148238","https://openalex.org/W2119831128","https://openalex.org/W2125055259","https://openalex.org/W2134097564","https://openalex.org/W2136593687","https://openalex.org/W2138024338","https://openalex.org/W2141753133","https://openalex.org/W2148603752","https://openalex.org/W2154642793","https://openalex.org/W2156909104","https://openalex.org/W2167404361","https://openalex.org/W2167681385","https://openalex.org/W2168209541","https://openalex.org/W2170726034","https://openalex.org/W2321929586","https://openalex.org/W2522853541","https://openalex.org/W2792455800","https://openalex.org/W2977827582","https://openalex.org/W3023786531","https://openalex.org/W4253626616","https://openalex.org/W4254721730","https://openalex.org/W6600201224","https://openalex.org/W6600927619","https://openalex.org/W6604347334","https://openalex.org/W6632694911","https://openalex.org/W6636756987","https://openalex.org/W6640284990","https://openalex.org/W6682837551","https://openalex.org/W6684495928","https://openalex.org/W6684716869","https://openalex.org/W6685146747"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W2382290278","https://openalex.org/W2350741829","https://openalex.org/W2530322880","https://openalex.org/W1596801655","https://openalex.org/W2359140296"],"abstract_inverted_index":{"We":[0,9],"study":[1],"the":[2,17,22,41,60,65,75,106],"problem":[3],"of":[4,45,77],"classifying":[5],"chemical":[6],"compound":[7],"datasets.":[8],"present":[10,39],"a":[11],"substructure-based":[12],"classification":[13,23,51,95],"algorithm":[14],"that":[15,49,98],"decouples":[16],"substructure":[18],"discovery":[19,30,82],"process":[20],"from":[21],"model":[24,52],"construction":[25],"and":[26,36,104],"uses":[27],"frequent":[28,80],"subgraph":[29,81],"algorithms":[31,83],"to":[32,62,113],"find":[33],"all":[34,54],"topological":[35],"geometric":[37],"substructures":[38,56],"in":[40],"dataset.":[42],"The":[43,69],"advantage":[44],"our":[46,99],"approach":[47,100],"is":[48,72,101],"during":[50],"construction,":[53],"relevant":[55],"are":[57],"available":[58],"allowing":[59],"classifier":[61],"intelligently":[63],"select":[64],"most":[66],"discriminating":[67],"ones.":[68],"computational":[70],"scalability":[71],"ensured":[73],"by":[74,111],"use":[76],"highly":[78],"efficient":[79],"coupled":[84],"with":[85],"aggressive":[86],"feature":[87],"selection.":[88],"Our":[89],"experimental":[90],"evaluation":[91],"on":[92,105],"eight":[93],"different":[94],"problems":[96],"shows":[97],"computationally":[102],"scalable":[103],"average,":[107],"outperforms":[108],"existing":[109],"schemes":[110],"10%":[112],"35%.":[114]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":5},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":5},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":4},{"year":2015,"cited_by_count":4},{"year":2014,"cited_by_count":7},{"year":2013,"cited_by_count":3},{"year":2012,"cited_by_count":14}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
