{"id":"https://openalex.org/W2133733197","doi":"https://doi.org/10.1109/csb.2003.1227302","title":"Clustering binary fingerprint vectors with missing values for DNA array data analysis","display_name":"Clustering binary fingerprint vectors with missing values for DNA array data analysis","publication_year":2004,"publication_date":"2004-03-23","ids":{"openalex":"https://openalex.org/W2133733197","doi":"https://doi.org/10.1109/csb.2003.1227302","mag":"2133733197"},"language":"en","primary_location":{"id":"doi:10.1109/csb.2003.1227302","is_oa":false,"landing_page_url":"https://doi.org/10.1109/csb.2003.1227302","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computational Systems Bioinformatics. CSB2003. Proceedings of the 2003 IEEE Bioinformatics Conference. CSB2003","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5025492477","display_name":"A. Figueroa","orcid":"https://orcid.org/0000-0002-9417-855X"},"institutions":[{"id":"https://openalex.org/I103635307","display_name":"University of California, Riverside","ror":"https://ror.org/03nawhv43","country_code":"US","type":"education","lineage":["https://openalex.org/I103635307"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"A. Figueroa","raw_affiliation_strings":["Department of Computer Sci, University of California, Riverside, USA","Dept. of Comput. Sci., California, Univ., Riverside, CA, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Sci, University of California, Riverside, USA","institution_ids":["https://openalex.org/I103635307"]},{"raw_affiliation_string":"Dept. of Comput. Sci., California, Univ., Riverside, CA, USA","institution_ids":["https://openalex.org/I103635307"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020920809","display_name":"James Borneman","orcid":"https://orcid.org/0000-0003-0661-4970"},"institutions":[{"id":"https://openalex.org/I103635307","display_name":"University of California, Riverside","ror":"https://ror.org/03nawhv43","country_code":"US","type":"education","lineage":["https://openalex.org/I103635307"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"J. Borneman","raw_affiliation_strings":["Department of Plant Pathology, University of California, Riverside, USA","Univ. of Calif., Riverside"],"affiliations":[{"raw_affiliation_string":"Department of Plant Pathology, University of California, Riverside, USA","institution_ids":["https://openalex.org/I103635307"]},{"raw_affiliation_string":"Univ. of Calif., Riverside","institution_ids":["https://openalex.org/I103635307"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101911266","display_name":"Tao Jiang","orcid":"https://orcid.org/0000-0003-3833-4498"},"institutions":[{"id":"https://openalex.org/I103635307","display_name":"University of California, Riverside","ror":"https://ror.org/03nawhv43","country_code":"US","type":"education","lineage":["https://openalex.org/I103635307"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"T. Jiang","raw_affiliation_strings":["Department of Computer Sci, University of California, Riverside, USA","Univ. of Calif., Riverside"],"affiliations":[{"raw_affiliation_string":"Department of Computer Sci, University of California, Riverside, USA","institution_ids":["https://openalex.org/I103635307"]},{"raw_affiliation_string":"Univ. of Calif., Riverside","institution_ids":["https://openalex.org/I103635307"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5025492477"],"corresponding_institution_ids":["https://openalex.org/I103635307"],"apc_list":null,"apc_paid":null,"fwci":0.5847,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.64807711,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"38","last_page":"47"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10885","display_name":"Gene expression and cancer classification","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10885","display_name":"Gene expression and cancer classification","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10222","display_name":"Genomics and Chromatin Dynamics","score":0.994700014591217,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11970","display_name":"Molecular Biology Techniques and Applications","score":0.9936000108718872,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.6972843408584595},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.53005450963974},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4678187072277069},{"id":"https://openalex.org/keywords/hierarchical-clustering","display_name":"Hierarchical clustering","score":0.43100759387016296},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3764793872833252},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3529456555843353},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3410775661468506}],"concepts":[{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.6972843408584595},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.53005450963974},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4678187072277069},{"id":"https://openalex.org/C92835128","wikidata":"https://www.wikidata.org/wiki/Q1277447","display_name":"Hierarchical clustering","level":3,"score":0.43100759387016296},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3764793872833252},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3529456555843353},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3410775661468506}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/csb.2003.1227302","is_oa":false,"landing_page_url":"https://doi.org/10.1109/csb.2003.1227302","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computational Systems Bioinformatics. CSB2003. Proceedings of the 2003 IEEE Bioinformatics Conference. CSB2003","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W156555589","https://openalex.org/W1769049279","https://openalex.org/W1866755320","https://openalex.org/W1969838199","https://openalex.org/W1977545325","https://openalex.org/W1981746357","https://openalex.org/W1989297334","https://openalex.org/W2028761382","https://openalex.org/W2033903399","https://openalex.org/W2039381534","https://openalex.org/W2052888257","https://openalex.org/W2054416990","https://openalex.org/W2113836695","https://openalex.org/W2115996640","https://openalex.org/W2118727666","https://openalex.org/W2125220573","https://openalex.org/W2135187880","https://openalex.org/W2137560895","https://openalex.org/W2146301357","https://openalex.org/W2150926065","https://openalex.org/W2152012752","https://openalex.org/W2154604426","https://openalex.org/W2158973107","https://openalex.org/W2159207877","https://openalex.org/W2486715098","https://openalex.org/W2542394219","https://openalex.org/W2611831635","https://openalex.org/W2612166593","https://openalex.org/W4285719527","https://openalex.org/W6637940469","https://openalex.org/W6638030395","https://openalex.org/W6664271236"],"related_works":["https://openalex.org/W2051487156","https://openalex.org/W2073681303","https://openalex.org/W2544423928","https://openalex.org/W2052122378","https://openalex.org/W2804364458","https://openalex.org/W2053286651","https://openalex.org/W4298130764","https://openalex.org/W2181743346","https://openalex.org/W2187401768","https://openalex.org/W2132641928"],"abstract_inverted_index":{"Oligonucleotide":[0],"fingerprinting":[1],"is":[2,44,240],"a":[3,91,126,154],"powerful":[4],"DNA":[5,27,53,103,231],"array":[6,54],"based":[7,164,246],"method":[8,43],"to":[9,62,132,187,262],"characterize":[10],"cDNA":[11],"and":[12,18,26,69,75,99,135,153,158,205,214,221],"ribosomal":[13],"RNA":[14],"gene":[15,23],"(rDNA)":[16],"libraries":[17],"has":[19],"many":[20],"applications":[21],"including":[22],"expression":[24],"profiling":[25],"clone":[28,232],"classification.":[29],"We":[30,144],"are":[31,82,96],"especially":[32],"interested":[33],"in":[34,41,113,140,251],"the":[35,42,45,59,119,137,141,146,180,190,210,263],"latter":[36],"application.":[37],"A":[38],"key":[39],"step":[40],"cluster":[46],"analysis":[47],"of":[48,58,121,149,175,179,253],"fingerprint":[49],"data":[50,95,207,229],"obtained":[51],"from":[52,230],"hybridization":[55,77],"experiments.":[56],"Most":[57],"existing":[60],"approaches":[61],"clustering":[63,120,151,223,244],"use":[64],"(normalized)":[65],"real":[66,206,228,248],"intensity":[67,249],"values":[68,112,139],"thus":[70],"do":[71],"not":[72],"treat":[73],"positive":[74],"negative":[76],"signals":[78,81],"equally":[79],"(positive":[80],"much":[83],"more":[84,241],"emphasized).":[85],"In":[86],"this":[87,114,150,237],"paper,":[88],"we":[89,117],"consider":[90],"discrete":[92,238],"approach.":[93],"Fingerprint":[94],"first":[97],"normalized":[98],"binarized":[100],"using":[101],"control":[102],"clones.":[104],"Because":[105],"there":[106],"may":[107],"exist":[108],"unresolved":[109],"(or":[110],"missing)":[111],"binarization":[115],"process,":[116],"formulate":[118],"(binary)":[122],"oligonucleotide":[123,265],"fingerprints":[124,142],"as":[125,193,195],"combinatorial":[127],"optimization":[128],"problem":[129,152],"that":[130,209,236,256],"attempts":[131],"identify":[133],"clusters":[134],"resolve":[136],"missing":[138],"simultaneously.":[143],"study":[145],"computational":[147],"complexity":[148],"natural":[155],"parameterized":[156],"version,":[157],"present":[159],"an":[160],"efficient":[161],"greedy":[162],"algorithm":[163,172,211],"on":[165,169,203,227,247],"minimum":[166],"clique":[167],"partition":[168],"graphs.":[170],"The":[171,225],"takes":[173],"advantage":[174],"some":[176,196,218],"unique":[177],"properties":[178],"graphs":[181],"considered":[182],"here,":[183],"which":[184],"allow":[185],"us":[186],"efficiently":[188],"find":[189],"maximum":[191],"cliques":[192],"well":[194],"special":[197],"maximal":[198],"cliques.":[199],"Our":[200],"experimental":[201],"results":[202,226],"simulated":[204],"demonstrate":[208],"runs":[212],"faster":[213],"performs":[215],"better":[216],"than":[217,243],"popular":[219],"hierarchical":[220],"graph-based":[222],"methods.":[224],"classification":[233],"also":[234],"suggest":[235],"approach":[239],"accurate":[242],"methods":[245],"values,":[250],"terms":[252],"separating":[254],"clones":[255],"have":[257],"different":[258],"characteristics":[259],"with":[260],"respect":[261],"given":[264],"probes.":[266]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
