{"id":"https://openalex.org/W3099485719","doi":"https://doi.org/10.1145/3388440.3412424","title":"MinIsoClust","display_name":"MinIsoClust","publication_year":2020,"publication_date":"2020-09-21","ids":{"openalex":"https://openalex.org/W3099485719","doi":"https://doi.org/10.1145/3388440.3412424","mag":"3099485719"},"language":"en","primary_location":{"id":"doi:10.1145/3388440.3412424","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3388440.3412424","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 11th ACM International Conference on Bioinformatics, Computational Biology and Health Informatics","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5011002061","display_name":"Sairam Behera","orcid":"https://orcid.org/0000-0002-9047-0203"},"institutions":[{"id":"https://openalex.org/I114395901","display_name":"University of Nebraska\u2013Lincoln","ror":"https://ror.org/043mer456","country_code":"US","type":"education","lineage":["https://openalex.org/I114395901"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Sairam Behera","raw_affiliation_strings":["Dept. of Computer Sc. &amp; Engineering, University of Nebraska-Lincoln, Lincoln, NE, USA"],"affiliations":[{"raw_affiliation_string":"Dept. of Computer Sc. &amp; Engineering, University of Nebraska-Lincoln, Lincoln, NE, USA","institution_ids":["https://openalex.org/I114395901"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071975084","display_name":"Jitender S. Deogun","orcid":"https://orcid.org/0000-0001-6402-2549"},"institutions":[{"id":"https://openalex.org/I114395901","display_name":"University of Nebraska\u2013Lincoln","ror":"https://ror.org/043mer456","country_code":"US","type":"education","lineage":["https://openalex.org/I114395901"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jitender S. Deogun","raw_affiliation_strings":["Dept. of Computer Sc. &amp; Engineering, University of Nebraska-Lincoln, Lincoln, NE, USA"],"affiliations":[{"raw_affiliation_string":"Dept. of Computer Sc. &amp; Engineering, University of Nebraska-Lincoln, Lincoln, NE, USA","institution_ids":["https://openalex.org/I114395901"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5038951436","display_name":"Etsuko N. Moriyama","orcid":"https://orcid.org/0000-0003-1672-5818"},"institutions":[{"id":"https://openalex.org/I114395901","display_name":"University of Nebraska\u2013Lincoln","ror":"https://ror.org/043mer456","country_code":"US","type":"education","lineage":["https://openalex.org/I114395901"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Etsuko N. Moriyama","raw_affiliation_strings":["School of Biological Sciences, Center for Plant Science Innovation, University of Nebraska-Lincoln, Lincoln, NE, USA"],"affiliations":[{"raw_affiliation_string":"School of Biological Sciences, Center for Plant Science Innovation, University of Nebraska-Lincoln, Lincoln, NE, USA","institution_ids":["https://openalex.org/I114395901"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5011002061"],"corresponding_institution_ids":["https://openalex.org/I114395901"],"apc_list":null,"apc_paid":null,"fwci":0.1657,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.5056946,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"7"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10521","display_name":"RNA and protein synthesis mechanisms","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11482","display_name":"RNA modifications and cancer","score":0.9904000163078308,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.6744405031204224},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6445941925048828},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.6144197583198547},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5771393179893494},{"id":"https://openalex.org/keywords/gene-isoform","display_name":"Gene isoform","score":0.5045841932296753},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.4239964485168457},{"id":"https://openalex.org/keywords/hash-function","display_name":"Hash function","score":0.41038793325424194},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.29649847745895386},{"id":"https://openalex.org/keywords/gene","display_name":"Gene","score":0.21002784371376038},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.170305073261261},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.15602612495422363}],"concepts":[{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.6744405031204224},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6445941925048828},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.6144197583198547},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5771393179893494},{"id":"https://openalex.org/C53345823","wikidata":"https://www.wikidata.org/wiki/Q5531554","display_name":"Gene isoform","level":3,"score":0.5045841932296753},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.4239964485168457},{"id":"https://openalex.org/C99138194","wikidata":"https://www.wikidata.org/wiki/Q183427","display_name":"Hash function","level":2,"score":0.41038793325424194},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.29649847745895386},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.21002784371376038},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.170305073261261},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.15602612495422363},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3388440.3412424","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3388440.3412424","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 11th ACM International Conference on Bioinformatics, Computational Biology and Health Informatics","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W1455310343","https://openalex.org/W1566352582","https://openalex.org/W1736726159","https://openalex.org/W1922411861","https://openalex.org/W1983924599","https://openalex.org/W2011920499","https://openalex.org/W2025857851","https://openalex.org/W2081193615","https://openalex.org/W2100305481","https://openalex.org/W2101234009","https://openalex.org/W2104005232","https://openalex.org/W2123845384","https://openalex.org/W2156125289","https://openalex.org/W2164883482","https://openalex.org/W2167865654","https://openalex.org/W2574633002","https://openalex.org/W2618735189","https://openalex.org/W2808736068","https://openalex.org/W2949600294","https://openalex.org/W2950150251","https://openalex.org/W2950287694","https://openalex.org/W2950954328","https://openalex.org/W2953174564","https://openalex.org/W2955167895","https://openalex.org/W2995527562","https://openalex.org/W2997591727","https://openalex.org/W3170515990","https://openalex.org/W4235169531","https://openalex.org/W6675354045"],"related_works":["https://openalex.org/W1540936366","https://openalex.org/W2079625624","https://openalex.org/W2004254765","https://openalex.org/W2126407448","https://openalex.org/W2125691904","https://openalex.org/W200174347","https://openalex.org/W2048132363","https://openalex.org/W2953122964","https://openalex.org/W1971262350","https://openalex.org/W2507850257"],"abstract_inverted_index":{"With":[0],"the":[1,34],"advent":[2],"of":[3,10,26,36,54,64,89,93,116,126,159,168],"next-generation":[4],"sequencing":[5],"technologies,":[6],"computational":[7,160],"transcriptome":[8,28],"assembly":[9,29],"RNA-Seq":[11],"data":[12],"has":[13],"become":[14],"a":[15,90,98,106],"critical":[16],"step":[17],"in":[18,48,157],"many":[19,53],"biological":[20,51],"and":[21,42,113,147,155,162],"biomedical":[22],"studies.":[23],"The":[24,136,165],"accuracy":[25],"these":[27],"methods":[30],"is":[31,45,78,170],"hindered":[32],"by":[33],"presence":[35],"alternatively":[37],"spliced":[38],"transcripts":[39],"(isoforms).":[40],"Identifying":[41],"quantifying":[43],"isoforms":[44],"also":[46,96,150],"essential":[47],"understanding":[49],"complex":[50],"functions,":[52],"which":[55],"are":[56,75],"often":[57,79],"associated":[58],"with":[59],"various":[60],"diseases.":[61],"However,":[62],"clustering":[63,115],"isoform":[65],"sequences":[66,95,118],"using":[67,133],"only":[68],"sequence":[69],"identities":[70],"when":[71],"quality":[72],"reference":[73],"genomes":[74],"not":[76],"available":[77,172],"difficult":[80],"due":[81],"to":[82,123],"heterogeneous":[83],"exon":[84],"composition":[85],"among":[86],"isoforms.":[87,127],"Clustering":[88],"large":[91],"number":[92],"transcript":[94,117],"requires":[97],"scalable":[99],"technique.":[100],"In":[101],"this":[102,130],"study,":[103],"we":[104],"propose":[105],"minwise-hashing":[107],"based":[108],"method,":[109],"MinIsoClust,":[110],"for":[111],"fast":[112],"accurate":[114,143],"that":[119,139],"can":[120],"be":[121],"used":[122],"identify":[124],"groups":[125],"We":[128],"tested":[129],"new":[131],"method":[132],"simulated":[134],"datasets.":[135],"results":[137],"demonstrated":[138],"MinIso-Clust":[140],"was":[141],"more":[142],"than":[144,153],"CD-HIT-EST,":[145],"isONclust,":[146],"MM-seqs2/Linclust.":[148],"MinIsoClust":[149,169],"performed":[151],"better":[152],"isONclust":[154],"MMseqs2/Linclust":[156],"terms":[158],"time":[161],"space":[163],"efficiency.":[164],"source":[166],"codes":[167],"freely":[171],"at":[173],"https://github.com/srbehera/MinIsoClust.":[174]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2020,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2020-11-23T00:00:00"}
