{"id":"https://openalex.org/W2046591130","doi":"https://doi.org/10.1109/gensips.2012.6507733","title":"MiB: A comparative assembly processing pipeline","display_name":"MiB: A comparative assembly processing pipeline","publication_year":2012,"publication_date":"2012-12-01","ids":{"openalex":"https://openalex.org/W2046591130","doi":"https://doi.org/10.1109/gensips.2012.6507733","mag":"2046591130"},"language":"en","primary_location":{"id":"doi:10.1109/gensips.2012.6507733","is_oa":false,"landing_page_url":"https://doi.org/10.1109/gensips.2012.6507733","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings 2012 IEEE International Workshop on Genomic Signal Processing and Statistics (GENSIPS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5051600305","display_name":"Bilal Wajid","orcid":"https://orcid.org/0000-0003-0220-7788"},"institutions":[{"id":"https://openalex.org/I91045830","display_name":"Texas A&M University","ror":"https://ror.org/01f5ytq51","country_code":"US","type":"education","lineage":["https://openalex.org/I91045830"]},{"id":"https://openalex.org/I142732210","display_name":"University of Engineering and Technology Lahore","ror":"https://ror.org/0051w2v06","country_code":"PK","type":"education","lineage":["https://openalex.org/I142732210"]}],"countries":["PK","US"],"is_corresponding":true,"raw_author_name":"Bilal Wajid","raw_affiliation_strings":["Department of Electrical Engineering, University of Engineering & Technology, Lahore, Punjab, Pakistan","Department of Electrical and Computer Engineering, Texas A&M University, College Station, TX, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, University of Engineering & Technology, Lahore, Punjab, Pakistan","institution_ids":["https://openalex.org/I142732210"]},{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Texas A&M University, College Station, TX, USA","institution_ids":["https://openalex.org/I91045830"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034213361","display_name":"Erchin Serpedin","orcid":"https://orcid.org/0000-0001-9069-770X"},"institutions":[{"id":"https://openalex.org/I91045830","display_name":"Texas A&M University","ror":"https://ror.org/01f5ytq51","country_code":"US","type":"education","lineage":["https://openalex.org/I91045830"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Erchin Serpedin","raw_affiliation_strings":["Department of Electrical and Computer Engineering, Texas A&M University, College Station, TX, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Texas A&M University, College Station, TX, USA","institution_ids":["https://openalex.org/I91045830"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056444635","display_name":"Mohamed Nounou","orcid":"https://orcid.org/0000-0003-0520-9623"},"institutions":[{"id":"https://openalex.org/I58152225","display_name":"Texas A&M University at Qatar","ror":"https://ror.org/03vb4dm14","country_code":"QA","type":"education","lineage":["https://openalex.org/I58152225","https://openalex.org/I91045830"]}],"countries":["QA"],"is_corresponding":false,"raw_author_name":"Mohamed Nounou","raw_affiliation_strings":["Department of Chemical Engineering, Texas A&M University, Doha, Qatar"],"affiliations":[{"raw_affiliation_string":"Department of Chemical Engineering, Texas A&M University, Doha, Qatar","institution_ids":["https://openalex.org/I58152225"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5025512804","display_name":"Hazem Nounou","orcid":"https://orcid.org/0000-0001-8075-1581"},"institutions":[{"id":"https://openalex.org/I58152225","display_name":"Texas A&M University at Qatar","ror":"https://ror.org/03vb4dm14","country_code":"QA","type":"education","lineage":["https://openalex.org/I58152225","https://openalex.org/I91045830"]}],"countries":["QA"],"is_corresponding":false,"raw_author_name":"Hazem Nounou","raw_affiliation_strings":["Department of Electrical and Computer Engineering, Texas A&M University, Doha, Qatar"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Texas A&M University, Doha, Qatar","institution_ids":["https://openalex.org/I58152225"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5051600305"],"corresponding_institution_ids":["https://openalex.org/I142732210","https://openalex.org/I91045830"],"apc_list":null,"apc_paid":null,"fwci":0.394,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.61109957,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"86","last_page":"89"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10521","display_name":"RNA and protein synthesis mechanisms","score":0.9936000108718872,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reference-genome","display_name":"Reference genome","score":0.7546141743659973},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.6553286910057068},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5891373157501221},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5740615725517273},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.5452384352684021},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.4892466068267822},{"id":"https://openalex.org/keywords/sequence-assembly","display_name":"Sequence assembly","score":0.47484901547431946},{"id":"https://openalex.org/keywords/minimum-description-length","display_name":"Minimum description length","score":0.46570947766304016},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.4629690647125244},{"id":"https://openalex.org/keywords/genome","display_name":"Genome","score":0.4595905542373657},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.45119142532348633},{"id":"https://openalex.org/keywords/k-mer","display_name":"k-mer","score":0.42268335819244385},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.3575848340988159},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3346971273422241},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.2816716134548187},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2524556517601013},{"id":"https://openalex.org/keywords/gene","display_name":"Gene","score":0.1295117735862732}],"concepts":[{"id":"https://openalex.org/C192953774","wikidata":"https://www.wikidata.org/wiki/Q7307127","display_name":"Reference genome","level":4,"score":0.7546141743659973},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.6553286910057068},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5891373157501221},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5740615725517273},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.5452384352684021},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.4892466068267822},{"id":"https://openalex.org/C18949551","wikidata":"https://www.wikidata.org/wiki/Q740578","display_name":"Sequence assembly","level":5,"score":0.47484901547431946},{"id":"https://openalex.org/C87465248","wikidata":"https://www.wikidata.org/wiki/Q1417790","display_name":"Minimum description length","level":2,"score":0.46570947766304016},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4629690647125244},{"id":"https://openalex.org/C141231307","wikidata":"https://www.wikidata.org/wiki/Q7020","display_name":"Genome","level":3,"score":0.4595905542373657},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.45119142532348633},{"id":"https://openalex.org/C2279292","wikidata":"https://www.wikidata.org/wiki/Q6322851","display_name":"k-mer","level":4,"score":0.42268335819244385},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.3575848340988159},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3346971273422241},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.2816716134548187},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2524556517601013},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.1295117735862732},{"id":"https://openalex.org/C162317418","wikidata":"https://www.wikidata.org/wiki/Q252857","display_name":"Transcriptome","level":4,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C150194340","wikidata":"https://www.wikidata.org/wiki/Q26972","display_name":"Gene expression","level":3,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/gensips.2012.6507733","is_oa":false,"landing_page_url":"https://doi.org/10.1109/gensips.2012.6507733","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings 2012 IEEE International Workshop on Genomic Signal Processing and Statistics (GENSIPS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":11,"referenced_works":["https://openalex.org/W1559448277","https://openalex.org/W1995839104","https://openalex.org/W2001792012","https://openalex.org/W2024112220","https://openalex.org/W2054658115","https://openalex.org/W2099111195","https://openalex.org/W2169002484","https://openalex.org/W2552720424","https://openalex.org/W2991116385","https://openalex.org/W3123545922","https://openalex.org/W6770729006"],"related_works":["https://openalex.org/W4210830088","https://openalex.org/W2131823082","https://openalex.org/W1995839104","https://openalex.org/W2484133401","https://openalex.org/W2216477337","https://openalex.org/W2115501618","https://openalex.org/W2772185703","https://openalex.org/W3011183076","https://openalex.org/W2767590279","https://openalex.org/W3090794301"],"abstract_inverted_index":{"This":[0],"paper":[1],"introduces":[2],"MiB,":[3,164],"a":[4,48,103],"comparative":[5],"genome":[6,186,195],"assembly":[7,50],"pipeline":[8],"that":[9,75,91,108],"uses":[10,85,127,135],"three":[11],"key":[12],"steps.":[13],"The":[14,31,66,82,124],"first":[15],"step":[16],"involves":[17],"choosing":[18],"the":[19,25,37,45,54,60,63,71,79,86,96,110,113,143,152,156,160,167,174,179,184,189,193,223],"best":[20,38,157],"reference":[21,39,64,80,97,114,176,190],"sequence":[22,40,98,115,177,191],"by":[23,51,196],"using":[24,207,210,217],"Minimum":[26],"Description":[27],"Length":[28],"(MDL)":[29],"principle.":[30],"MDL":[32,67],"principle":[33,68],"not":[34,93],"only":[35],"chooses":[36],"(model)":[41],"but":[42],"also":[43,69],"fine-tunes":[44],"model":[46],"for":[47,130,139,146],"better":[49],"rectifying":[52,199],"all":[53],"inversions":[55,204],"and":[56,116,149,159,178,187,205,212],"removing":[57,197],"most":[58],"of":[59,73,89,142,169,181,202,222],"insertions":[61,206],"from":[62,166,183],"sequence.":[65,81,162],"identifies":[70],"set":[72,88,180,201],"reads":[74,90,182],"could":[76],"align":[77,94],"to":[78,95,102,154,172],"second":[83],"stage":[84,126],"same":[87],"did":[92],"as":[99],"an":[100],"input":[101],"de-Buijn":[104],"graph":[105],"based":[106],"algorithm":[107],"Identifies":[109],"Deletions":[111],"in":[112],"then":[117,150],"Inserts":[118],"Them":[119],"at":[120],"Appropriate":[121],"Places":[122],"(IDITAP).":[123],"last":[125],"Bayesian":[128],"Estimation":[129],"Comparative":[131],"Assembly":[132],"(BECA).":[133],"BECA":[134],"Quality":[136],"(Q-)":[137],"values":[138],"identifying":[140],"probabilities":[141],"base":[144],"calls":[145],"every":[147],"read":[148],"exploits":[151],"Q-values":[153],"find":[155],"alignments":[158],"consensus":[161],"Therefore,":[163],"derived":[165],"use":[168],"MDL-IDITAP-BECA":[170],"aims":[171],"take":[173],"optimal":[175],"unassembled":[185],"transform":[188],"into":[192],"novel":[194],"or":[198],"four":[200],"mutations:":[203],"MDL,":[208],"deletions":[209],"IDITAP":[211],"Single":[213],"Nucleotide":[214],"Polymorphisms":[215],"(SNPs)":[216],"BECA.":[218],"Preliminary":[219],"test":[220],"results":[221],"proposed":[224],"framework":[225],"revealed":[226],"promising":[227],"results.":[228]},"counts_by_year":[{"year":2021,"cited_by_count":1},{"year":2016,"cited_by_count":1},{"year":2014,"cited_by_count":1},{"year":2013,"cited_by_count":1},{"year":2012,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
