{"id":"https://openalex.org/W3046173909","doi":"https://doi.org/10.13016/g6vf-gqke","title":"Applications of Graph Segmentation Algorithms For Quantitative Genomic Analyses","display_name":"Applications of Graph Segmentation Algorithms For Quantitative Genomic Analyses","publication_year":2020,"publication_date":"2020-01-01","ids":{"openalex":"https://openalex.org/W3046173909","doi":"https://doi.org/10.13016/g6vf-gqke","mag":"3046173909"},"language":"en","primary_location":{"id":"mag:3046173909","is_oa":false,"landing_page_url":"https://drum.lib.umd.edu/handle/1903/26145","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":null},"type":"dissertation","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.13016/g6vf-gqke","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5078592550","display_name":"Mohamed K. Gunady","orcid":"https://orcid.org/0000-0002-5027-9279"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Gunady, Mohamed","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5078592550"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10885","display_name":"Gene expression and cancer classification","score":0.9908000230789185,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10885","display_name":"Gene expression and cancer classification","score":0.9908000230789185,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9363999962806702,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.47240275144577026},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.4666343331336975},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.4210956394672394},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.40653958916664124},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3269270658493042},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.3251211643218994},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.2688477039337158},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.16744494438171387}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.47240275144577026},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.4666343331336975},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.4210956394672394},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.40653958916664124},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3269270658493042},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.3251211643218994},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2688477039337158},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.16744494438171387}],"mesh":[],"locations_count":2,"locations":[{"id":"mag:3046173909","is_oa":false,"landing_page_url":"https://drum.lib.umd.edu/handle/1903/26145","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":null},{"id":"doi:10.13016/g6vf-gqke","is_oa":true,"landing_page_url":"https://doi.org/10.13016/g6vf-gqke","pdf_url":null,"source":{"id":"https://openalex.org/S4306402644","display_name":"Digital Repository at the University of Maryland (University of Maryland College Park)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I66946132","host_organization_name":"University of Maryland, College Park","host_organization_lineage":["https://openalex.org/I66946132"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"thesis"}],"best_oa_location":{"id":"doi:10.13016/g6vf-gqke","is_oa":true,"landing_page_url":"https://doi.org/10.13016/g6vf-gqke","pdf_url":null,"source":{"id":"https://openalex.org/S4306402644","display_name":"Digital Repository at the University of Maryland (University of Maryland College Park)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I66946132","host_organization_name":"University of Maryland, College Park","host_organization_lineage":["https://openalex.org/I66946132"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"thesis"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2768520257","https://openalex.org/W2794692603","https://openalex.org/W2188510933","https://openalex.org/W2905498282","https://openalex.org/W207237548","https://openalex.org/W1987165735","https://openalex.org/W2910124299","https://openalex.org/W1539969737","https://openalex.org/W2542804967","https://openalex.org/W1990984714","https://openalex.org/W2789213053","https://openalex.org/W1564526305","https://openalex.org/W3163742664","https://openalex.org/W3141102284","https://openalex.org/W3150704150","https://openalex.org/W2111932463","https://openalex.org/W3108887057","https://openalex.org/W1542280544","https://openalex.org/W1764533123","https://openalex.org/W644277551"],"abstract_inverted_index":{"There":[0],"is":[1,63,306,403],"a":[2,21,82,90,96,103,110,202,237,392,399,420,482],"growing":[3],"interest":[4],"in":[5,12,44,188,201,236,255,269,284,313,383,430,455,489,516,519,544],"utilizing":[6],"graph":[7,42,303,349],"formulations":[8],"and":[9,23,50,120,138,161,168,186,337,378,416,419,521,547],"graph-based":[10,333],"algorithms":[11,200],"different":[13],"subproblems":[14],"of":[15,26,28,47,56,85,89,105,135,172,180,196,205,243,253,273,281,301,351,360,369,422,436,452,468,495,532],"genomic":[16,324],"analysis.":[17,439],"Since":[18],"graphs":[19,311],"provide":[20,169],"natural":[22],"efficient":[24,141,348],"representation":[25,350],"sequences":[27,150],"data":[29,62,381,458,470,488],"where":[30],"some":[31,41,323],"structural":[32,121],"relationships":[33,122],"are":[34,80,335,413],"observed":[35,245],"within":[36],"the":[37,66,77,86,133,165,173,191,194,241,244,251,270,274,279,290,294,347,356,367,376,396,434,469,493,509,529,545,549],"data,":[38,491,546],"we":[39,131,209,249,365,443],"study":[40],"applications":[43],"quantitative":[45],"analysis":[46,325],"typical":[48],"RNA-seq":[49,61,70,206,286,554],"Whole":[51,314],"Genome":[52,315],"Sequencing":[53,316],"pipelines.":[54],"Analysis":[55],"differential":[57],"alternative":[58,162],"splicing":[59,163],"from":[60,109,217],"complicated":[64],"by":[65,278,464,525],"fact":[67],"that":[68,225,239,266,502],"many":[69],"reads":[71],"map":[72],"to":[73,101,157,231,292,427,448,479,486,508],"multiple":[74],"transcripts,":[75],"besides,":[76],"annotated":[78,275],"transcripts":[79,88,124,233,276,283,296],"often":[81],"small":[83],"subset":[84],"possible":[87],"gene.":[91],"This":[92],"work":[93,473],"describes":[94],"Yanagi,":[95],"tool":[97],"for":[98,143,175,193,322,374],"segmenting":[99],"transcriptomes":[100],"create":[102],"library":[104,116],"maximal":[106],"L-disjoint":[107],"segments":[108,174,341],"complete":[111],"transcriptome":[112,118,136,212],"annotation.":[113],"That":[114],"segment":[115,145,149,166,227],"preserves":[117],"substrings":[119],"between":[123],"while":[125,288,354,513],"eliminating":[126],"unnecessary":[127],"sequence":[128],"duplications.":[129],"First,":[130],"formalize":[132],"concept":[134],"segmentation":[137,182,304],"propose":[139,261,444],"an":[140,222,256,262,285,445,466,477],"algorithm":[142,224],"generating":[144],"libraries.":[146],"The":[147,178,472],"resulting":[148],"can":[151,214,319],"be":[152,215,320],"used":[153,312],"with":[154,346,433,551],"pseudo-alignment":[155,199],"tools":[156],"quantify":[158],"gene":[159],"expression":[160,380],"at":[164],"level":[167],"gene-level":[170],"visualization":[171],"more":[176],"interpretability.":[177],"notion":[179],"transcript":[181],"as":[183,229],"introduced":[184],"here":[185,475],"implemented":[187],"Yanagi":[189],"opens":[190],"door":[192],"application":[195],"lightweight,":[197],"ultra-fast":[198],"wide":[203],"variety":[204],"analyses.":[207],"Furthermore,":[208],"show":[210,501],"how":[211],"quantification":[213,254],"performed":[216],"segment-level":[218],"statistics.":[219],"We":[220,260],"present":[221],"EM":[223],"uses":[226],"counts":[228,451],"features":[230],"estimate":[232],"relative":[234],"abundances":[235,272],"way":[238],"maximizes":[240],"likelihood":[242],"sequenced":[246],"data.":[247,499,523],"Then":[248],"tackle":[250],"problem":[252],"incomplete":[257],"annotation":[258],"setting.":[259],"assembly-free":[263],"correction":[264],"procedure":[265],"reduces":[267],"bias":[268],"estimated":[271],"caused":[277],"presence":[280],"unannotated":[282],"sample,":[287],"avoiding":[289,355],"need":[291],"assemble":[293],"missing":[295],"first.":[297],"Another":[298],"use":[299,368],"case":[300],"our":[302],"approach":[305,478],"representing":[307],"population":[308,352,401],"reference":[309],"genome":[310],"(WGS),":[317],"which":[318,402],"crucial":[321],"studying":[326],"highly":[327],"polymorphic":[328],"genes":[329,454],"like":[330],"HLA.":[331],"Usually":[332],"aligners":[334],"slow":[336],"computationally":[338],"demanding.":[339],"Using":[340],"empowers":[342],"any":[343],"linear":[344],"aligner":[345],"variations,":[353],"expensive":[357],"computational":[358],"overhead":[359],"aligning":[361],"over":[362],"graphs.":[363],"Lastly,":[364],"explore":[366],"Generative":[370,460],"Adversarial":[371,461],"Networks":[372,462],"(GANs)":[373,463],"imputing":[375,496],"sparse":[377],"noisy":[379,415],"obtained":[382],"single":[384,456,497],"cell":[385,400,457,498,533],"RNA":[386],"sequencing":[387],"(scRNA-seq)":[388],"experiments.":[389,555],"scRNA-seq":[390],"provides":[391,535],"rich":[393],"view":[394],"into":[395,492],"heterogeneity":[397],"underlying":[398,530],"usually":[404,414],"lost":[405],"when":[406],"performing":[407],"bulk":[408,553],"RNA-seq.":[409],"However,":[410],"these":[411,431],"datasets":[412,432],"very":[417],"sparse,":[418],"number":[421],"methods":[423],"have":[424],"been":[425],"proposed":[426],"impute":[428,449,487],"zeros":[429],"goal":[435],"improving":[437],"downstream":[438],"In":[440],"this":[441],"work,":[442],"approach,":[446],"scGAIN,":[447],"zero":[450],"dropout":[453],"using":[459],"learning":[465],"approximation":[467],"distribution.":[471],"presented":[474],"discusses":[476],"adopt":[480],"GAIN,":[481],"GAN":[483],"model":[484],"developed":[485],"image":[490],"domain":[494],"Experiments":[500],"scGAIN":[503,526],"gives":[504],"competitive":[505],"results":[506],"compared":[507],"state-of-the-art":[510],"imputation":[511],"approaches":[512],"showing":[514],"superiority":[515],"various":[517],"aspects":[518],"simulation":[520],"real":[522],"Imputation":[524],"successfully":[527],"recovers":[528],"clustering":[531],"sub-populations,":[534],"sharp":[536],"estimates":[537],"around":[538],"true":[539],"mean":[540],"expression,":[541],"reducing":[542],"variability":[543],"increases":[548],"correspondence":[550],"matched":[552]},"counts_by_year":[],"updated_date":"2025-11-06T06:51:31.235846","created_date":"2025-10-10T00:00:00"}
