{"id":"https://openalex.org/W4283788459","doi":"https://doi.org/10.1093/bib/bbac252","title":"LmTag: functional-enrichment and imputation-aware tag SNP selection for population-specific genotyping arrays","display_name":"LmTag: functional-enrichment and imputation-aware tag SNP selection for population-specific genotyping arrays","publication_year":2022,"publication_date":"2022-07-02","ids":{"openalex":"https://openalex.org/W4283788459","doi":"https://doi.org/10.1093/bib/bbac252","pmid":"https://pubmed.ncbi.nlm.nih.gov/35780383"},"language":"en","primary_location":{"id":"doi:10.1093/bib/bbac252","is_oa":false,"landing_page_url":"https://doi.org/10.1093/bib/bbac252","pdf_url":null,"source":{"id":"https://openalex.org/S91767247","display_name":"Briefings in Bioinformatics","issn_l":"1467-5463","issn":["1467-5463","1477-4054"],"is_oa":false,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311648","host_organization_name":"Oxford University Press","host_organization_lineage":["https://openalex.org/P4310311648","https://openalex.org/P4310311647"],"host_organization_lineage_names":["Oxford University Press","University of Oxford"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Briefings in Bioinformatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5020547925","display_name":"Dat Nguyen","orcid":"https://orcid.org/0000-0003-3852-9578"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Dat Thanh Nguyen","raw_affiliation_strings":["Center for Biomedical Informatics, Vingroup Big Data Institute , 458 Minh Khai, 10000, Hanoi, Vietnam"],"raw_orcid":"https://orcid.org/0000-0003-3852-9578","affiliations":[{"raw_affiliation_string":"Center for Biomedical Informatics, Vingroup Big Data Institute , 458 Minh Khai, 10000, Hanoi, Vietnam","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034599952","display_name":"Quan Nguyen","orcid":"https://orcid.org/0000-0001-7870-5703"},"institutions":[{"id":"https://openalex.org/I165143802","display_name":"The University of Queensland","ror":"https://ror.org/00rqy9422","country_code":"AU","type":"education","lineage":["https://openalex.org/I165143802"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Quan Hoang Nguyen","raw_affiliation_strings":["Institute for Molecular Bioscience, University of Queensland , st Lucia, QLD 4067, Brisbane, Australia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute for Molecular Bioscience, University of Queensland , st Lucia, QLD 4067, Brisbane, Australia","institution_ids":["https://openalex.org/I165143802"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025792398","display_name":"Nguy\u1ec5n Th\u00f9y D\u01b0\u01a1ng","orcid":"https://orcid.org/0000-0001-8691-9138"},"institutions":[{"id":"https://openalex.org/I70349855","display_name":"Vietnam Academy of Science and Technology","ror":"https://ror.org/02wsd5p50","country_code":"VN","type":"government","lineage":["https://openalex.org/I70349855"]}],"countries":["VN"],"is_corresponding":false,"raw_author_name":"Nguyen Thuy Duong","raw_affiliation_strings":["Center for Biomedical Informatics, Vingroup Big Data Institute , 458 Minh Khai, 10000, Hanoi, Vietnam","Institute of Genome Research, Vietnam Academy of Science and Technology , 18 Hoang Quoc Viet, 10000, Hanoi, Vietnam"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Center for Biomedical Informatics, Vingroup Big Data Institute , 458 Minh Khai, 10000, Hanoi, Vietnam","institution_ids":[]},{"raw_affiliation_string":"Institute of Genome Research, Vietnam Academy of Science and Technology , 18 Hoang Quoc Viet, 10000, Hanoi, Vietnam","institution_ids":["https://openalex.org/I70349855"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5043745628","display_name":"Nam S. Vo","orcid":"https://orcid.org/0000-0002-5454-9176"},"institutions":[{"id":"https://openalex.org/I4210142044","display_name":"VinUniversity","ror":"https://ror.org/052dmdr17","country_code":"VN","type":"education","lineage":["https://openalex.org/I4210142044"]}],"countries":["VN"],"is_corresponding":true,"raw_author_name":"Nam S Vo","raw_affiliation_strings":["Center for Biomedical Informatics, Vingroup Big Data Institute , 458 Minh Khai, 10000, Hanoi, Vietnam","College of Engineering and Computer Science, VinUniversity , Vinhomes Ocean Park, 10000, Hanoi, Vietnam"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Center for Biomedical Informatics, Vingroup Big Data Institute , 458 Minh Khai, 10000, Hanoi, Vietnam","institution_ids":[]},{"raw_affiliation_string":"College of Engineering and Computer Science, VinUniversity , Vinhomes Ocean Park, 10000, Hanoi, Vietnam","institution_ids":["https://openalex.org/I4210142044"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5020547925","https://openalex.org/A5043745628"],"corresponding_institution_ids":["https://openalex.org/I4210142044"],"apc_list":{"value":4011,"currency":"USD","value_usd":4011},"apc_paid":null,"fwci":1.3049,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.81516151,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"23","issue":"4","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10261","display_name":"Genetic Associations and Epidemiology","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1311","display_name":"Genetics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10261","display_name":"Genetic Associations and Epidemiology","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1311","display_name":"Genetics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10594","display_name":"Genetic and phenotypic traits in livestock","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1311","display_name":"Genetics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10885","display_name":"Gene expression and cancer classification","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/imputation","display_name":"Imputation (statistics)","score":0.8398894667625427},{"id":"https://openalex.org/keywords/genotyping","display_name":"Genotyping","score":0.7069253921508789},{"id":"https://openalex.org/keywords/snp","display_name":"SNP","score":0.5631860494613647},{"id":"https://openalex.org/keywords/single-nucleotide-polymorphism","display_name":"Single-nucleotide polymorphism","score":0.5572211742401123},{"id":"https://openalex.org/keywords/snp-genotyping","display_name":"SNP genotyping","score":0.5294727087020874},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.4822476804256439},{"id":"https://openalex.org/keywords/genomics","display_name":"Genomics","score":0.4623711109161377},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.4444512724876404},{"id":"https://openalex.org/keywords/genome-wide-association-study","display_name":"Genome-wide association study","score":0.42833849787712097},{"id":"https://openalex.org/keywords/genome","display_name":"Genome","score":0.35514694452285767},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.348824679851532},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.3061424493789673},{"id":"https://openalex.org/keywords/genotype","display_name":"Genotype","score":0.2567136883735657},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.11198225617408752},{"id":"https://openalex.org/keywords/gene","display_name":"Gene","score":0.08985933661460876},{"id":"https://openalex.org/keywords/missing-data","display_name":"Missing data","score":0.08486589789390564}],"concepts":[{"id":"https://openalex.org/C58041806","wikidata":"https://www.wikidata.org/wiki/Q1660484","display_name":"Imputation (statistics)","level":3,"score":0.8398894667625427},{"id":"https://openalex.org/C31467283","wikidata":"https://www.wikidata.org/wiki/Q912147","display_name":"Genotyping","level":4,"score":0.7069253921508789},{"id":"https://openalex.org/C139275648","wikidata":"https://www.wikidata.org/wiki/Q17134011","display_name":"SNP","level":5,"score":0.5631860494613647},{"id":"https://openalex.org/C153209595","wikidata":"https://www.wikidata.org/wiki/Q501128","display_name":"Single-nucleotide polymorphism","level":4,"score":0.5572211742401123},{"id":"https://openalex.org/C163691529","wikidata":"https://www.wikidata.org/wiki/Q7391886","display_name":"SNP genotyping","level":5,"score":0.5294727087020874},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.4822476804256439},{"id":"https://openalex.org/C189206191","wikidata":"https://www.wikidata.org/wiki/Q222046","display_name":"Genomics","level":4,"score":0.4623711109161377},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.4444512724876404},{"id":"https://openalex.org/C106208931","wikidata":"https://www.wikidata.org/wiki/Q1098876","display_name":"Genome-wide association study","level":5,"score":0.42833849787712097},{"id":"https://openalex.org/C141231307","wikidata":"https://www.wikidata.org/wiki/Q7020","display_name":"Genome","level":3,"score":0.35514694452285767},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.348824679851532},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.3061424493789673},{"id":"https://openalex.org/C135763542","wikidata":"https://www.wikidata.org/wiki/Q106016","display_name":"Genotype","level":3,"score":0.2567136883735657},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.11198225617408752},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.08985933661460876},{"id":"https://openalex.org/C9357733","wikidata":"https://www.wikidata.org/wiki/Q6878417","display_name":"Missing data","level":2,"score":0.08486589789390564}],"mesh":[{"descriptor_ui":"D002874","descriptor_name":"Chromosome Mapping","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D002874","descriptor_name":"Chromosome Mapping","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D002874","descriptor_name":"Chromosome Mapping","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D005838","descriptor_name":"Genotype","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D005838","descriptor_name":"Genotype","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D005838","descriptor_name":"Genotype","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D010641","descriptor_name":"Phenotype","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D010641","descriptor_name":"Phenotype","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D010641","descriptor_name":"Phenotype","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D020641","descriptor_name":"Polymorphism, Single Nucleotide","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D020641","descriptor_name":"Polymorphism, Single Nucleotide","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D020641","descriptor_name":"Polymorphism, Single Nucleotide","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D023281","descriptor_name":"Genomics","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D023281","descriptor_name":"Genomics","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D023281","descriptor_name":"Genomics","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true}],"locations_count":2,"locations":[{"id":"doi:10.1093/bib/bbac252","is_oa":false,"landing_page_url":"https://doi.org/10.1093/bib/bbac252","pdf_url":null,"source":{"id":"https://openalex.org/S91767247","display_name":"Briefings in Bioinformatics","issn_l":"1467-5463","issn":["1467-5463","1477-4054"],"is_oa":false,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311648","host_organization_name":"Oxford University Press","host_organization_lineage":["https://openalex.org/P4310311648","https://openalex.org/P4310311647"],"host_organization_lineage_names":["Oxford University Press","University of Oxford"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Briefings in Bioinformatics","raw_type":"journal-article"},{"id":"pmid:35780383","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/35780383","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Briefings in bioinformatics","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/17","score":0.5400000214576721,"display_name":"Partnerships for the goals"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":57,"referenced_works":["https://openalex.org/W1487785114","https://openalex.org/W1583476286","https://openalex.org/W1587035534","https://openalex.org/W1919257374","https://openalex.org/W1982516282","https://openalex.org/W2014461167","https://openalex.org/W2015408724","https://openalex.org/W2032227130","https://openalex.org/W2034581323","https://openalex.org/W2081067541","https://openalex.org/W2087546077","https://openalex.org/W2099085143","https://openalex.org/W2101071606","https://openalex.org/W2101305463","https://openalex.org/W2104549677","https://openalex.org/W2107121611","https://openalex.org/W2112869109","https://openalex.org/W2115692554","https://openalex.org/W2135732313","https://openalex.org/W2136078375","https://openalex.org/W2137095888","https://openalex.org/W2149796867","https://openalex.org/W2152596080","https://openalex.org/W2160995259","https://openalex.org/W2162468038","https://openalex.org/W2216458865","https://openalex.org/W2510973425","https://openalex.org/W2511515754","https://openalex.org/W2521137711","https://openalex.org/W2539164385","https://openalex.org/W2550933502","https://openalex.org/W2559028527","https://openalex.org/W2725988230","https://openalex.org/W2744601887","https://openalex.org/W2770026599","https://openalex.org/W2806225217","https://openalex.org/W2888434560","https://openalex.org/W2895486342","https://openalex.org/W2903034115","https://openalex.org/W2905452503","https://openalex.org/W2920792207","https://openalex.org/W2932671560","https://openalex.org/W2944540884","https://openalex.org/W2951207043","https://openalex.org/W2952013316","https://openalex.org/W2956442594","https://openalex.org/W2963160524","https://openalex.org/W2970480306","https://openalex.org/W2990059271","https://openalex.org/W2990805831","https://openalex.org/W3028329270","https://openalex.org/W3165929960","https://openalex.org/W3169047316","https://openalex.org/W4206164985","https://openalex.org/W4242721817","https://openalex.org/W6680244570","https://openalex.org/W6728451393"],"related_works":["https://openalex.org/W4296620168","https://openalex.org/W2387667413","https://openalex.org/W3144318733","https://openalex.org/W2021147140","https://openalex.org/W2019041567","https://openalex.org/W2067161950","https://openalex.org/W2791888721","https://openalex.org/W2799467107","https://openalex.org/W3013571429","https://openalex.org/W2002454583"],"abstract_inverted_index":{"Despite":[0],"the":[1,13,28,93,115,119,198],"rapid":[2,29],"development":[3,30],"of":[4,31,35,118,164],"sequencing":[5,172,240],"technology,":[6],"single-nucleotide":[7],"polymorphism":[8],"(SNP)":[9],"arrays":[10,53,202,217,244],"are":[11,43,127,218,234],"still":[12,44],"most":[14,78,128],"cost-effective":[15,60],"genotyping":[16,33,201],"solutions":[17],"for":[18,47,55,77,140,221],"large-scale":[19],"genomic":[20],"research":[21],"and":[22,38,111,169,184],"applications.":[23],"Recent":[24],"years":[25],"have":[26],"witnessed":[27],"numerous":[32],"platforms":[34,42,80],"different":[36],"sizes":[37],"designs,":[39],"but":[40,113,150],"population-specific":[41],"lacking,":[45],"especially":[46],"those":[48,123],"in":[49,92,224,238],"developing":[50,225],"countries.":[51],"SNP":[52,103,142,155,243],"designed":[54],"these":[56],"countries":[57,226],"should":[58],"be":[59,98],"(small":[61],"size),":[62],"yet":[63],"incorporate":[64],"key":[65,74],"information":[66],"needed":[67],"to":[68,82,189,197],"associate":[69],"genotypes":[70],"with":[71,131],"traits.":[72,132],"A":[73],"design":[75],"principle":[76],"current":[79,101],"is":[81,122,245,248],"improve":[83],"genome-wide":[84,185],"imputation":[85,109,148,186,206],"so":[86],"that":[87,126,144,177,203],"more":[88],"SNPs":[89,125],"not":[90,114,145],"included":[91],"array":[94],"(imputed":[95],"SNPs)":[96],"can":[97],"predicted.":[99],"However,":[100],"tag":[102,141],"selection":[104,143],"methods":[105],"mostly":[106],"focus":[107],"on":[108,160],"accuracy":[110,187],"coverage,":[112],"functional":[116,124,154,181,213],"content":[117],"array.":[120],"It":[121],"likely":[129],"associated":[130],"Here,":[133],"we":[134],"propose":[135],"LmTag,":[136],"a":[137,161],"novel":[138,193],"method":[139],"only":[146],"improves":[147],"performance":[149],"also":[151],"prioritizes":[152],"highly":[153],"markers.":[156],"We":[157],"apply":[158],"LmTag":[159,178],"wide":[162],"range":[163],"populations":[165,223],"using":[166],"both":[167,180],"public":[168],"in-house":[170],"whole-genome":[171],"databases.":[173],"Our":[174],"results":[175],"show":[176],"improved":[179],"marker":[182],"prioritization":[183],"compared":[188],"existing":[190],"methods.":[191],"This":[192],"approach":[194],"could":[195],"contribute":[196],"next":[199],"generation":[200],"provide":[204],"excellent":[205],"capability":[207],"as":[208,210],"well":[209],"facilitate":[211],"array-based":[212],"genetic":[214],"studies.":[215],"Such":[216],"particularly":[219],"suitable":[220],"under-represented":[222],"or":[227,241],"non-model":[228],"species,":[229],"where":[230],"little":[231],"genomics":[232],"data":[233],"available":[235,249],"while":[236],"investment":[237],"genome":[239],"high-density":[242],"limited.":[246],"$\\textrm{LmTag}$":[247],"at:":[250],"https://github.com/datngu/LmTag.":[251]},"counts_by_year":[{"year":2025,"cited_by_count":6},{"year":2022,"cited_by_count":1}],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2025-10-10T00:00:00"}
