{"id":"https://openalex.org/W4401692506","doi":"https://doi.org/10.1109/isit57864.2024.10619392","title":"On $k$-Mer-Based and Maximum Likelihood Estimation Algorithms for Trace Reconstruction","display_name":"On $k$-Mer-Based and Maximum Likelihood Estimation Algorithms for Trace Reconstruction","publication_year":2024,"publication_date":"2024-07-07","ids":{"openalex":"https://openalex.org/W4401692506","doi":"https://doi.org/10.1109/isit57864.2024.10619392"},"language":"en","primary_location":{"id":"doi:10.1109/isit57864.2024.10619392","is_oa":false,"landing_page_url":"https://doi.org/10.1109/isit57864.2024.10619392","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Symposium on Information Theory (ISIT)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5014279694","display_name":"Kuan Cheng","orcid":"https://orcid.org/0000-0002-8972-1749"},"institutions":[{"id":"https://openalex.org/I4210161752","display_name":"Beijing Haidian Hospital","ror":"https://ror.org/058x5eq06","country_code":"CN","type":"healthcare","lineage":["https://openalex.org/I4210161752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kuan Cheng","raw_affiliation_strings":["Peking University, Haidian,Beijing,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Peking University, Haidian,Beijing,China","institution_ids":["https://openalex.org/I4210161752"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090091569","display_name":"Elena Grigorescu","orcid":"https://orcid.org/0000-0001-9673-4313"},"institutions":[{"id":"https://openalex.org/I219193219","display_name":"Purdue University West Lafayette","ror":"https://ror.org/02dqehb95","country_code":"US","type":"education","lineage":["https://openalex.org/I219193219"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Elena Grigorescu","raw_affiliation_strings":["Purdue University,West Lafayette,IN,USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Purdue University,West Lafayette,IN,USA","institution_ids":["https://openalex.org/I219193219"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100353875","display_name":"Xin Li","orcid":"https://orcid.org/0000-0002-4691-4508"},"institutions":[{"id":"https://openalex.org/I145311948","display_name":"Johns Hopkins University","ror":"https://ror.org/00za53h95","country_code":"US","type":"education","lineage":["https://openalex.org/I145311948"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xin Li","raw_affiliation_strings":["Johns Hopkins University,Baltimore,MD,USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Johns Hopkins University,Baltimore,MD,USA","institution_ids":["https://openalex.org/I145311948"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101519422","display_name":"Madhu Sudan","orcid":"https://orcid.org/0000-0003-3718-6489"},"institutions":[{"id":"https://openalex.org/I2801851002","display_name":"Harvard University Press","ror":"https://ror.org/006v7bf86","country_code":"US","type":"other","lineage":["https://openalex.org/I136199984","https://openalex.org/I2801851002"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Madhu Sudan","raw_affiliation_strings":["Harvard University,Cambridge,Massachusetts,USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Harvard University,Cambridge,Massachusetts,USA","institution_ids":["https://openalex.org/I2801851002"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5085562284","display_name":"Minshen Zhu","orcid":"https://orcid.org/0000-0003-1927-6085"},"institutions":[{"id":"https://openalex.org/I4210161752","display_name":"Beijing Haidian Hospital","ror":"https://ror.org/058x5eq06","country_code":"CN","type":"healthcare","lineage":["https://openalex.org/I4210161752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Minshen Zhu","raw_affiliation_strings":["Peking University, Haidian,Beijing,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Peking University, Haidian,Beijing,China","institution_ids":["https://openalex.org/I4210161752"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.4375,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.61651077,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"879","last_page":"884"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T14339","display_name":"Image Processing and 3D Reconstruction","score":0.9366000294685364,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T14339","display_name":"Image Processing and 3D Reconstruction","score":0.9366000294685364,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10522","display_name":"Medical Imaging Techniques and Applications","score":0.9258999824523926,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9164000153541565,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/trace","display_name":"TRACE (psycholinguistics)","score":0.617404043674469},{"id":"https://openalex.org/keywords/maximum-likelihood","display_name":"Maximum likelihood","score":0.6145336031913757},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6069689989089966},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.5853474736213684},{"id":"https://openalex.org/keywords/maximum-likelihood-sequence-estimation","display_name":"Maximum likelihood sequence estimation","score":0.4175110459327698},{"id":"https://openalex.org/keywords/estimation-theory","display_name":"Estimation theory","score":0.3136143684387207},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.21480578184127808},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.16161063313484192}],"concepts":[{"id":"https://openalex.org/C75291252","wikidata":"https://www.wikidata.org/wiki/Q1315756","display_name":"TRACE (psycholinguistics)","level":2,"score":0.617404043674469},{"id":"https://openalex.org/C49781872","wikidata":"https://www.wikidata.org/wiki/Q1045555","display_name":"Maximum likelihood","level":2,"score":0.6145336031913757},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6069689989089966},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.5853474736213684},{"id":"https://openalex.org/C191462741","wikidata":"https://www.wikidata.org/wiki/Q6795902","display_name":"Maximum likelihood sequence estimation","level":3,"score":0.4175110459327698},{"id":"https://openalex.org/C167928553","wikidata":"https://www.wikidata.org/wiki/Q1376021","display_name":"Estimation theory","level":2,"score":0.3136143684387207},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.21480578184127808},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.16161063313484192},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/isit57864.2024.10619392","is_oa":false,"landing_page_url":"https://doi.org/10.1109/isit57864.2024.10619392","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Symposium on Information Theory (ISIT)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W1133414672","https://openalex.org/W1967505984","https://openalex.org/W2081933490","https://openalex.org/W2095554889","https://openalex.org/W2564763601","https://openalex.org/W2584062640","https://openalex.org/W2911475043","https://openalex.org/W2951269465","https://openalex.org/W2963134372","https://openalex.org/W2963670229","https://openalex.org/W2964199960","https://openalex.org/W2969308577","https://openalex.org/W2979059622","https://openalex.org/W3028579427","https://openalex.org/W3033084890","https://openalex.org/W3117245243","https://openalex.org/W3128220280","https://openalex.org/W3161798670","https://openalex.org/W3169706614","https://openalex.org/W3197288570","https://openalex.org/W3198708829","https://openalex.org/W4226090901","https://openalex.org/W4287079126","https://openalex.org/W4386057561","https://openalex.org/W6656576250","https://openalex.org/W6665204704","https://openalex.org/W6666485203","https://openalex.org/W6747734592","https://openalex.org/W6782677995","https://openalex.org/W6798252878","https://openalex.org/W6841087898","https://openalex.org/W6846800381"],"related_works":["https://openalex.org/W1499442185","https://openalex.org/W2366184732","https://openalex.org/W2379466508","https://openalex.org/W2120595071","https://openalex.org/W3139607207","https://openalex.org/W2090147078","https://openalex.org/W1600683375","https://openalex.org/W2155160077","https://openalex.org/W2978085921","https://openalex.org/W2353424004"],"abstract_inverted_index":{"The":[0],"goal":[1],"of":[2,20,32,46,60,69,86,136,154,161,201,204,241,274,281,288,300],"the":[3,49,57,79,93,137,146,149,155,185,188,199,211,230,239,242,250,255,260,266,286],"trace":[4,24,50,156,177],"reconstruction":[5,51,157,178],"problem":[6,158],"is":[7,25,65,217],"to":[8,127,228,258,278],"recover":[9],"a":[10,23,26,270,279],"string":[11,95,252],"x":[12,33,133],"E":[13],"{0,":[14],"1}":[15],"given":[16,37,134],"many":[17],"independent":[18],"traces":[19],"x,":[21,96],"where":[22],"subsequence":[27],"obtained":[28,76],"from":[29,118],"deleting":[30],"bits":[31],"independently":[34],"with":[35],"some":[36],"probability.":[38],"In":[39],"this":[40,202,298],"paper":[41],"we":[42,159],"consider":[43],"two":[44],"kinds":[45],"algorithms":[47,142],"for":[48,97,176,291],"problem.":[52],"We":[53,123,263],"first":[54],"observe":[55],"that":[56,106,172,187,210,253,265,297],"state-of-the-art":[58],"result":[59,170,237],"Chase":[61,216],"(STOC":[62],"2021),":[63],"which":[64,247],"based":[66],"on":[67],"statistics":[68,83,108],"arbitrary":[70],"length-k":[71],"subsequences,":[72],"can":[73,113],"also":[74,208],"be":[75,114,128,306],"by":[77,215],"considering":[78],"\u201ck-mer":[80],"statistics\u201d,":[81],"i.e.,":[82,276],"regarding":[84],"occurrences":[85],"contiguous":[87],"k-bit":[88],"strings":[89],"(a.k.a,":[90],"k-mers)":[91],"in":[92,148,226,285],"initial":[94],"k":[98],"=":[99],"Mazooji":[100],"and":[101,151,166,220,295],"Shomorony":[102],"(ISIT":[103],"2023)":[104],"show":[105,264,296],"such":[107],"(called":[109],"k-mer":[110,138],"density":[111,139],"map)":[112],"estimated":[115],"within":[116],"accuracy":[117],"poly(n,":[119],"2k,":[120],"l/e)":[121],"traces.":[122,205],"call":[124],"an":[125,292],"algorithm":[126,175,268],"k-mer-based":[129,174],"if":[130],"it":[131],"reconstructs":[132],"estimates":[135],"map.":[140],"Such":[141],"essentially":[143,218],"capture":[144],"all":[145],"analyses":[147],"worst-case":[150,231],"smoothed-complexity":[152],"models":[153],"know":[160],"so":[162],"far.":[163],"Our":[164,206,234],"first,":[165],"technically":[167],"more":[168],"involved,":[169],"shows":[171,209],"any":[173],"must":[179],"use":[180],"exp":[181],"n))":[182],"traces,":[183,196,275],"under":[184,308],"assumption":[186],"estimator":[189],"requires":[190],"poly(2<sup":[191],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[192,283,302],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">k</sup>,":[193],"1":[194],"e)":[195],"thus":[197],"establishing":[198],"optimality":[200],"number":[203,273,287],"analysis":[207,212],"technique":[213],"used":[214],"tight,":[219],"hence":[221],"new":[222],"techniques":[223],"are":[224],"needed":[225,290],"order":[227],"improve":[229],"upper":[232],"bound.":[233],"second,":[235],"simple,":[236],"considers":[238],"performance":[240],"Maximum":[243],"Likelihood":[244],"Estimator":[245],"(MLE),":[246],"specifically":[248],"picks":[249],"source":[251],"has":[254],"maximum":[256],"likelihood":[257],"generate":[259],"samples":[261,289],"(traces).":[262],"MLE":[267],"uses":[269],"nearly":[271],"optimal":[272,293],"up":[277],"factor":[280,299],"<tex":[282,301],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$n$</tex>":[284,303],"algorithm,":[294],"loss":[304],"may":[305],"necessary":[307],"general":[309],"\u201cmodel":[310],"estimation\u201d":[311],"settings.":[312]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
