{"id":"https://openalex.org/W6944774663","doi":"https://doi.org/10.21227/jm4k-6h43","title":"\"Echoes Dataset: Simulating Textual Transmission with Natural Language Processing Techniques\"","display_name":"\"Echoes Dataset: Simulating Textual Transmission with Natural Language Processing Techniques\"","publication_year":2025,"publication_date":"2025-06-04","ids":{"openalex":"https://openalex.org/W6944774663","doi":"https://doi.org/10.21227/jm4k-6h43"},"language":"en","primary_location":{"id":"doi:10.21227/jm4k-6h43","is_oa":true,"landing_page_url":"https://doi.org/10.21227/jm4k-6h43","pdf_url":null,"source":{"id":"https://openalex.org/S7407051695","display_name":"IEEE DataPort","issn_l":null,"issn":[],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"dataset"},"type":"dataset","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.21227/jm4k-6h43","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Fernando  Aguilar Canto","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fernando  Aguilar Canto","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Hiram Calvo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hiram Calvo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":null,"topics":[],"keywords":[{"id":"https://openalex.org/keywords/levenshtein-distance","display_name":"Levenshtein distance","score":0.7439000010490417},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6516000032424927},{"id":"https://openalex.org/keywords/tree","display_name":"Tree (set theory)","score":0.5586000084877014},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.5051000118255615},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.501800000667572},{"id":"https://openalex.org/keywords/imperfect","display_name":"Imperfect","score":0.4242999851703644},{"id":"https://openalex.org/keywords/simple","display_name":"Simple (philosophy)","score":0.39259999990463257},{"id":"https://openalex.org/keywords/natural-language-generation","display_name":"Natural language generation","score":0.3443000018596649}],"concepts":[{"id":"https://openalex.org/C2777515626","wikidata":"https://www.wikidata.org/wiki/Q496939","display_name":"Levenshtein distance","level":2,"score":0.7439000010490417},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7164000272750854},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6516000032424927},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6342999935150146},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5777000188827515},{"id":"https://openalex.org/C113174947","wikidata":"https://www.wikidata.org/wiki/Q2859736","display_name":"Tree (set theory)","level":2,"score":0.5586000084877014},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.5051000118255615},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.501800000667572},{"id":"https://openalex.org/C2780310539","wikidata":"https://www.wikidata.org/wiki/Q12547192","display_name":"Imperfect","level":2,"score":0.4242999851703644},{"id":"https://openalex.org/C2780586882","wikidata":"https://www.wikidata.org/wiki/Q7520643","display_name":"Simple (philosophy)","level":2,"score":0.39259999990463257},{"id":"https://openalex.org/C2776187449","wikidata":"https://www.wikidata.org/wiki/Q1513879","display_name":"Natural language generation","level":3,"score":0.3443000018596649},{"id":"https://openalex.org/C761482","wikidata":"https://www.wikidata.org/wiki/Q118093","display_name":"Transmission (telecommunications)","level":2,"score":0.3312000036239624},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3061999976634979},{"id":"https://openalex.org/C2985684807","wikidata":"https://www.wikidata.org/wiki/Q1513879","display_name":"Text generation","level":2,"score":0.2921000123023987},{"id":"https://openalex.org/C2779500292","wikidata":"https://www.wikidata.org/wiki/Q14802672","display_name":"Text processing","level":2,"score":0.28850001096725464},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.27950000762939453},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.2759000062942505},{"id":"https://openalex.org/C124304363","wikidata":"https://www.wikidata.org/wiki/Q673661","display_name":"Abstraction","level":2,"score":0.2734000086784363},{"id":"https://openalex.org/C155092808","wikidata":"https://www.wikidata.org/wiki/Q182557","display_name":"Computational linguistics","level":2,"score":0.2700999975204468},{"id":"https://openalex.org/C7991579","wikidata":"https://www.wikidata.org/wiki/Q17955","display_name":"Criticism","level":2,"score":0.2581999897956848},{"id":"https://openalex.org/C2987219923","wikidata":"https://www.wikidata.org/wiki/Q777864","display_name":"Linguistic analysis","level":2,"score":0.251800000667572}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.21227/jm4k-6h43","is_oa":true,"landing_page_url":"https://doi.org/10.21227/jm4k-6h43","pdf_url":null,"source":{"id":"https://openalex.org/S7407051695","display_name":"IEEE DataPort","issn_l":null,"issn":[],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"dataset"}],"best_oa_location":{"id":"doi:10.21227/jm4k-6h43","is_oa":true,"landing_page_url":"https://doi.org/10.21227/jm4k-6h43","pdf_url":null,"source":{"id":"https://openalex.org/S7407051695","display_name":"IEEE DataPort","issn_l":null,"issn":[],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"dataset"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.8207981586456299}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"\"Two":[0],"main":[1],"objectives":[2],"in":[3,26,38,50,141],"Computational":[4],"Textual":[5],"Criticism":[6],"correspond":[7],"to":[8,57,77,97],"the":[9,27,39,45,62,99,106,111,128,144,149],"development":[10],"of":[11,20,41,61,146],"algorithms":[12],"for":[13,91,118,122],"tree":[14,84,119],"and":[15,64,81,85,134,140],"text":[16,42,79,86,92,123],"reconstruction":[17,87],"under":[18],"conditions":[19],"imperfect":[21],"copying.":[22],"Despite":[23],"recent":[24,48],"developments":[25],"field,":[28],"few":[29],"comparative":[30,116],"studies":[31],"or":[32],"benchmarks":[33],"have":[34,55],"been":[35],"performed,":[36],"particularly":[37],"case":[40],"reconstruction.":[43,120],"On":[44],"other":[46],"hand,":[47],"advancements":[49],"Natural":[51],"Language":[52],"Processing":[53],"(NLP)":[54],"begun":[56],"impact":[58],"various":[59,72],"aspects":[60],"humanities":[63],"social":[65],"sciences.":[66],"In":[67,89],"this":[68],"paper,":[69],"we":[70,94,125],"incorporate":[71,95],"NLP":[73],"techniques":[74],"(including":[75],"LLMs)":[76],"simulate":[78],"transmission":[80],"benchmark":[82],"different":[83],"algorithms.":[88],"addition,":[90],"reconstruction,":[93,124],"LLMs":[96,147],"improve":[98],"final":[100,150],"result.":[101],"Our":[102],"results":[103,117],"show":[104],"that":[105,127],"UPGMA\\/NJ":[107],"method":[108],"combined":[109],"with":[110],"Levenshtein":[112],"metric":[113],"achieved":[114],"superior":[115],"Moreover,":[121],"found":[126],"Simple":[129],"Majority":[130],"Rule":[131],"(SMR),":[132],"UR,":[133],"RHM":[135],"methods":[136],"yielded":[137],"consistent":[138],"results,":[139],"most":[142],"cases,":[143],"incorporation":[145],"improved":[148],"output.\"":[151]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
