{"id":"https://openalex.org/W7131636434","doi":"https://doi.org/10.48550/arxiv.2602.22045","title":"DLT-Corpus: A Large-Scale Text Collection for the Distributed Ledger Technology Domain","display_name":"DLT-Corpus: A Large-Scale Text Collection for the Distributed Ledger Technology Domain","publication_year":2026,"publication_date":"2026-02-25","ids":{"openalex":"https://openalex.org/W7131636434","doi":"https://doi.org/10.48550/arxiv.2602.22045"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.22045","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5126855482","display_name":"Walter Hernandez Cruz","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Cruz, Walter Hernandez","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086812532","display_name":"Peter Devine","orcid":"https://orcid.org/0000-0002-8083-320X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Devine, Peter","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072416060","display_name":"Nikhil Vadgama","orcid":"https://orcid.org/0000-0002-3303-646X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Vadgama, Nikhil","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074632640","display_name":"Paolo Tasca","orcid":"https://orcid.org/0000-0002-5460-5940"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tasca, Paolo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5126904383","display_name":"Jiahua Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Jiahua","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5126855482"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10270","display_name":"Blockchain Technology Applications and Security","score":0.40149998664855957,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10270","display_name":"Blockchain Technology Applications and Security","score":0.40149998664855957,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10856","display_name":"Intellectual Property and Patents","score":0.20069999992847443,"subfield":{"id":"https://openalex.org/subfields/1405","display_name":"Management of Technology and Innovation"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11995","display_name":"FinTech, Crowdfunding, Digital Finance","score":0.03530000150203705,"subfield":{"id":"https://openalex.org/subfields/1404","display_name":"Management Information Systems"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cryptocurrency","display_name":"Cryptocurrency","score":0.6962000131607056},{"id":"https://openalex.org/keywords/social-media","display_name":"Social media","score":0.5856999754905701},{"id":"https://openalex.org/keywords/ledger","display_name":"Ledger","score":0.5752000212669373},{"id":"https://openalex.org/keywords/distributed-ledger","display_name":"Distributed ledger","score":0.5235000252723694},{"id":"https://openalex.org/keywords/capitalization","display_name":"Capitalization","score":0.47429999709129333},{"id":"https://openalex.org/keywords/market-capitalization","display_name":"Market capitalization","score":0.4625000059604645},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.4277999997138977},{"id":"https://openalex.org/keywords/trademark","display_name":"Trademark","score":0.4212000072002411}],"concepts":[{"id":"https://openalex.org/C180706569","wikidata":"https://www.wikidata.org/wiki/Q13479982","display_name":"Cryptocurrency","level":2,"score":0.6962000131607056},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.588100016117096},{"id":"https://openalex.org/C518677369","wikidata":"https://www.wikidata.org/wiki/Q202833","display_name":"Social media","level":2,"score":0.5856999754905701},{"id":"https://openalex.org/C91302708","wikidata":"https://www.wikidata.org/wiki/Q2732056","display_name":"Ledger","level":2,"score":0.5752000212669373},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.5325999855995178},{"id":"https://openalex.org/C2777541363","wikidata":"https://www.wikidata.org/wiki/Q25110971","display_name":"Distributed ledger","level":3,"score":0.5235000252723694},{"id":"https://openalex.org/C2779137862","wikidata":"https://www.wikidata.org/wiki/Q425951","display_name":"Capitalization","level":2,"score":0.47429999709129333},{"id":"https://openalex.org/C193445137","wikidata":"https://www.wikidata.org/wiki/Q471719","display_name":"Market capitalization","level":4,"score":0.4625000059604645},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.43470001220703125},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.4277999997138977},{"id":"https://openalex.org/C2779027411","wikidata":"https://www.wikidata.org/wiki/Q167270","display_name":"Trademark","level":2,"score":0.4212000072002411},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.353300005197525},{"id":"https://openalex.org/C34974158","wikidata":"https://www.wikidata.org/wiki/Q131257","display_name":"Intellectual property","level":2,"score":0.349700003862381},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.34689998626708984},{"id":"https://openalex.org/C40700","wikidata":"https://www.wikidata.org/wiki/Q1411783","display_name":"Industrial organization","level":1,"score":0.33489999175071716},{"id":"https://openalex.org/C540431452","wikidata":"https://www.wikidata.org/wiki/Q16319025","display_name":"FinTech","level":3,"score":0.3179999887943268},{"id":"https://openalex.org/C2775936607","wikidata":"https://www.wikidata.org/wiki/Q466845","display_name":"Tracking (education)","level":2,"score":0.3131999969482422},{"id":"https://openalex.org/C27564746","wikidata":"https://www.wikidata.org/wiki/Q913709","display_name":"Market research","level":2,"score":0.3125},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.30489999055862427},{"id":"https://openalex.org/C30772137","wikidata":"https://www.wikidata.org/wiki/Q5164762","display_name":"Consumption (sociology)","level":2,"score":0.2809000015258789},{"id":"https://openalex.org/C2985879086","wikidata":"https://www.wikidata.org/wiki/Q1061910","display_name":"Technology transfer","level":2,"score":0.2734000086784363},{"id":"https://openalex.org/C133462117","wikidata":"https://www.wikidata.org/wiki/Q4929239","display_name":"Data collection","level":2,"score":0.2671999931335449},{"id":"https://openalex.org/C2777111884","wikidata":"https://www.wikidata.org/wiki/Q12002092","display_name":"Social security","level":2,"score":0.26579999923706055},{"id":"https://openalex.org/C2780342482","wikidata":"https://www.wikidata.org/wiki/Q1148446","display_name":"Patent office","level":2,"score":0.25929999351501465},{"id":"https://openalex.org/C93996380","wikidata":"https://www.wikidata.org/wiki/Q44127","display_name":"Server","level":2,"score":0.2565000057220459}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.22045","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.22045","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.22045","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.22045","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[{"score":0.5831294655799866,"display_name":"Industry, innovation and infrastructure","id":"https://metadata.un.org/sdg/9"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"We":[0,77,147],"introduce":[1],"DLT-Corpus,":[2],"the":[3,67,150],"largest":[4],"domain-specific":[5,62],"text":[6],"collection":[7],"for":[8,50],"Distributed":[9],"Ledger":[10],"Technology":[11],"(DLT)":[12],"research":[13,137],"to":[14],"date:":[15],"2.98":[16],"billion":[17],"tokens":[18],"from":[19],"22.12":[20],"million":[21,42],"documents":[22],"spanning":[23],"scientific":[24,95,119],"literature":[25,96],"(37,440":[26],"publications),":[27],"United":[28],"States":[29],"Patent":[30],"and":[31,38,58,73,86,100,120,139,170,174],"Trademark":[32],"Office":[33],"(USPTO)":[34],"patents":[35,99],"(49,023":[36],"filings),":[37],"social":[39,101,109],"media":[40,110],"(22":[41],"posts).":[43],"Existing":[44],"Natural":[45],"Language":[46],"Processing":[47],"(NLP)":[48],"resources":[49],"DLT":[51],"focus":[52],"narrowly":[53],"on":[54,162],"cryptocurrencies":[55],"price":[56],"prediction":[57],"smart":[59],"contracts,":[60],"leaving":[61],"language":[63],"under":[64],"explored":[65],"despite":[66],"sector's":[68],"~$3":[69],"trillion":[70],"market":[71,126,130],"capitalization":[72],"rapid":[74],"technological":[75],"evolution.":[76],"demonstrate":[78],"DLT-Corpus'":[79],"utility":[80],"by":[81],"analyzing":[82],"technology":[83,105],"emergence":[84],"patterns":[85],"market-innovation":[87],"correlations.":[88],"Findings":[89],"reveal":[90],"that":[91,143],"technologies":[92],"originate":[93],"in":[94,132],"before":[97],"reaching":[98],"media,":[102],"following":[103],"traditional":[104],"transfer":[106],"patterns.":[107],"While":[108],"sentiment":[111],"remains":[112],"overwhelmingly":[113],"bullish":[114],"even":[115],"during":[116],"crypto":[117],"winters,":[118],"patent":[121],"activity":[122],"grow":[123],"independently":[124],"of":[125],"fluctuations,":[127],"tracking":[128],"overall":[129],"expansion":[131],"a":[133,154,163],"virtuous":[134],"cycle":[135],"where":[136],"precedes":[138],"enables":[140],"economic":[141],"growth":[142],"funds":[144],"further":[145],"innovation.":[146],"publicly":[148],"release":[149],"full":[151],"DLT-Corpus;":[152],"LedgerBERT,":[153],"domain-adapted":[155],"model":[156],"achieving":[157],"23%":[158],"improvement":[159],"over":[160],"BERT-base":[161],"DLT-specific":[164],"Named":[165],"Entity":[166],"Recognition":[167],"(NER)":[168],"task;":[169],"all":[171],"associated":[172],"tools":[173],"code.":[175]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-27T00:00:00"}
