{"id":"https://openalex.org/W7160544827","doi":"https://doi.org/10.48550/arxiv.2605.04257","title":"HUGO-CS: A Hybrid-Labeled, Uncertainty-Aware, General-Purpose, Observational Dataset for Cold Spray","display_name":"HUGO-CS: A Hybrid-Labeled, Uncertainty-Aware, General-Purpose, Observational Dataset for Cold Spray","publication_year":2026,"publication_date":"2026-05-05","ids":{"openalex":"https://openalex.org/W7160544827","doi":"https://doi.org/10.48550/arxiv.2605.04257"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.04257","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.04257","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.04257","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5135570025","display_name":"Stephen Price","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Price, Stephen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135599543","display_name":"Kyle Miller","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Miller, Kyle","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135614600","display_name":"Marco Musto","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Musto, Marco","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022004120","display_name":"Kenneth Kroenlein","orcid":"https://orcid.org/0000-0002-0210-0203"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kroenlein, Kenneth","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135613274","display_name":"James Saal","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Saal, James","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135635868","display_name":"Kyle Tsaknopoulos","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tsaknopoulos, Kyle","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135605575","display_name":"Elke A. Rundensteiner","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rundensteiner, Elke A.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5003132026","display_name":"Danielle L. Cote","orcid":"https://orcid.org/0000-0002-3571-1721"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cote, Danielle L.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10626","display_name":"High-Temperature Coating Behaviors","score":0.3073999881744385,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10626","display_name":"High-Temperature Coating Behaviors","score":0.3073999881744385,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12161","display_name":"Plant Surface Properties and Treatments","score":0.05860000103712082,"subfield":{"id":"https://openalex.org/subfields/1110","display_name":"Plant Science"},"field":{"id":"https://openalex.org/fields/11","display_name":"Agricultural and Biological Sciences"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12878","display_name":"Pharmaceutical Quality and Counterfeiting","score":0.03750000149011612,"subfield":{"id":"https://openalex.org/subfields/2739","display_name":"Public Health, Environmental and Occupational Health"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/replicate","display_name":"Replicate","score":0.5806000232696533},{"id":"https://openalex.org/keywords/categorical-variable","display_name":"Categorical variable","score":0.5803999900817871},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.564300000667572},{"id":"https://openalex.org/keywords/raw-data","display_name":"Raw data","score":0.5526999831199646},{"id":"https://openalex.org/keywords/limiting","display_name":"Limiting","score":0.521399974822998},{"id":"https://openalex.org/keywords/work","display_name":"Work (physics)","score":0.4323999881744385},{"id":"https://openalex.org/keywords/observational-study","display_name":"Observational study","score":0.4156999886035919},{"id":"https://openalex.org/keywords/data-extraction","display_name":"Data extraction","score":0.41359999775886536}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5871999859809875},{"id":"https://openalex.org/C2781162219","wikidata":"https://www.wikidata.org/wiki/Q26250693","display_name":"Replicate","level":2,"score":0.5806000232696533},{"id":"https://openalex.org/C5274069","wikidata":"https://www.wikidata.org/wiki/Q2285707","display_name":"Categorical variable","level":2,"score":0.5803999900817871},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.564300000667572},{"id":"https://openalex.org/C132964779","wikidata":"https://www.wikidata.org/wiki/Q2110223","display_name":"Raw data","level":2,"score":0.5526999831199646},{"id":"https://openalex.org/C188198153","wikidata":"https://www.wikidata.org/wiki/Q1613840","display_name":"Limiting","level":2,"score":0.521399974822998},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4878000020980835},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.4323999881744385},{"id":"https://openalex.org/C23131810","wikidata":"https://www.wikidata.org/wiki/Q818574","display_name":"Observational study","level":2,"score":0.4156999886035919},{"id":"https://openalex.org/C2777466982","wikidata":"https://www.wikidata.org/wiki/Q5227287","display_name":"Data extraction","level":3,"score":0.41359999775886536},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.3686000108718872},{"id":"https://openalex.org/C2780560020","wikidata":"https://www.wikidata.org/wiki/Q79719","display_name":"License","level":2,"score":0.3573000133037567},{"id":"https://openalex.org/C200601418","wikidata":"https://www.wikidata.org/wiki/Q2193887","display_name":"Reliability engineering","level":1,"score":0.34610000252723694},{"id":"https://openalex.org/C4725764","wikidata":"https://www.wikidata.org/wiki/Q844704","display_name":"Extraction (chemistry)","level":2,"score":0.33489999175071716},{"id":"https://openalex.org/C60478076","wikidata":"https://www.wikidata.org/wiki/Q3036835","display_name":"Reference data","level":2,"score":0.3188999891281128},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.2928999960422516},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.288100004196167},{"id":"https://openalex.org/C176743888","wikidata":"https://www.wikidata.org/wiki/Q862797","display_name":"Observational methods in psychology","level":3,"score":0.2867000102996826},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.27559998631477356},{"id":"https://openalex.org/C3020240193","wikidata":"https://www.wikidata.org/wiki/Q4116572","display_name":"Manual handling","level":2,"score":0.263700008392334},{"id":"https://openalex.org/C2987875673","wikidata":"https://www.wikidata.org/wiki/Q187939","display_name":"Manufacturing process","level":2,"score":0.2612999975681305},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.2599000036716461},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.2578999996185303},{"id":"https://openalex.org/C42475967","wikidata":"https://www.wikidata.org/wiki/Q194292","display_name":"Operations research","level":1,"score":0.2565000057220459}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.04257","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.04257","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.04257","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.04257","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Cold":[0],"spraying":[1],"is":[2],"an":[3,98],"increasingly":[4],"common":[5],"approach":[6],"for":[7,168,209],"repairing":[8],"and":[9,28,53,55,108,191,213],"manufacturing":[10,16],"components":[11],"due":[12,23],"to":[13,24,35,119,133,157,219],"its":[14],"solid-state":[15],"capabilities.":[17],"However,":[18],"process":[19,139],"optimization":[20],"remains":[21],"difficult":[22],"many":[25,43],"interdependent":[26],"parameters":[27],"the":[29,39,85,197,225],"lack":[30],"of":[31,74,100,165],"large-scale,":[32],"machine-readable":[33],"data":[34,215],"support":[36,120],"modeling.":[37],"While":[38],"scientific":[40,141],"literature":[41],"contains":[42],"relevant":[44],"experiments,":[45,200],"results":[46],"are":[47,202,229],"inconsistently":[48],"reported":[49,184,199],"(often":[50],"in":[51],"tables":[52],"figures)":[54],"use":[56],"non-uniform":[57],"units,":[58],"limiting":[59],"utilization":[60],"at":[61,235],"scale.":[62],"To":[63,143],"address":[64],"these":[65],"limitations,":[66],"this":[67,105,121,135,221],"work":[68,106],"presents":[69],"HUGO-CS,":[70],"a":[71,110,152,162,205,232],"literature-derived":[72],"dataset":[73,88],"4,383":[75,198],"cold-spray":[76],"experiments":[77],"with":[78,128,147,161,224],"144":[79],"features":[80],"from":[81,140],"1,124":[82],"sources,":[83],"exceeding":[84],"previous":[86],"largest":[87],"(137":[89],"samples)":[90],"by":[91],"30x.":[92],"With":[93],"completely":[94],"manual":[95,130,169],"extraction":[96,115,138,148],"requiring":[97],"average":[99],"91":[101],"minutes":[102],"per":[103],"document,":[104],"designs":[107],"leverages":[109],"Hybrid-labeled,":[111],"Uncertainty-aware,":[112],"General-purpose,":[113],"Observational":[114],"framework,":[116],"called":[117],"HUGO,":[118],"extraction.":[122],"HUGO":[123,150,178],"combines":[124],"automated":[125],"LLM-based":[126],"labeling":[127,145],"targeted":[129],"label":[131],"refinement":[132],"handle":[134],"experimental":[136],"result":[137],"literature.":[142],"balance":[144],"efficiency":[146],"accuracy,":[149],"introduces":[151],"Hierarchical":[153],"Risk":[154],"Mitigation":[155],"(HRM)":[156],"route":[158],"LLM":[159],"outputs":[160],"high":[163],"risk":[164],"potential":[166],"errors":[167],"review,":[170],"while":[171],"retaining":[172],"low-risk":[173],"records":[174],"as":[175],"auto-labeled.":[176],"Lastly,":[177],"post-processing":[179],"consolidates":[180],"categorical":[181],"descriptors,":[182],"maps":[183],"feedstock":[185],"chemistries":[186],"into":[187],"structured":[188],"continuous":[189],"compositions,":[190],"normalizes":[192],"units":[193],"across":[194],"sources.":[195],"Of":[196],"1,765":[201],"hand-labeled,":[203],"providing":[204],"high-quality":[206],"labeled":[207],"subset":[208],"benchmarking,":[210],"error":[211],"analysis,":[212],"higher-fidelity":[214],"points.":[216],"All":[217],"code":[218],"replicate":[220],"work,":[222],"along":[223],"complete":[226],"HUGO-CS":[227],"dataset,":[228],"released":[230],"under":[231],"CC-BY":[233],"license":[234],"https://github.com/sprice134/HUGO.":[236]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-08T00:00:00"}
