{"id":"https://openalex.org/W4417292850","doi":"https://doi.org/10.48550/arxiv.2512.09895","title":"Human-in-the-Loop and AI: Crowdsourcing Metadata Vocabulary for Materials Science","display_name":"Human-in-the-Loop and AI: Crowdsourcing Metadata Vocabulary for Materials Science","publication_year":2025,"publication_date":"2025-12-10","ids":{"openalex":"https://openalex.org/W4417292850","doi":"https://doi.org/10.48550/arxiv.2512.09895"},"language":null,"primary_location":{"id":"pmh:oai:arXiv.org:2512.09895","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2512.09895","pdf_url":"https://arxiv.org/pdf/2512.09895","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2512.09895","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5035913440","display_name":"Jane Greenberg","orcid":"https://orcid.org/0000-0001-7819-5360"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Greenberg, Jane","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030041065","display_name":"Scott McClellan","orcid":"https://orcid.org/0000-0002-1524-8346"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"McClellan, Scott","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102607469","display_name":"Addy Ireland","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ireland, Addy","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120790963","display_name":"Robert Sammarco","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sammarco, Robert","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5118856781","display_name":"Colton Gerber","orcid":"https://orcid.org/0000-0002-5471-0679"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gerber, Colton","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023877206","display_name":"Christopher B. Rauch","orcid":"https://orcid.org/0000-0003-2061-3413"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rauch, Christopher B.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020610681","display_name":"Mat Kelly","orcid":"https://orcid.org/0000-0002-0236-7389"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kelly, Mat","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045225134","display_name":"John Kunze","orcid":"https://orcid.org/0000-0001-7604-8041"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kunze, John","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102963623","display_name":"Yuan An","orcid":"https://orcid.org/0000-0002-3634-9744"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"An, Yuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5042988082","display_name":"Eric S. Toberer","orcid":"https://orcid.org/0000-0003-0826-2446"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Toberer, Eric","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":10,"corresponding_author_ids":["https://openalex.org/A5035913440"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.27239999175071716,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.27239999175071716,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11937","display_name":"Research Data Management Practices","score":0.26930001378059387,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.11420000344514847,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/metadata","display_name":"Metadata","score":0.8605999946594238},{"id":"https://openalex.org/keywords/crowdsourcing","display_name":"Crowdsourcing","score":0.6642000079154968},{"id":"https://openalex.org/keywords/transparency","display_name":"Transparency (behavior)","score":0.6195999979972839},{"id":"https://openalex.org/keywords/vocabulary","display_name":"Vocabulary","score":0.6176000237464905},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5623999834060669},{"id":"https://openalex.org/keywords/controlled-vocabulary","display_name":"Controlled vocabulary","score":0.5055999755859375},{"id":"https://openalex.org/keywords/standardization","display_name":"Standardization","score":0.4625000059604645},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.4269999861717224}],"concepts":[{"id":"https://openalex.org/C93518851","wikidata":"https://www.wikidata.org/wiki/Q180160","display_name":"Metadata","level":2,"score":0.8605999946594238},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7785999774932861},{"id":"https://openalex.org/C62230096","wikidata":"https://www.wikidata.org/wiki/Q275969","display_name":"Crowdsourcing","level":2,"score":0.6642000079154968},{"id":"https://openalex.org/C2780233690","wikidata":"https://www.wikidata.org/wiki/Q535347","display_name":"Transparency (behavior)","level":2,"score":0.6195999979972839},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.6176000237464905},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5623999834060669},{"id":"https://openalex.org/C110615152","wikidata":"https://www.wikidata.org/wiki/Q1469824","display_name":"Controlled vocabulary","level":2,"score":0.5055999755859375},{"id":"https://openalex.org/C188087704","wikidata":"https://www.wikidata.org/wiki/Q369577","display_name":"Standardization","level":2,"score":0.4625000059604645},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.45890000462532043},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.4498000144958496},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.4269999861717224},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.40459999442100525},{"id":"https://openalex.org/C2780385302","wikidata":"https://www.wikidata.org/wiki/Q367158","display_name":"Protocol (science)","level":3,"score":0.40119999647140503},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3630000054836273},{"id":"https://openalex.org/C110326360","wikidata":"https://www.wikidata.org/wiki/Q17149476","display_name":"Metadata modeling","level":4,"score":0.33899998664855957},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.2906999886035919},{"id":"https://openalex.org/C58642233","wikidata":"https://www.wikidata.org/wiki/Q8269924","display_name":"Taxonomy (biology)","level":2,"score":0.27469998598098755},{"id":"https://openalex.org/C2777146004","wikidata":"https://www.wikidata.org/wiki/Q14949826","display_name":"CLARITY","level":2,"score":0.26809999346733093},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.2630999982357025},{"id":"https://openalex.org/C2780148112","wikidata":"https://www.wikidata.org/wiki/Q1432581","display_name":"Proxy (statistics)","level":2,"score":0.2603999972343445}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2512.09895","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2512.09895","pdf_url":"https://arxiv.org/pdf/2512.09895","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2512.09895","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.09895","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2512.09895","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2512.09895","pdf_url":"https://arxiv.org/pdf/2512.09895","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1679355163","display_name":null,"funder_award_id":"OAC 2118201","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G2044452311","display_name":null,"funder_award_id":"2118201","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4417292850.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Metadata":[0],"vocabularies":[1],"are":[2],"essential":[3],"for":[4,71,144,163],"advancing":[5],"FAIR":[6,128],"and":[7,19,34,87,129,140,159,166],"FARR":[8],"data":[9],"principles,":[10,131],"but":[11],"their":[12],"development":[13],"constrained":[14],"by":[15],"limited":[16],"human":[17],"resources":[18],"inconsistent":[20],"standardization":[21],"practices.":[22],"This":[23],"paper":[24,45],"introduces":[25],"MatSci-YAMZ,":[26],"a":[27,48,59,120,133],"platform":[28],"that":[29],"integrates":[30],"artificial":[31],"intelligence":[32],"(AI)":[33],"human-in-the-loop":[35],"(HILT),":[36],"including":[37],"crowdsourcing,":[38],"to":[39,90,136,155],"support":[40],"metadata":[41,167],"vocabulary":[42,168],"development.":[43,169],"The":[44],"reports":[46],"on":[47],"proof-of-concept":[49],"use":[50],"case":[51],"evaluating":[52],"the":[53,68,78,92,107,114,142,153],"AI-HILT":[54,110,116],"model":[55,117,151],"in":[56],"materials":[57],"science,":[58],"highly":[60],"interdisciplinary":[61],"domain":[62],"Six":[63],"(6)":[64],"participants":[65],"affiliated":[66],"with":[67,77,102,127],"NSF":[69],"Institute":[70],"Data-Driven":[72],"Dynamical":[73],"Design":[74],"(ID4)":[75],"engaged":[76],"MatSci-YAMZ":[79],"plaform":[80],"over":[81],"several":[82],"weeks,":[83],"contributing":[84],"term":[85],"definitions":[86,98],"providing":[88],"examples":[89],"prompt":[91],"AI-definitions":[93],"refinement.":[94,111],"Nineteen":[95],"(19)":[96],"AI-generated":[97],"were":[99],"successfully":[100],"created,":[101],"iterative":[103],"feedback":[104],"loops":[105],"demonstrating":[106],"feasibility":[108,115],"of":[109,123],"Findings":[112],"confirm":[113],"highlighting":[118],"1)":[119],"successful":[121],"proof":[122],"concept,":[124],"2)":[125],"alignment":[126],"open-science":[130],"3)":[132],"research":[134],"protocol":[135],"guide":[137],"future":[138],"studies,":[139],"4)":[141],"potential":[143],"scalability":[145],"across":[146],"domains.":[147],"Overall,":[148],"MatSci-YAMZ's":[149],"underlying":[150],"has":[152],"capacity":[154],"enhance":[156],"semantic":[157],"transparency":[158],"reduce":[160],"time":[161],"required":[162],"consensus":[164],"building":[165]},"counts_by_year":[],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2025-12-12T00:00:00"}
