{"id":"https://openalex.org/W7136314106","doi":"https://doi.org/10.48550/arxiv.2603.13098","title":"SldprtNet: A Large-Scale Multimodal Dataset for CAD Generation in Language-Driven 3D Design","display_name":"SldprtNet: A Large-Scale Multimodal Dataset for CAD Generation in Language-Driven 3D Design","publication_year":2026,"publication_date":"2026-03-13","ids":{"openalex":"https://openalex.org/W7136314106","doi":"https://doi.org/10.48550/arxiv.2603.13098"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.13098","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.13098","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.13098","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5129552062","display_name":"Ruogu Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Li, Ruogu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129545714","display_name":"Sikai Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Sikai","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129463262","display_name":"Yao Mu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mu, Yao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5022382771","display_name":"Mingyu Ding","orcid":"https://orcid.org/0000-0001-6556-8359"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ding, Mingyu","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5129552062"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.6025999784469604,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.6025999784469604,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11159","display_name":"Manufacturing Process and Optimization","score":0.11760000139474869,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.03150000050663948,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cad","display_name":"CAD","score":0.7508000135421753},{"id":"https://openalex.org/keywords/parameterized-complexity","display_name":"Parameterized complexity","score":0.6064000129699707},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.5649999976158142},{"id":"https://openalex.org/keywords/parametric-model","display_name":"Parametric model","score":0.47369998693466187},{"id":"https://openalex.org/keywords/parametric-statistics","display_name":"Parametric statistics","score":0.45320001244544983},{"id":"https://openalex.org/keywords/transformation","display_name":"Transformation (genetics)","score":0.45019999146461487},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.424699991941452},{"id":"https://openalex.org/keywords/viewpoints","display_name":"Viewpoints","score":0.42399999499320984},{"id":"https://openalex.org/keywords/solid-modeling","display_name":"Solid modeling","score":0.41190001368522644},{"id":"https://openalex.org/keywords/3d-modeling","display_name":"3D modeling","score":0.40290001034736633}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7892000079154968},{"id":"https://openalex.org/C194789388","wikidata":"https://www.wikidata.org/wiki/Q17855283","display_name":"CAD","level":2,"score":0.7508000135421753},{"id":"https://openalex.org/C165464430","wikidata":"https://www.wikidata.org/wiki/Q1570441","display_name":"Parameterized complexity","level":2,"score":0.6064000129699707},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.5649999976158142},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5260000228881836},{"id":"https://openalex.org/C24574437","wikidata":"https://www.wikidata.org/wiki/Q7135228","display_name":"Parametric model","level":3,"score":0.47369998693466187},{"id":"https://openalex.org/C117251300","wikidata":"https://www.wikidata.org/wiki/Q1849855","display_name":"Parametric statistics","level":2,"score":0.45320001244544983},{"id":"https://openalex.org/C204241405","wikidata":"https://www.wikidata.org/wiki/Q461499","display_name":"Transformation (genetics)","level":3,"score":0.45019999146461487},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.424699991941452},{"id":"https://openalex.org/C2776035091","wikidata":"https://www.wikidata.org/wiki/Q7928819","display_name":"Viewpoints","level":2,"score":0.42399999499320984},{"id":"https://openalex.org/C108882727","wikidata":"https://www.wikidata.org/wiki/Q2991685","display_name":"Solid modeling","level":2,"score":0.41190001368522644},{"id":"https://openalex.org/C2777897806","wikidata":"https://www.wikidata.org/wiki/Q568742","display_name":"3D modeling","level":2,"score":0.40290001034736633},{"id":"https://openalex.org/C44210515","wikidata":"https://www.wikidata.org/wiki/Q16968978","display_name":"Bespoke","level":2,"score":0.38839998841285706},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.37130001187324524},{"id":"https://openalex.org/C56435381","wikidata":"https://www.wikidata.org/wiki/Q1196371","display_name":"Geometric transformation","level":3,"score":0.34950000047683716},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.3287000060081482},{"id":"https://openalex.org/C101738243","wikidata":"https://www.wikidata.org/wiki/Q786435","display_name":"Autoencoder","level":3,"score":0.31940001249313354},{"id":"https://openalex.org/C104065381","wikidata":"https://www.wikidata.org/wiki/Q1002535","display_name":"Geometric modeling","level":2,"score":0.31929999589920044},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.31839999556541443},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.3142000138759613},{"id":"https://openalex.org/C119823426","wikidata":"https://www.wikidata.org/wiki/Q184793","display_name":"Computer Aided Design","level":2,"score":0.31209999322891235},{"id":"https://openalex.org/C3019007443","wikidata":"https://www.wikidata.org/wiki/Q568742","display_name":"3d model","level":2,"score":0.3059999942779541},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3018999993801117},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.29809999465942383},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.2777999937534332},{"id":"https://openalex.org/C84824328","wikidata":"https://www.wikidata.org/wiki/Q4633097","display_name":"2D to 3D conversion","level":3,"score":0.2754000127315521},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.27379998564720154},{"id":"https://openalex.org/C184898388","wikidata":"https://www.wikidata.org/wiki/Q1435712","display_name":"Pairwise comparison","level":2,"score":0.2703000009059906},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.2671000063419342},{"id":"https://openalex.org/C2779791154","wikidata":"https://www.wikidata.org/wiki/Q258040","display_name":"Model transformation","level":3,"score":0.25920000672340393},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.25769999623298645},{"id":"https://openalex.org/C199639397","wikidata":"https://www.wikidata.org/wiki/Q1788588","display_name":"Engineering drawing","level":1,"score":0.2517000138759613},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.25099998712539673}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.13098","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.13098","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.13098","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.13098","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","score":0.41742271184921265,"id":"https://metadata.un.org/sdg/9"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"We":[0],"introduce":[1],"SldprtNet,":[2],"a":[3,62,79,89,135,190,237],"large-scale":[4],"dataset":[5,31,53,191,222,240],"comprising":[6],"over":[7],"242,000":[8],"industrial":[9,216],"parts,":[10,217],"designed":[11],"for":[12,27,208,220,242],"semantic-driven":[13,243],"CAD":[14,69,209,244],"modeling,":[15],"geometric":[16,233],"deep":[17],"learning,":[18],"and":[19,22,38,45,51,61,71,78,110,143,151,158,171,203,226,232,246],"the":[20,102,118,123,127,153,165,201],"training":[21,44],"fine-tuning":[23],"of":[24,68,101,139,205],"multimodal":[25,129,206,239],"models":[26,34,77,188],"3D":[28,33,76,103,159,172],"design.":[29],"The":[30],"provides":[32],"in":[35,229],"both":[36],".step":[37],".sldprt":[39],"formats":[40],"to":[41,133,178],"support":[42,65],"diverse":[43,224],"testing.":[46],"To":[47,145,181],"enable":[48,72],"parametric":[49],"modeling":[50,167,245],"facilitate":[52],"scalability,":[54],"we":[55,125,148,185],"developed":[56],"supporting":[57,218],"tools,":[58],"an":[59],"encoder":[60],"decoder,":[63],"which":[64],"13":[66],"types":[67],"commands":[70],"lossless":[73],"transformation":[74],"between":[75],"structured":[80],"text":[81,120],"representation.":[82],"Additionally,":[83],"each":[84,140],"sample":[85],"is":[86],"paired":[87],"with":[88,117,164,196],"composite":[90],"image":[91,116],"created":[92],"by":[93],"merging":[94],"seven":[95],"rendered":[96,156,169],"views":[97],"from":[98,122],"different":[99],"viewpoints":[100],"model,":[104],"effectively":[105],"reducing":[106],"input":[107],"token":[108],"length":[109],"accelerating":[111],"inference.":[112],"By":[113],"combining":[114],"this":[115],"parameterized":[119,166],"output":[121],"encoder,":[124],"employ":[126],"lightweight":[128],"language":[130,137],"model":[131,173,230],"Qwen2.5-VL-7B":[132],"generate":[134],"natural":[136],"description":[138],"part's":[141],"appearance":[142],"functionality.":[144],"ensure":[146],"accuracy,":[147],"manually":[149],"verified":[150],"aligned":[152,177],"generated":[154],"descriptions,":[155,162],"images,":[157,170],"models.":[160],"These":[161],"along":[163],"scripts,":[168],"files,":[174],"are":[175],"fully":[176],"construct":[179],"SldprtNet.":[180],"assess":[182],"its":[183],"effectiveness,":[184],"fine-tuned":[186],"baseline":[187],"on":[189],"subset,":[192],"comparing":[193],"image-plus-text":[194],"inputs":[195],"text-only":[197],"inputs.":[198],"Results":[199],"confirm":[200],"necessity":[202],"value":[204],"datasets":[207],"generation.":[210],"It":[211],"features":[212],"carefully":[213],"selected":[214],"real-world":[215],"tools":[219],"scalable":[221],"expansion,":[223],"modalities,":[225],"ensured":[227],"diversity":[228],"complexity":[231],"features,":[234],"making":[235],"it":[236],"comprehensive":[238],"built":[241],"cross-modal":[247],"learning.":[248]},"counts_by_year":[],"updated_date":"2026-03-17T07:05:13.627479","created_date":"2026-03-17T00:00:00"}
