{"id":"https://openalex.org/W7160841459","doi":"https://doi.org/10.48550/arxiv.2605.06762","title":"A Linear-Transformer Hybrid for SNP-Based Genotype-to-Phenotype Prediction in Grapevine","display_name":"A Linear-Transformer Hybrid for SNP-Based Genotype-to-Phenotype Prediction in Grapevine","publication_year":2026,"publication_date":"2026-05-07","ids":{"openalex":"https://openalex.org/W7160841459","doi":"https://doi.org/10.48550/arxiv.2605.06762"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.06762","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.06762","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.06762","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5135844990","display_name":"Yibin Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Yibin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135860250","display_name":"Murukarthick Jayakodi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jayakodi, Murukarthick","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135850372","display_name":"Silvas Kirubakaran","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kirubakaran, Silvas","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045833111","display_name":"Ambika Chandra","orcid":"https://orcid.org/0000-0002-4996-4383"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chandra, Ambika","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5033568355","display_name":"Azlan Zahid","orcid":"https://orcid.org/0000-0001-6202-8680"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zahid, Azlan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11796","display_name":"Horticultural and Viticultural Research","score":0.8111000061035156,"subfield":{"id":"https://openalex.org/subfields/1110","display_name":"Plant Science"},"field":{"id":"https://openalex.org/fields/11","display_name":"Agricultural and Biological Sciences"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T11796","display_name":"Horticultural and Viticultural Research","score":0.8111000061035156,"subfield":{"id":"https://openalex.org/subfields/1110","display_name":"Plant Science"},"field":{"id":"https://openalex.org/fields/11","display_name":"Agricultural and Biological Sciences"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10594","display_name":"Genetic and phenotypic traits in livestock","score":0.08320000022649765,"subfield":{"id":"https://openalex.org/subfields/1311","display_name":"Genetics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11468","display_name":"Genetic Mapping and Diversity in Plants and Animals","score":0.01549999974668026,"subfield":{"id":"https://openalex.org/subfields/1311","display_name":"Genetics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.7271999716758728},{"id":"https://openalex.org/keywords/snp","display_name":"SNP","score":0.4661000072956085},{"id":"https://openalex.org/keywords/quantitative-trait-locus","display_name":"Quantitative trait locus","score":0.4575999975204468},{"id":"https://openalex.org/keywords/mean-squared-prediction-error","display_name":"Mean squared prediction error","score":0.44609999656677246},{"id":"https://openalex.org/keywords/predictive-modelling","display_name":"Predictive modelling","score":0.3817000091075897},{"id":"https://openalex.org/keywords/genomic-selection","display_name":"Genomic selection","score":0.37950000166893005},{"id":"https://openalex.org/keywords/additive-model","display_name":"Additive model","score":0.3767000138759613},{"id":"https://openalex.org/keywords/single-nucleotide-polymorphism","display_name":"Single-nucleotide polymorphism","score":0.36959999799728394},{"id":"https://openalex.org/keywords/polygene","display_name":"Polygene","score":0.3628000020980835}],"concepts":[{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.7271999716758728},{"id":"https://openalex.org/C139275648","wikidata":"https://www.wikidata.org/wiki/Q17134011","display_name":"SNP","level":5,"score":0.4661000072956085},{"id":"https://openalex.org/C81941488","wikidata":"https://www.wikidata.org/wiki/Q853421","display_name":"Quantitative trait locus","level":3,"score":0.4575999975204468},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.4555000066757202},{"id":"https://openalex.org/C167085575","wikidata":"https://www.wikidata.org/wiki/Q6803654","display_name":"Mean squared prediction error","level":2,"score":0.44609999656677246},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.38940000534057617},{"id":"https://openalex.org/C45804977","wikidata":"https://www.wikidata.org/wiki/Q7239673","display_name":"Predictive modelling","level":2,"score":0.3817000091075897},{"id":"https://openalex.org/C2992444039","wikidata":"https://www.wikidata.org/wiki/Q17145598","display_name":"Genomic selection","level":5,"score":0.37950000166893005},{"id":"https://openalex.org/C203223496","wikidata":"https://www.wikidata.org/wiki/Q4681344","display_name":"Additive model","level":2,"score":0.3767000138759613},{"id":"https://openalex.org/C153209595","wikidata":"https://www.wikidata.org/wiki/Q501128","display_name":"Single-nucleotide polymorphism","level":4,"score":0.36959999799728394},{"id":"https://openalex.org/C84799019","wikidata":"https://www.wikidata.org/wiki/Q426365","display_name":"Polygene","level":4,"score":0.3628000020980835},{"id":"https://openalex.org/C103545067","wikidata":"https://www.wikidata.org/wiki/Q796265","display_name":"Best linear unbiased prediction","level":3,"score":0.36059999465942383},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.3580000102519989},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3337000012397766},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.3142000138759613},{"id":"https://openalex.org/C130073038","wikidata":"https://www.wikidata.org/wiki/Q1211967","display_name":"Phenotypic trait","level":4,"score":0.31040000915527344},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.30640000104904175},{"id":"https://openalex.org/C196083921","wikidata":"https://www.wikidata.org/wiki/Q7915758","display_name":"Variance (accounting)","level":2,"score":0.299699991941452},{"id":"https://openalex.org/C61727976","wikidata":"https://www.wikidata.org/wiki/Q751748","display_name":"Epistasis","level":3,"score":0.29330000281333923},{"id":"https://openalex.org/C163175372","wikidata":"https://www.wikidata.org/wiki/Q3339222","display_name":"Linear model","level":2,"score":0.29179999232292175},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.29010000824928284},{"id":"https://openalex.org/C127716648","wikidata":"https://www.wikidata.org/wiki/Q104053","display_name":"Phenotype","level":3,"score":0.2874999940395355},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.28380000591278076},{"id":"https://openalex.org/C83546350","wikidata":"https://www.wikidata.org/wiki/Q1139051","display_name":"Regression","level":2,"score":0.2800000011920929},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.27720001339912415},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2745000123977661},{"id":"https://openalex.org/C186060115","wikidata":"https://www.wikidata.org/wiki/Q30336093","display_name":"Biological system","level":1,"score":0.274399995803833},{"id":"https://openalex.org/C56221022","wikidata":"https://www.wikidata.org/wiki/Q1125215","display_name":"Trichome","level":2,"score":0.27410000562667847},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast (vision)","level":2,"score":0.2563000023365021},{"id":"https://openalex.org/C3019719930","wikidata":"https://www.wikidata.org/wiki/Q3910099","display_name":"Predictive value","level":2,"score":0.2551000118255615}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.06762","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.06762","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.06762","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.06762","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Robust":[0],"genotype-to-phenotype":[1],"(G2P)":[2],"prediction":[3,103],"is":[4],"essential":[5],"for":[6,75,169,194],"accelerating":[7],"breeding":[8],"decisions":[9],"and":[10,25,73,88,96,120,127,137,160,188],"genetic":[11,46],"gain.":[12],"However,":[13],"it":[14],"remains":[15],"challenging":[16],"to":[17,164],"measure":[18],"complex":[19],"traits":[20,83],"under":[21],"variable":[22],"field":[23],"conditions":[24],"across":[26,77],"years.":[27,80],"In":[28,151],"this":[29],"study,":[30],"we":[31,153],"propose":[32],"a":[33,63],"linear-Transformer":[34],"approach,":[35],"LiT-G2P":[36,61,100,112,143],"(Linear-Transformer":[37],"Genotype-to-Phenotype),":[38],"an":[39],"automated":[40],"predictive":[41,192],"framework":[42],"that":[43,175],"integrates":[44],"additive":[45,178],"variance":[47],"effects":[48,179],"with":[49,70,106,123,180],"Transformer-based":[50],"nonlinear":[51],"interactions":[52],"using":[53],"genome-wide":[54],"single-nucleotide":[55],"polymorphisms":[56],"(SNPs)":[57],"data.":[58],"We":[59],"evaluated":[60],"on":[62],"panel":[64],"of":[65,91,125,135],"diverse":[66],"grape":[67],"accessions,":[68],"genotyped":[69],"SNP":[71],"markers":[72],"measured":[74],"phenotypes":[76],"two":[78],"consecutive":[79],"Target":[81],"phenotypic":[82],"include":[84],"leaf":[85],"hair":[86,110],"density":[87,90],"trichome":[89,141],"grapevines.":[92],"Across":[93],"both":[94,118],"single-year":[95,119],"cross-year":[97,121,186],"testing":[98],"scenarios,":[99],"consistently":[101],"improves":[102],"performance":[104],"compared":[105],"baseline":[107],"models.":[108],"For":[109,140],"density,":[111,142],"achieves":[113],"the":[114,146],"lowest":[115],"error":[116],"in":[117],"evaluations,":[122],"RMSEs":[124],"0.469":[126],"0.454,":[128],"respectively,":[129],"while":[130],"maintaining":[131],"strong":[132],"tolerance":[133],"accuracies":[134],"79.2%":[136],"74.6%,":[138],"respectively.":[139],"also":[144],"presents":[145],"best":[147],"overall":[148],"G2P":[149],"performance.":[150],"addition,":[152],"extract":[154],"model-prioritized":[155],"SNPs":[156],"from":[157],"attention":[158],"weights":[159],"apply":[161],"genotype-stratified":[162],"analysis":[163],"provide":[165],"interpretable":[166],"candidate":[167],"marker":[168],"downstream":[170],"validation.":[171],"These":[172],"results":[173],"demonstrate":[174],"integrating":[176],"stable":[177],"learned":[181],"interaction":[182],"patterns":[183],"can":[184],"enhance":[185],"robustness":[187],"support":[189],"practical":[190],"SNP-based":[191],"modeling":[193],"genomic":[195],"selection.":[196]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-12T00:00:00"}
