{"id":"https://openalex.org/W7119537018","doi":"https://doi.org/10.48550/arxiv.2601.03704","title":"Investigating Knowledge Distillation Through Neural Networks for Protein Binding Affinity Prediction","display_name":"Investigating Knowledge Distillation Through Neural Networks for Protein Binding Affinity Prediction","publication_year":2026,"publication_date":"2026-01-07","ids":{"openalex":"https://openalex.org/W7119537018","doi":"https://doi.org/10.48550/arxiv.2601.03704"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2601.03704","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.03704","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2601.03704","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5012765005","display_name":"Wajid Arshad Abbasi","orcid":"https://orcid.org/0000-0001-7691-5715"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Abbasi, Wajid Arshad","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122376933","display_name":"Syed Ali Abbas","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Abbas, Syed Ali","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122317038","display_name":"Maryum Bibi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bibi, Maryum","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077224800","display_name":"Saiqa Andleeb","orcid":"https://orcid.org/0000-0001-7888-6444"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Andleeb, Saiqa","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5101098368","display_name":"Muhammad Naveed Akhtar","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Akhtar, Muhammad Naveed","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5012765005"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10044","display_name":"Protein Structure and Dynamics","score":0.5950000286102295,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10044","display_name":"Protein Structure and Dynamics","score":0.5950000286102295,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12576","display_name":"vaccines and immunoinformatics approaches","score":0.18850000202655792,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.048700001090765,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.6577000021934509},{"id":"https://openalex.org/keywords/mean-squared-error","display_name":"Mean squared error","score":0.6225000023841858},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6025000214576721},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.544700026512146},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5285000205039978},{"id":"https://openalex.org/keywords/regression","display_name":"Regression","score":0.4999000132083893},{"id":"https://openalex.org/keywords/linear-regression","display_name":"Linear regression","score":0.4997999966144562},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.42080000042915344}],"concepts":[{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.6577000021934509},{"id":"https://openalex.org/C139945424","wikidata":"https://www.wikidata.org/wiki/Q1940696","display_name":"Mean squared error","level":2,"score":0.6225000023841858},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6025000214576721},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.6015999913215637},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5577999949455261},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.544700026512146},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5285000205039978},{"id":"https://openalex.org/C83546350","wikidata":"https://www.wikidata.org/wiki/Q1139051","display_name":"Regression","level":2,"score":0.4999000132083893},{"id":"https://openalex.org/C48921125","wikidata":"https://www.wikidata.org/wiki/Q10861030","display_name":"Linear regression","level":2,"score":0.4997999966144562},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4984000027179718},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.43380001187324524},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.42080000042915344},{"id":"https://openalex.org/C152877465","wikidata":"https://www.wikidata.org/wiki/Q208042","display_name":"Regression analysis","level":2,"score":0.37790000438690186},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.37139999866485596},{"id":"https://openalex.org/C204030448","wikidata":"https://www.wikidata.org/wiki/Q101017","display_name":"Distillation","level":2,"score":0.3594000041484833},{"id":"https://openalex.org/C167085575","wikidata":"https://www.wikidata.org/wiki/Q6803654","display_name":"Mean squared prediction error","level":2,"score":0.30469998717308044},{"id":"https://openalex.org/C2780092901","wikidata":"https://www.wikidata.org/wiki/Q3433612","display_name":"Correlation coefficient","level":2,"score":0.27900001406669617},{"id":"https://openalex.org/C22367795","wikidata":"https://www.wikidata.org/wiki/Q7625208","display_name":"Structured prediction","level":2,"score":0.27129998803138733},{"id":"https://openalex.org/C155032097","wikidata":"https://www.wikidata.org/wiki/Q798503","display_name":"Backpropagation","level":3,"score":0.2653999924659729},{"id":"https://openalex.org/C128990827","wikidata":"https://www.wikidata.org/wiki/Q192830","display_name":"Coefficient of determination","level":2,"score":0.2630000114440918},{"id":"https://openalex.org/C186060115","wikidata":"https://www.wikidata.org/wiki/Q30336093","display_name":"Biological system","level":1,"score":0.2533000111579895},{"id":"https://openalex.org/C182306322","wikidata":"https://www.wikidata.org/wiki/Q1779371","display_name":"Order (exchange)","level":2,"score":0.251800000667572},{"id":"https://openalex.org/C10010492","wikidata":"https://www.wikidata.org/wiki/Q3142557","display_name":"Protein sequencing","level":4,"score":0.25099998712539673}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2601.03704","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.03704","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2601.03704","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.03704","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0,17,66,214],"trade-off":[1],"between":[2,187],"predictive":[3],"accuracy":[4],"and":[5,59,73,120,137,153,169,189],"data":[6,56,63],"availability":[7],"makes":[8],"it":[9],"difficult":[10],"to":[11,39,77,100,182,211],"predict":[12],"protein--protein":[13,107],"binding":[14,70,108,224],"affinity":[15,71,109,225],"accurately.":[16],"lack":[18],"of":[19,27,82,90,118,123,135,140,151,156],"experimentally":[20],"resolved":[21],"protein":[22,54],"structures":[23],"limits":[24],"the":[25,80,88,102,159,180,184,221],"performance":[26,185],"structure-based":[28,146,190],"machine":[29],"learning":[30],"models,":[31,131],"which":[32],"generally":[33],"outperform":[34],"sequence-based":[35,84,188,212],"methods.":[36],"In":[37],"order":[38],"overcome":[40],"this":[41],"constraint,":[42],"we":[43],"suggest":[44],"a":[45,83,91,105,133,149],"regression":[46],"framework":[47,103],"based":[48],"on":[49,104],"knowledge":[50,201,210],"distillation":[51,202],"that":[52,200],"uses":[53,69],"structural":[55,209],"during":[57,64],"training":[58,81],"only":[60],"needs":[61],"sequence":[62],"inference.":[65],"suggested":[67],"method":[68,206],"labels":[72],"intermediate":[74],"feature":[75],"representations":[76],"jointly":[78],"supervise":[79],"student":[85,161],"network":[86],"under":[87],"guidance":[89],"structure-informed":[92],"teacher":[93],"network.":[94],"Leave-One-Complex-Out":[95],"(LOCO)":[96],"cross-validation":[97],"was":[98],"used":[99],"assess":[101],"non-redundant":[106],"benchmark":[110],"dataset.":[111],"A":[112],"maximum":[113],"Pearson":[114],"correlation":[115],"coefficient":[116],"(P_r)":[117],"0.375":[119],"an":[121,138,154,204],"RMSE":[122,139,155],"2.712":[124],"kcal/mol":[125,142],"were":[126,143,172],"obtained":[127,144],"by":[128,145,175],"sequence-only":[129,165],"baseline":[130],"whereas":[132],"P_r":[134,150],"0.512":[136],"2.445":[141],"models.":[147],"With":[148,179],"0.481":[152],"2.488":[157],"kcal/mol,":[158],"distillation-based":[160,223],"model":[162],"greatly":[163],"enhanced":[164],"performance.":[166],"Improved":[167],"agreement":[168],"decreased":[170],"bias":[171],"further":[173],"confirmed":[174],"thorough":[176],"error":[177],"analyses.":[178],"potential":[181],"close":[183],"gap":[186],"models":[191],"as":[192],"larger":[193],"datasets":[194],"become":[195],"available,":[196],"these":[197],"findings":[198],"show":[199],"is":[203],"efficient":[205],"for":[207,217],"transferring":[208],"predictors.":[213],"source":[215],"code":[216],"running":[218],"inference":[219],"with":[220],"proposed":[222],"predictor":[226],"can":[227],"be":[228],"accessed":[229],"at":[230],"https://github.com/wajidarshad/ProteinAffinityKD.":[231]},"counts_by_year":[],"updated_date":"2026-05-03T08:25:01.440150","created_date":"2026-01-09T00:00:00"}
