{"id":"https://openalex.org/W7115596974","doi":"https://doi.org/10.48550/arxiv.2512.11184","title":"On the failure of ReLU activation for physics-informed machine learning","display_name":"On the failure of ReLU activation for physics-informed machine learning","publication_year":2025,"publication_date":"2025-12-12","ids":{"openalex":"https://openalex.org/W7115596974","doi":"https://doi.org/10.48550/arxiv.2512.11184"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2512.11184","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.11184","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2512.11184","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Rowan, Conor","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Rowan, Conor","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11206","display_name":"Model Reduction and Neural Networks","score":0.9670000076293945,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11206","display_name":"Model Reduction and Neural Networks","score":0.9670000076293945,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.012199999764561653,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12611","display_name":"Neural Networks and Reservoir Computing","score":0.009200000204145908,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.65829998254776},{"id":"https://openalex.org/keywords/activation-function","display_name":"Activation function","score":0.597599983215332},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5766000151634216},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.49639999866485596},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4717999994754791},{"id":"https://openalex.org/keywords/piecewise","display_name":"Piecewise","score":0.4625999927520752},{"id":"https://openalex.org/keywords/differential","display_name":"Differential (mechanical device)","score":0.3889999985694885}],"concepts":[{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.65829998254776},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6195999979972839},{"id":"https://openalex.org/C38365724","wikidata":"https://www.wikidata.org/wiki/Q4677469","display_name":"Activation function","level":3,"score":0.597599983215332},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5766000151634216},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5217000246047974},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.49639999866485596},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4717999994754791},{"id":"https://openalex.org/C164660894","wikidata":"https://www.wikidata.org/wiki/Q2037833","display_name":"Piecewise","level":2,"score":0.4625999927520752},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.45989999175071716},{"id":"https://openalex.org/C93226319","wikidata":"https://www.wikidata.org/wiki/Q193137","display_name":"Differential (mechanical device)","level":2,"score":0.3889999985694885},{"id":"https://openalex.org/C17095337","wikidata":"https://www.wikidata.org/wiki/Q2375229","display_name":"Piecewise linear function","level":2,"score":0.36970001459121704},{"id":"https://openalex.org/C91873725","wikidata":"https://www.wikidata.org/wiki/Q3445816","display_name":"Function approximation","level":3,"score":0.3222000002861023},{"id":"https://openalex.org/C39891107","wikidata":"https://www.wikidata.org/wiki/Q5767098","display_name":"Hinge loss","level":3,"score":0.3221000134944916},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.32179999351501465},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3197999894618988},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.31459999084472656},{"id":"https://openalex.org/C92047909","wikidata":"https://www.wikidata.org/wiki/Q204034","display_name":"Hyperbolic function","level":2,"score":0.29089999198913574},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.28700000047683716},{"id":"https://openalex.org/C78045399","wikidata":"https://www.wikidata.org/wiki/Q11214","display_name":"Differential equation","level":2,"score":0.25859999656677246}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2512.11184","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.11184","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2512.11184","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.11184","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.49946069717407227,"display_name":"No poverty","id":"https://metadata.un.org/sdg/1"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Physics-informed":[0],"machine":[1,21,88],"learning":[2,22,89],"uses":[3],"governing":[4],"ordinary":[5],"and/or":[6],"partial":[7],"differential":[8,50,109],"equations":[9],"to":[10,14,162,176],"train":[11],"neural":[12],"networks":[13],"represent":[15],"the":[16,24,30,35,57,68,81,96,126,135,142,145,149,170,173,181],"solution":[17,36],"field.":[18],"Like":[19],"any":[20],"problem,":[23],"choice":[25],"of":[26,34,84,100,128,134,144,151,165,172,184],"activation":[27,46,74],"function":[28],"influences":[29],"characteristics":[31],"and":[32,52,72],"performance":[33,83,183],"obtained":[37],"from":[38,104],"physics-informed":[39,87,174],"training.":[40,152],"Several":[41],"studies":[42],"have":[43,53],"compared":[44],"common":[45],"functions":[47],"on":[48,86,107,117],"benchmark":[49],"equations,":[51,110],"unanimously":[54],"found":[55],"that":[56,95,113,156],"rectified":[58],"linear":[59,98],"unit":[60],"(ReLU)":[61],"is":[62,93],"outperformed":[63],"by":[64],"competitors":[65],"such":[66],"as":[67,131],"sigmoid,":[69],"hyperbolic":[70],"tangent,":[71],"swish":[73],"functions.":[75],"In":[76],"this":[77,129],"work,":[78],"we":[79,111,154],"diagnose":[80],"poor":[82,182],"ReLU":[85,101,114],"problems.":[90],"While":[91],"it":[92,103],"well-known":[94],"piecewise":[97],"form":[99],"prevents":[102],"being":[105],"used":[106],"second-order":[108],"show":[112,155],"fails":[115,161],"even":[116],"variational":[118],"problems":[119],"involving":[120],"only":[121],"first":[122],"derivatives.":[123],"We":[124],"identify":[125],"cause":[127],"failure":[130],"second":[132],"derivatives":[133,164],"activation,":[136],"which":[137,168],"are":[138],"taken":[139],"not":[140],"in":[141,148,159],"formulation":[143],"loss,":[146],"but":[147],"process":[150],"Namely,":[153],"automatic":[157],"differentiation":[158],"PyTorch":[160],"characterize":[163],"discontinuous":[166],"fields,":[167],"causes":[169],"gradient":[171],"loss":[175],"be":[177],"mis-specified,":[178],"thus":[179],"explaining":[180],"ReLU.":[185]},"counts_by_year":[],"updated_date":"2025-12-16T23:48:00.217561","created_date":"2025-12-16T00:00:00"}
