{"id":"https://openalex.org/W4396744419","doi":"https://doi.org/10.48550/arxiv.2405.03095","title":"Loss Jump During Loss Switch in Solving PDEs with Neural Networks","display_name":"Loss Jump During Loss Switch in Solving PDEs with Neural Networks","publication_year":2024,"publication_date":"2024-05-06","ids":{"openalex":"https://openalex.org/W4396744419","doi":"https://doi.org/10.48550/arxiv.2405.03095"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2405.03095","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2405.03095","pdf_url":"https://arxiv.org/pdf/2405.03095","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2405.03095","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100449969","display_name":"Zhiwei Wang","orcid":"https://orcid.org/0000-0002-9402-4729"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Wang, Zhiwei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083851669","display_name":"Lulu Zhang","orcid":"https://orcid.org/0000-0002-9069-1145"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Lulu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084678300","display_name":"Zhongwang Zhang","orcid":"https://orcid.org/0009-0006-4202-8556"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Zhongwang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5002236438","display_name":"Zhi\u2010Qin John Xu","orcid":"https://orcid.org/0000-0003-0627-3520"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Zhi-Qin John","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100449969"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13717","display_name":"Advanced Algorithms and Applications","score":0.13130000233650208,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13717","display_name":"Advanced Algorithms and Applications","score":0.13130000233650208,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11343","display_name":"Power Transformer Diagnostics and Insulation","score":0.12099999934434891,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14225","display_name":"Advanced Sensor and Control Systems","score":0.11890000104904175,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/jump","display_name":"Jump","score":0.7587053775787354},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.6807235479354858},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.47475770115852356},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.39009299874305725},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.22101819515228271},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.1388421654701233}],"concepts":[{"id":"https://openalex.org/C2780695682","wikidata":"https://www.wikidata.org/wiki/Q4005959","display_name":"Jump","level":2,"score":0.7587053775787354},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.6807235479354858},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.47475770115852356},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.39009299874305725},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.22101819515228271},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.1388421654701233},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2405.03095","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2405.03095","pdf_url":"https://arxiv.org/pdf/2405.03095","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2405.03095","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2405.03095","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2405.03095","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2405.03095","pdf_url":"https://arxiv.org/pdf/2405.03095","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4396744419.pdf","grobid_xml":"https://content.openalex.org/works/W4396744419.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052","https://openalex.org/W2382290278","https://openalex.org/W4395014643"],"abstract_inverted_index":{"Using":[0],"neural":[1,115,147,170,183,201],"networks":[2,22,116,171,184,202],"to":[3,135],"solve":[4],"partial":[5],"differential":[6],"equations":[7],"(PDEs)":[8],"is":[9],"gaining":[10],"popularity":[11],"as":[12,78],"an":[13],"alternative":[14,83],"approach":[15,84],"in":[16,203],"the":[17,30,60,69,72,112,128,132,136,146,153,165,179,197],"scientific":[18],"computing":[19],"community.":[20],"Neural":[21],"can":[23,46,75],"integrate":[24],"different":[25,108,141,166,173],"types":[26],"of":[27,71,89,99,114,143,169,182,200],"information":[28],"into":[29,50],"loss":[31,44,55,65,109,129,134,174],"function.":[32],"These":[33,43],"include":[34],"observation":[35,53],"data,":[36],"governing":[37],"equations,":[38],"and":[39,58,96],"variational":[40],"forms,":[41],"etc.":[42],"functions":[45,66,110],"be":[47,76],"broadly":[48],"categorized":[49],"two":[51],"types:":[52],"data":[54,133],"directly":[56],"constrains":[57],"measures":[59],"model":[61,68,79,137,186],"output,":[62],"while":[63],"other":[64],"indirectly":[67],"performance":[70],"network,":[73],"which":[74,139],"classified":[77],"loss.":[80,187],"However,":[81],"this":[82,161],"lacks":[85],"a":[86,122,192],"thorough":[87],"understanding":[88],"its":[90],"underlying":[91,198],"mechanisms,":[92],"including":[93],"theoretical":[94],"foundations":[95],"rigorous":[97],"characterization":[98],"various":[100],"phenomena.":[101],"This":[102,188],"work":[103],"focuses":[104],"on":[105],"investigating":[106],"how":[107],"impact":[111],"training":[113],"for":[117,195],"solving":[118,204],"PDEs.":[119,205],"We":[120,176],"discover":[121],"stable":[123],"loss-jump":[124,189],"phenomenon:":[125],"when":[126],"switching":[127],"function":[130],"from":[131,152,164],"loss,":[138],"includes":[140],"orders":[142],"derivative":[144],"information,":[145],"network":[148],"solution":[149,155],"significantly":[150],"deviates":[151],"exact":[154],"immediately.":[156],"Further":[157],"experiments":[158],"reveal":[159],"that":[160],"phenomenon":[162,190],"arises":[163],"frequency":[167,180],"preferences":[168],"under":[172,185],"functions.":[175],"theoretically":[177],"analyze":[178],"preference":[181],"provides":[191],"valuable":[193],"perspective":[194],"examining":[196],"mechanisms":[199]},"counts_by_year":[],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
