{"id":"https://openalex.org/W2902953211","doi":"https://doi.org/10.1109/icpr.2018.8546078","title":"Learning to Learn Second-Order Back-Propagation for CNNs Using LSTMs","display_name":"Learning to Learn Second-Order Back-Propagation for CNNs Using LSTMs","publication_year":2018,"publication_date":"2018-08-01","ids":{"openalex":"https://openalex.org/W2902953211","doi":"https://doi.org/10.1109/icpr.2018.8546078","mag":"2902953211"},"language":"en","primary_location":{"id":"doi:10.1109/icpr.2018.8546078","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icpr.2018.8546078","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 24th International Conference on Pattern Recognition (ICPR)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5076846018","display_name":"Anirban Roy","orcid":"https://orcid.org/0009-0000-6889-0204"},"institutions":[{"id":"https://openalex.org/I4210099336","display_name":"Menlo School","ror":"https://ror.org/01240pn49","country_code":"US","type":"education","lineage":["https://openalex.org/I4210099336"]},{"id":"https://openalex.org/I1298353152","display_name":"SRI International","ror":"https://ror.org/05s570m15","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1298353152"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Anirban Roy","raw_affiliation_strings":["SRI International, Menlo Park, USA"],"affiliations":[{"raw_affiliation_string":"SRI International, Menlo Park, USA","institution_ids":["https://openalex.org/I1298353152","https://openalex.org/I4210099336"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5027742996","display_name":"Sini\u0161a Todorovi\u0107","orcid":"https://orcid.org/0000-0001-5793-5921"},"institutions":[{"id":"https://openalex.org/I131249849","display_name":"Oregon State University","ror":"https://ror.org/00ysfqy60","country_code":"US","type":"education","lineage":["https://openalex.org/I131249849"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sinisa Todorovic","raw_affiliation_strings":["Oregon State University, Corvallis, USA"],"affiliations":[{"raw_affiliation_string":"Oregon State University, Corvallis, USA","institution_ids":["https://openalex.org/I131249849"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5076846018"],"corresponding_institution_ids":["https://openalex.org/I1298353152","https://openalex.org/I4210099336"],"apc_list":null,"apc_paid":null,"fwci":0.3258,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.68775422,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"4","issue":null,"first_page":"97","last_page":"102"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7940128445625305},{"id":"https://openalex.org/keywords/backpropagation","display_name":"Backpropagation","score":0.732417106628418},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.7128972411155701},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.7035866379737854},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6991324424743652},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5742292404174805},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.5694238543510437},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4590604901313782},{"id":"https://openalex.org/keywords/rate-of-convergence","display_name":"Rate of convergence","score":0.4374709725379944},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4058886170387268},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3239481449127197},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.12430247664451599}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7940128445625305},{"id":"https://openalex.org/C155032097","wikidata":"https://www.wikidata.org/wiki/Q798503","display_name":"Backpropagation","level":3,"score":0.732417106628418},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.7128972411155701},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.7035866379737854},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6991324424743652},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5742292404174805},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.5694238543510437},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4590604901313782},{"id":"https://openalex.org/C57869625","wikidata":"https://www.wikidata.org/wiki/Q1783502","display_name":"Rate of convergence","level":3,"score":0.4374709725379944},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4058886170387268},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3239481449127197},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.12430247664451599},{"id":"https://openalex.org/C50522688","wikidata":"https://www.wikidata.org/wiki/Q189833","display_name":"Economic growth","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icpr.2018.8546078","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icpr.2018.8546078","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 24th International Conference on Pattern Recognition (ICPR)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W19621276","https://openalex.org/W99485931","https://openalex.org/W196761320","https://openalex.org/W1522301498","https://openalex.org/W1899249567","https://openalex.org/W1904365287","https://openalex.org/W2064675550","https://openalex.org/W2089217417","https://openalex.org/W2097428361","https://openalex.org/W2108598243","https://openalex.org/W2112514080","https://openalex.org/W2112796928","https://openalex.org/W2122053572","https://openalex.org/W2136058147","https://openalex.org/W2766736793","https://openalex.org/W2951282416","https://openalex.org/W2963446085","https://openalex.org/W2963586744","https://openalex.org/W2963775850","https://openalex.org/W2964121744","https://openalex.org/W3118608800","https://openalex.org/W6600828528","https://openalex.org/W6608133726","https://openalex.org/W6631190155","https://openalex.org/W6639736602","https://openalex.org/W6674634876","https://openalex.org/W6680358937","https://openalex.org/W6681804681","https://openalex.org/W6713348437","https://openalex.org/W6717367658"],"related_works":["https://openalex.org/W4239286941","https://openalex.org/W2088845016","https://openalex.org/W589102260","https://openalex.org/W4226493464","https://openalex.org/W4312417841","https://openalex.org/W3133861977","https://openalex.org/W2951211570","https://openalex.org/W3103566983","https://openalex.org/W3167935049","https://openalex.org/W3029198973"],"abstract_inverted_index":{"Convolutional":[0],"neural":[1],"networks":[2],"(CNNs)":[3],"typically":[4],"suffer":[5],"from":[6],"slow":[7],"convergence":[8],"rates":[9,34,117],"in":[10,88],"training,":[11],"which":[12],"limits":[13],"their":[14],"wider":[15],"application.":[16],"This":[17],"paper":[18],"presents":[19],"a":[20,75,138,152,162],"new":[21],"CNN":[22,86,101,154],"learning":[23,46,49,68,90,98,121,161],"approach,":[24],"based":[25],"on":[26,106],"second-order":[27,112],"methods,":[28,38],"aimed":[29],"at":[30],"improving:":[31],"a)":[32],"Convergence":[33],"of":[35,45,65,85,94,99],"existing":[36],"gradient-based":[37,120],"and":[39,62,97,126],"b)":[40],"Robustness":[41],"to":[42,74,81,130,134,150],"the":[43,66,95,100,123],"choice":[44],"hyper-parameters":[47],"(e.g.,":[48],"rate).":[50],"We":[51,143],"derive":[52],"an":[53,147],"efficient":[54],"back-propagation":[55],"algorithm":[56],"for":[57,122,141,160],"simultaneously":[58],"computing":[59],"both":[60],"gradients":[61],"second":[63],"derivatives":[64],"CNN's":[67],"objective.":[69],"These":[70],"are":[71,102],"then":[72],"input":[73],"Long":[76],"Short":[77],"Term":[78],"Memory":[79],"(LSTM)":[80],"predict":[82],"optimal":[83],"updates":[84],"parameters":[87],"each":[89],"iteration.":[91],"Both":[92],"meta-learning":[93],"LSTM":[96,148],"conducted":[103],"jointly.":[104],"Evaluation":[105],"image":[107],"classification":[108],"demonstrates":[109],"that":[110,127,146],"our":[111],"backpropagation":[113],"has":[114],"faster":[115],"convergences":[116],"than":[118],"standard":[119],"same":[124],"CNN,":[125],"it":[128],"converges":[129],"better":[131,135],"optima":[132],"leading":[133],"performance":[136],"under":[137],"budgeted":[139],"time":[140],"learning.":[142],"also":[144],"show":[145],"learned":[149],"learn":[151],"small":[153],"network":[155],"can":[156],"be":[157],"readily":[158],"used":[159],"larger":[163],"network.":[164]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2020,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
