{"id":"https://openalex.org/W4387587690","doi":"https://doi.org/10.1109/tai.2023.3323918","title":"Kullback\u2013Leibler Divergence-Based Regularized Normalization for Low-Resource Tasks","display_name":"Kullback\u2013Leibler Divergence-Based Regularized Normalization for Low-Resource Tasks","publication_year":2023,"publication_date":"2023-10-12","ids":{"openalex":"https://openalex.org/W4387587690","doi":"https://doi.org/10.1109/tai.2023.3323918"},"language":"en","primary_location":{"id":"doi:10.1109/tai.2023.3323918","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tai.2023.3323918","pdf_url":null,"source":{"id":"https://openalex.org/S4210169448","display_name":"IEEE Transactions on Artificial Intelligence","issn_l":"2691-4581","issn":["2691-4581"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5108049369","display_name":"Neeraj Kumar","orcid":"https://orcid.org/0000-0002-0485-392X"},"institutions":[{"id":"https://openalex.org/I68891433","display_name":"Indian Institute of Technology Delhi","ror":"https://ror.org/049tgcd06","country_code":"IN","type":"education","lineage":["https://openalex.org/I68891433"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Neeraj Kumar","raw_affiliation_strings":["Bharti School of Telecommunication Technology & Management, Indian Institute of Technology Delhi, New Delhi, India"],"affiliations":[{"raw_affiliation_string":"Bharti School of Telecommunication Technology & Management, Indian Institute of Technology Delhi, New Delhi, India","institution_ids":["https://openalex.org/I68891433"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109064591","display_name":"Ankur Narang","orcid":null},"institutions":[{"id":"https://openalex.org/I3132238960","display_name":"Institute of Electrical and Electronics Engineers","ror":"https://ror.org/01n002310","country_code":"US","type":"education","lineage":["https://openalex.org/I3132238960"]},{"id":"https://openalex.org/I68891433","display_name":"Indian Institute of Technology Delhi","ror":"https://ror.org/049tgcd06","country_code":"IN","type":"education","lineage":["https://openalex.org/I68891433"]}],"countries":["IN","US"],"is_corresponding":false,"raw_author_name":"Ankur Narang","raw_affiliation_strings":["Department of Electrical Engineering, Indian Institute of Technology Delhi, New Delhi, India","IEEE, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, Indian Institute of Technology Delhi, New Delhi, India","institution_ids":["https://openalex.org/I68891433"]},{"raw_affiliation_string":"IEEE, USA","institution_ids":["https://openalex.org/I3132238960"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5066116024","display_name":"Brejesh Lall","orcid":"https://orcid.org/0000-0003-2677-3071"},"institutions":[{"id":"https://openalex.org/I68891433","display_name":"Indian Institute of Technology Delhi","ror":"https://ror.org/049tgcd06","country_code":"IN","type":"education","lineage":["https://openalex.org/I68891433"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Brejesh Lall","raw_affiliation_strings":["Department of Electrical Engineering, Indian Institute of Technology Delhi, New Delhi, India"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, Indian Institute of Technology Delhi, New Delhi, India","institution_ids":["https://openalex.org/I68891433"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5108049369"],"corresponding_institution_ids":["https://openalex.org/I68891433"],"apc_list":null,"apc_paid":null,"fwci":2.0876,"has_fulltext":false,"cited_by_count":12,"citation_normalized_percentile":{"value":0.89762038,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":100},"biblio":{"volume":"5","issue":"6","first_page":"2638","last_page":"2650"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7900958061218262},{"id":"https://openalex.org/keywords/normalization","display_name":"Normalization (sociology)","score":0.7301077842712402},{"id":"https://openalex.org/keywords/overfitting","display_name":"Overfitting","score":0.7121639251708984},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6015276908874512},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5325044393539429},{"id":"https://openalex.org/keywords/affine-transformation","display_name":"Affine transformation","score":0.5235661864280701},{"id":"https://openalex.org/keywords/kullback\u2013leibler-divergence","display_name":"Kullback\u2013Leibler divergence","score":0.5096127986907959},{"id":"https://openalex.org/keywords/regularization","display_name":"Regularization (linguistics)","score":0.45378395915031433},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.35060441493988037},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3330567479133606},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.09625935554504395}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7900958061218262},{"id":"https://openalex.org/C136886441","wikidata":"https://www.wikidata.org/wiki/Q926129","display_name":"Normalization (sociology)","level":2,"score":0.7301077842712402},{"id":"https://openalex.org/C22019652","wikidata":"https://www.wikidata.org/wiki/Q331309","display_name":"Overfitting","level":3,"score":0.7121639251708984},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6015276908874512},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5325044393539429},{"id":"https://openalex.org/C92757383","wikidata":"https://www.wikidata.org/wiki/Q382497","display_name":"Affine transformation","level":2,"score":0.5235661864280701},{"id":"https://openalex.org/C171752962","wikidata":"https://www.wikidata.org/wiki/Q255166","display_name":"Kullback\u2013Leibler divergence","level":2,"score":0.5096127986907959},{"id":"https://openalex.org/C2776135515","wikidata":"https://www.wikidata.org/wiki/Q17143721","display_name":"Regularization (linguistics)","level":2,"score":0.45378395915031433},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.35060441493988037},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3330567479133606},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.09625935554504395},{"id":"https://openalex.org/C19165224","wikidata":"https://www.wikidata.org/wiki/Q23404","display_name":"Anthropology","level":1,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tai.2023.3323918","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tai.2023.3323918","pdf_url":null,"source":{"id":"https://openalex.org/S4210169448","display_name":"IEEE Transactions on Artificial Intelligence","issn_l":"2691-4581","issn":["2691-4581"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":72,"referenced_works":["https://openalex.org/W1731081199","https://openalex.org/W1922655562","https://openalex.org/W2095705004","https://openalex.org/W2096707493","https://openalex.org/W2124541940","https://openalex.org/W2180093461","https://openalex.org/W2251386628","https://openalex.org/W2502312327","https://openalex.org/W2515796212","https://openalex.org/W2548036585","https://openalex.org/W2552194003","https://openalex.org/W2593833795","https://openalex.org/W2603777577","https://openalex.org/W2786712888","https://openalex.org/W2788496822","https://openalex.org/W2888161220","https://openalex.org/W2896457183","https://openalex.org/W2927966956","https://openalex.org/W2962736243","https://openalex.org/W2962974533","https://openalex.org/W2963088995","https://openalex.org/W2963096121","https://openalex.org/W2963223306","https://openalex.org/W2963596039","https://openalex.org/W2966269666","https://openalex.org/W2971033911","https://openalex.org/W2979826702","https://openalex.org/W2998659916","https://openalex.org/W3035139434","https://openalex.org/W3096628760","https://openalex.org/W3140270772","https://openalex.org/W3140957872","https://openalex.org/W3198275944","https://openalex.org/W3198377975","https://openalex.org/W4224212073","https://openalex.org/W4225422191","https://openalex.org/W4250482878","https://openalex.org/W4294710606","https://openalex.org/W4297097688","https://openalex.org/W4297841843","https://openalex.org/W4385605073","https://openalex.org/W6637618735","https://openalex.org/W6637625617","https://openalex.org/W6638523607","https://openalex.org/W6640090968","https://openalex.org/W6640963894","https://openalex.org/W6674330103","https://openalex.org/W6681151457","https://openalex.org/W6691303741","https://openalex.org/W6695676441","https://openalex.org/W6701650085","https://openalex.org/W6724804524","https://openalex.org/W6729906282","https://openalex.org/W6743583902","https://openalex.org/W6744627333","https://openalex.org/W6745573522","https://openalex.org/W6746921017","https://openalex.org/W6748163547","https://openalex.org/W6748375146","https://openalex.org/W6749107692","https://openalex.org/W6751546485","https://openalex.org/W6752083267","https://openalex.org/W6768586863","https://openalex.org/W6779469252","https://openalex.org/W6779629370","https://openalex.org/W6780218876","https://openalex.org/W6780226713","https://openalex.org/W6785827884","https://openalex.org/W6792367290","https://openalex.org/W6807429924","https://openalex.org/W6810268879","https://openalex.org/W6810480526"],"related_works":["https://openalex.org/W4362597605","https://openalex.org/W1574414179","https://openalex.org/W4297676672","https://openalex.org/W3009056573","https://openalex.org/W2922073769","https://openalex.org/W4281702477","https://openalex.org/W2490526372","https://openalex.org/W4376166922","https://openalex.org/W4378510483","https://openalex.org/W4221142204"],"abstract_inverted_index":{"Large":[0],"pretrained":[1,48,195],"models":[2],"like":[3,52],"Bert,":[4],"GPT,":[5],"and":[6,34,80,100,152,179,208,220,255,271],"Wav2Vec":[7],"have":[8,41],"demonstrated":[9],"their":[10,43,89,94],"ability":[11],"to":[12,32,45,145,153,226],"learn":[13],"transferable":[14],"representations":[15],"for":[16,109],"various":[17,92],"downstream":[18,233,264],"tasks.":[19,235],"However,":[20],"obtaining":[21],"a":[22,29,38,66,129,161,239],"substantial":[23],"amount":[24],"of":[25,84,121,142,222,242],"supervised":[26],"data":[27,149],"remains":[28],"challenge":[30],"due":[31],"resource":[33,61,98,232],"time":[35],"limitations.":[36],"As":[37],"solution,":[39],"researchers":[40],"turned":[42],"attention":[44],"using":[46,118],"large":[47],"datasets":[49],"via":[50],"techniques":[51,64,229],"fine-tuning,":[53],"linear":[54],"probing,":[55],"or":[56,137,188,194],"prompt":[57],"tuning":[58],"in":[59,69,91,96,115,165,191,205,224,263,268],"low":[60,97,231],"settings.":[62],"Normalization":[63],"play":[65],"crucial":[67],"role":[68],"speeding":[70],"up":[71],"training,":[72],"style":[73],"transfer,":[74],"object":[75],"detection,":[76],"recurrent":[77],"neural":[78,86],"networks":[79],"improving":[81],"the":[82,113,166,192,217],"generalization":[83,155],"deep":[85],"networks.":[87],"Despite":[88],"success":[90],"domains,":[93],"effectiveness":[95],"NLP":[99,234],"speech":[101,265],"tasks":[102,237],"has":[103],"been":[104],"limited.":[105],"A":[106],"notable":[107],"reason":[108],"this":[110,125,171],"limitation":[111],"is":[112,144,150],"difficulty":[114],"capturing":[116],"expressiveness":[117],"affine":[119],"parameters":[120,207],"normalization.":[122],"To":[123],"address":[124],"issue,":[126],"we":[127,215],"propose":[128],"novel":[130],"approach":[131],"called":[132],"Kullback-Leibler":[133],"(KL)":[134],"Regularized":[135],"normalization,":[136],"KL-Norm.":[138],"The":[139],"main":[140],"objective":[141],"KL-Norm":[143,198,223,259],"ensure":[146],"that":[147],"normalized":[148],"well-behaved":[151],"improve":[154],"by":[156,159,172],"reducing":[157],"overfitting":[158],"including":[160,244],"regularization":[162],"loss":[163],"function":[164],"training":[167],"process.":[168],"It":[169],"achieves":[170],"promoting":[173],"good":[174],"performance":[175,221],"on":[176,230],"out-of-domain":[177],"distributions":[178],"effectively":[180],"filters":[181],"relevant":[182],"features":[183,187],"while":[184],"eliminating":[185],"superficial":[186],"biases":[189],"present":[190],"dataset":[193],"model.":[196],"Remarkably,":[197],"accomplishes":[199],"these":[200],"objectives":[201],"with":[202],"minimal":[203],"increase":[204],"model":[206],"memory":[209],"overheads.":[210],"Through":[211],"extensive":[212],"experimental":[213],"analysis,":[214],"showcase":[216],"improved":[218],"accuracy":[219],"comparison":[225],"other":[227],"normalization":[228],"These":[236],"encompass":[238],"wide":[240],"range":[241],"applications,":[243],"sentiment":[245],"classification,":[246],"semantic":[247,250],"relationship":[248],"characterization,":[249],"textual":[251,253],"similarity,":[252],"entailment,":[254],"paraphrase":[256],"detection.":[257],"Additionally,":[258],"exhibits":[260],"superior":[261],"results":[262],"tasks,":[266],"specifically":[267],"keyword":[269],"detection":[270],"emotion":[272],"classification.":[273]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":3}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
