{"id":"https://openalex.org/W4281822368","doi":"https://doi.org/10.1007/s40747-022-00651-7","title":"Developing sequentially trained robust Punjabi speech recognition system under matched and mismatched conditions","display_name":"Developing sequentially trained robust Punjabi speech recognition system under matched and mismatched conditions","publication_year":2022,"publication_date":"2022-06-02","ids":{"openalex":"https://openalex.org/W4281822368","doi":"https://doi.org/10.1007/s40747-022-00651-7","pmid":"https://pubmed.ncbi.nlm.nih.gov/35668730"},"language":"en","primary_location":{"id":"doi:10.1007/s40747-022-00651-7","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s40747-022-00651-7","pdf_url":"https://link.springer.com/content/pdf/10.1007/s40747-022-00651-7.pdf","source":{"id":"https://openalex.org/S3035462843","display_name":"Complex & Intelligent Systems","issn_l":"2198-6053","issn":["2198-6053","2199-4536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Complex &amp; Intelligent Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://link.springer.com/content/pdf/10.1007/s40747-022-00651-7.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5076299882","display_name":"Puneet Bawa","orcid":"https://orcid.org/0000-0001-5508-537X"},"institutions":[{"id":"https://openalex.org/I74319210","display_name":"Chitkara University","ror":"https://ror.org/057d6z539","country_code":"IN","type":"education","lineage":["https://openalex.org/I74319210"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Puneet Bawa","raw_affiliation_strings":["Centre of Excellence for Speech and Multimodal Laboratory, Chitkara University Institute of Engineering and Technology, Chitkara University, Punjab, India"],"affiliations":[{"raw_affiliation_string":"Centre of Excellence for Speech and Multimodal Laboratory, Chitkara University Institute of Engineering and Technology, Chitkara University, Punjab, India","institution_ids":["https://openalex.org/I74319210"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072742671","display_name":"Virender Kadyan","orcid":"https://orcid.org/0000-0001-8708-9738"},"institutions":[{"id":"https://openalex.org/I5847235","display_name":"University of Petroleum and Energy Studies","ror":"https://ror.org/04q2jes40","country_code":"IN","type":"education","lineage":["https://openalex.org/I5847235"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Virender Kadyan","raw_affiliation_strings":["Speech and Language Research Centre, School of Computer Science, University of Petroleum and Energy Studies (UPES), Energy Acres, Bidholi, Dehradun, Uttarakhand 248007 India","Speech and Language Research Centre, School of Computer Science, University of Petroleum and Energy Studies (UPES), Energy Acres, Bidholi, Dehradun, Uttarakhand, 248007, India"],"affiliations":[{"raw_affiliation_string":"Speech and Language Research Centre, School of Computer Science, University of Petroleum and Energy Studies (UPES), Energy Acres, Bidholi, Dehradun, Uttarakhand 248007 India","institution_ids":[]},{"raw_affiliation_string":"Speech and Language Research Centre, School of Computer Science, University of Petroleum and Energy Studies (UPES), Energy Acres, Bidholi, Dehradun, Uttarakhand, 248007, India","institution_ids":["https://openalex.org/I5847235"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035481870","display_name":"Abinash Tripathy","orcid":"https://orcid.org/0000-0001-9919-3399"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Abinash Tripathy","raw_affiliation_strings":["Department of Computer Science and Engineering, Raghu Engineering College, Visakhapatnam, India"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Raghu Engineering College, Visakhapatnam, India","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5022805973","display_name":"Thipendra P. Singh","orcid":"https://orcid.org/0000-0002-9991-6494"},"institutions":[{"id":"https://openalex.org/I5847235","display_name":"University of Petroleum and Energy Studies","ror":"https://ror.org/04q2jes40","country_code":"IN","type":"education","lineage":["https://openalex.org/I5847235"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Thipendra P. Singh","raw_affiliation_strings":["Speech and Language Research Centre, School of Computer Science, University of Petroleum and Energy Studies (UPES), Energy Acres, Bidholi, Dehradun, Uttarakhand 248007 India","Speech and Language Research Centre, School of Computer Science, University of Petroleum and Energy Studies (UPES), Energy Acres, Bidholi, Dehradun, Uttarakhand, 248007, India"],"affiliations":[{"raw_affiliation_string":"Speech and Language Research Centre, School of Computer Science, University of Petroleum and Energy Studies (UPES), Energy Acres, Bidholi, Dehradun, Uttarakhand 248007 India","institution_ids":[]},{"raw_affiliation_string":"Speech and Language Research Centre, School of Computer Science, University of Petroleum and Energy Studies (UPES), Energy Acres, Bidholi, Dehradun, Uttarakhand, 248007, India","institution_ids":["https://openalex.org/I5847235"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5076299882"],"corresponding_institution_ids":["https://openalex.org/I74319210"],"apc_list":{"value":1320,"currency":"GBP","value_usd":1619},"apc_paid":{"value":1320,"currency":"GBP","value_usd":1619},"fwci":0.9654,"has_fulltext":true,"cited_by_count":8,"citation_normalized_percentile":{"value":0.79162065,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":"9","issue":"1","first_page":"1","last_page":"23"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9916999936103821,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6597612500190735},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6555511951446533},{"id":"https://openalex.org/keywords/mel-frequency-cepstrum","display_name":"Mel-frequency cepstrum","score":0.6476626396179199},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.6265201568603516},{"id":"https://openalex.org/keywords/normalization","display_name":"Normalization (sociology)","score":0.6177115440368652},{"id":"https://openalex.org/keywords/vocal-tract","display_name":"Vocal tract","score":0.6100919246673584},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5331399440765381},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5091678500175476},{"id":"https://openalex.org/keywords/cepstrum","display_name":"Cepstrum","score":0.5072605013847351},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.4709682762622833},{"id":"https://openalex.org/keywords/feature-selection","display_name":"Feature selection","score":0.4659126102924347},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.4646465480327606},{"id":"https://openalex.org/keywords/naive-bayes-classifier","display_name":"Naive Bayes classifier","score":0.4155009090900421},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.39407071471214294},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.3723699450492859}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6597612500190735},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6555511951446533},{"id":"https://openalex.org/C151989614","wikidata":"https://www.wikidata.org/wiki/Q440370","display_name":"Mel-frequency cepstrum","level":3,"score":0.6476626396179199},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.6265201568603516},{"id":"https://openalex.org/C136886441","wikidata":"https://www.wikidata.org/wiki/Q926129","display_name":"Normalization (sociology)","level":2,"score":0.6177115440368652},{"id":"https://openalex.org/C47401133","wikidata":"https://www.wikidata.org/wiki/Q748953","display_name":"Vocal tract","level":2,"score":0.6100919246673584},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5331399440765381},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5091678500175476},{"id":"https://openalex.org/C88485024","wikidata":"https://www.wikidata.org/wiki/Q1054571","display_name":"Cepstrum","level":2,"score":0.5072605013847351},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.4709682762622833},{"id":"https://openalex.org/C148483581","wikidata":"https://www.wikidata.org/wiki/Q446488","display_name":"Feature selection","level":2,"score":0.4659126102924347},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.4646465480327606},{"id":"https://openalex.org/C52001869","wikidata":"https://www.wikidata.org/wiki/Q812530","display_name":"Naive Bayes classifier","level":3,"score":0.4155009090900421},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.39407071471214294},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.3723699450492859},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C19165224","wikidata":"https://www.wikidata.org/wiki/Q23404","display_name":"Anthropology","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1007/s40747-022-00651-7","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s40747-022-00651-7","pdf_url":"https://link.springer.com/content/pdf/10.1007/s40747-022-00651-7.pdf","source":{"id":"https://openalex.org/S3035462843","display_name":"Complex & Intelligent Systems","issn_l":"2198-6053","issn":["2198-6053","2199-4536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Complex &amp; Intelligent Systems","raw_type":"journal-article"},{"id":"pmid:35668730","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/35668730","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Complex & intelligent systems","raw_type":null},{"id":"pmh:oai:doaj.org/article:ce1049a3df584cf795ab915579227965","is_oa":true,"landing_page_url":"https://doaj.org/article/ce1049a3df584cf795ab915579227965","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Complex & Intelligent Systems, Vol 9, Iss 1, Pp 1-23 (2022)","raw_type":"article"},{"id":"pmh:oai:pubmedcentral.nih.gov:9160864","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/9160864","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Complex Intell Systems","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.1007/s40747-022-00651-7","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s40747-022-00651-7","pdf_url":"https://link.springer.com/content/pdf/10.1007/s40747-022-00651-7.pdf","source":{"id":"https://openalex.org/S3035462843","display_name":"Complex & Intelligent Systems","issn_l":"2198-6053","issn":["2198-6053","2199-4536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Complex &amp; Intelligent Systems","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10","score":0.4399999976158142}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4281822368.pdf","grobid_xml":"https://content.openalex.org/works/W4281822368.grobid-xml"},"referenced_works_count":40,"referenced_works":["https://openalex.org/W1543643713","https://openalex.org/W1877570817","https://openalex.org/W1974387177","https://openalex.org/W2007645738","https://openalex.org/W2066972841","https://openalex.org/W2080921589","https://openalex.org/W2102804087","https://openalex.org/W2124558353","https://openalex.org/W2125234026","https://openalex.org/W2127469744","https://openalex.org/W2135984923","https://openalex.org/W2157749010","https://openalex.org/W2170083398","https://openalex.org/W2326699523","https://openalex.org/W2398998316","https://openalex.org/W2404856031","https://openalex.org/W2511419867","https://openalex.org/W2748130992","https://openalex.org/W2783089003","https://openalex.org/W2800057634","https://openalex.org/W2801093643","https://openalex.org/W2905083703","https://openalex.org/W2918896719","https://openalex.org/W2967236561","https://openalex.org/W2972686346","https://openalex.org/W2987535013","https://openalex.org/W3007928779","https://openalex.org/W3016941674","https://openalex.org/W3047742545","https://openalex.org/W3082603178","https://openalex.org/W3115268634","https://openalex.org/W3129120362","https://openalex.org/W3137295626","https://openalex.org/W3149335959","https://openalex.org/W3154887765","https://openalex.org/W3159139854","https://openalex.org/W3170985288","https://openalex.org/W3199514045","https://openalex.org/W4213343795","https://openalex.org/W4239273178"],"related_works":["https://openalex.org/W1482212662","https://openalex.org/W2100012411","https://openalex.org/W3162157266","https://openalex.org/W2162084437","https://openalex.org/W1997579527","https://openalex.org/W2102353451","https://openalex.org/W3044927199","https://openalex.org/W2018086531","https://openalex.org/W1980297060","https://openalex.org/W2387604097"],"abstract_inverted_index":{"Development":[0],"of":[1,17,24,47,129,133,140,182,276],"a":[2,48,272],"native":[3],"language":[4],"robust":[5,83],"ASR":[6],"framework":[7,256],"is":[8,233],"very":[9,219],"challenging":[10],"as":[11,13,27,29],"well":[12,28],"an":[14,20,130,254],"active":[15],"area":[16],"research.":[18],"Although":[19],"urge":[21],"for":[22,34],"investigation":[23],"effective":[25,255],"front-end":[26,55,262],"back-end":[30],"approaches":[31,157],"are":[32],"required":[33],"tackling":[35],"environment":[36],"differences,":[37],"large":[38,94,216],"training":[39,95,105],"complexity":[40],"and":[41,71,82,117,138,173,194,198,200,204,211,218,238,243,279,284,292],"inter-speaker":[42],"variability":[43],"in":[44,170,281],"achieving":[45],"success":[46],"recognition":[49],"system.":[50],"In":[51,143],"this":[52],"paper,":[53],"four":[54,146],"approaches:":[56],"mel-frequency":[57],"cepstral":[58,63,73],"coefficients":[59,64,74],"(MFCC),":[60],"Gammatone":[61],"frequency":[62],"(GFCC),":[65],"relative":[66,273],"spectral-perceptual":[67],"linear":[68],"prediction":[69],"(RASTA-PLP)":[70],"power-normalized":[72],"(PNCC)":[75],"have":[76,149,225],"been":[77,101,125,150,226],"investigated":[78],"to":[79,91,235],"generate":[80],"unique":[81],"feature":[84,155],"vectors":[85],"at":[86],"different":[87,147],"SNR":[88],"values.":[89],"Furthermore,":[90],"handle":[92],"the":[93],"data":[96,231],"complexity,":[97],"parameter":[98,268],"optimization":[99,269],"has":[100,124],"performed":[102],"with":[103,177],"sequence-discriminative":[104],"techniques:":[106],"maximum":[107],"mutual":[108],"information":[109],"(MMI),":[110],"minimum":[111,119],"phone":[112],"error":[113],"(MPE),":[114],"boosted-MMI":[115],"(bMMI),":[116],"state-level":[118],"Bayes":[120],"risk":[121],"(sMBR).":[122],"It":[123],"demonstrated":[126],"by":[127,152],"selection":[128],"optimal":[131],"value":[132],"parameters":[134],"using":[135,264],"lattice":[136],"generation,":[137],"adjustments":[139],"learning":[141],"rates.":[142],"proposed":[144],"framework,":[145],"systems":[148,214],"tested":[151],"analyzing":[153],"various":[154],"extraction":[156],"(with":[158],"or":[159,178],"without":[160,179],"speaker":[161],"normalization":[162],"through":[163,267],"Vocal":[164],"Tract":[165],"Length":[166],"Normalization":[167],"(VTLN)":[168],"approach":[169,263],"test":[171],"set)":[172],"classification":[174],"strategy":[175],"on":[176,215,258],"artificial":[180],"extension":[181],"train":[183,193,197,203,210],"dataset.":[184],"To":[185],"compare":[186],"each":[187],"system":[188,288],"performance,":[189],"true":[190],"matched":[191],"(adult":[192,202],"test-S1,":[195],"child":[196,205,209,212],"test-S2)":[199],"mismatched":[201,247,283],"test-S3,":[206],"adult":[207,217,242],"+":[208,260],"test-S4)":[213],"small":[220],"Punjabi":[221],"clean":[222,291],"speech":[223,245],"corpus":[224],"demonstrated.":[227],"Consequently,":[228],"gender-based":[229,285],"in-domain":[230,286],"augmented":[232,287],"used":[234],"moderate":[236],"acoustic":[237],"phonetic":[239],"variations":[240],"throughout":[241],"children's":[244],"under":[246,289],"conditions.":[248],"The":[249],"experiment":[250],"result":[251],"shows":[252],"that":[253],"developed":[257],"PNCC":[259],"VTLN":[261],"TDNN-sMBR-based":[265],"model":[266],"technique":[270],"yields":[271],"improvement":[274],"(RI)":[275],"40.18%,":[277],"47.51%,":[278],"49.87%":[280],"matched,":[282],"typical":[290],"noisy":[293],"conditions,":[294],"respectively.":[295]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":2}],"updated_date":"2026-03-31T07:56:22.981413","created_date":"2025-10-10T00:00:00"}
