{"id":"https://openalex.org/W7125422850","doi":"https://doi.org/10.48550/arxiv.2601.15083","title":"Bangla Music Genre Classification Using Bidirectional LSTMS","display_name":"Bangla Music Genre Classification Using Bidirectional LSTMS","publication_year":2026,"publication_date":"2026-01-21","ids":{"openalex":"https://openalex.org/W7125422850","doi":"https://doi.org/10.48550/arxiv.2601.15083"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2601.15083","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.15083","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2601.15083","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5123575262","display_name":"Muntakimur Rahaman","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rahaman, Muntakimur","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123616399","display_name":"Md Mahmudul Hoque","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hoque, Md Mahmudul","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5095828819","display_name":"Md Mehedi Hassain","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hassain, Md Mehedi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9871000051498413,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9871000051498413,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.0006000000284984708,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10788","display_name":"Neuroscience and Music Perception","score":0.0005000000237487257,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/bengali","display_name":"Bengali","score":0.8057000041007996},{"id":"https://openalex.org/keywords/digital-audio","display_name":"Digital audio","score":0.640999972820282},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5109999775886536},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4984999895095825},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.4763999879360199},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.46549999713897705},{"id":"https://openalex.org/keywords/mel-frequency-cepstrum","display_name":"Mel-frequency cepstrum","score":0.43959999084472656},{"id":"https://openalex.org/keywords/index","display_name":"Index (typography)","score":0.375}],"concepts":[{"id":"https://openalex.org/C19235068","wikidata":"https://www.wikidata.org/wiki/Q9610","display_name":"Bengali","level":2,"score":0.8057000041007996},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7820000052452087},{"id":"https://openalex.org/C87687168","wikidata":"https://www.wikidata.org/wiki/Q173114","display_name":"Digital audio","level":4,"score":0.640999972820282},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.608299970626831},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5109999775886536},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4984999895095825},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.4763999879360199},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4708000123500824},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4683000147342682},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.46549999713897705},{"id":"https://openalex.org/C151989614","wikidata":"https://www.wikidata.org/wiki/Q440370","display_name":"Mel-frequency cepstrum","level":3,"score":0.43959999084472656},{"id":"https://openalex.org/C2777382242","wikidata":"https://www.wikidata.org/wiki/Q6017816","display_name":"Index (typography)","level":2,"score":0.375},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.36239999532699585},{"id":"https://openalex.org/C2777946086","wikidata":"https://www.wikidata.org/wiki/Q1163335","display_name":"Music information retrieval","level":3,"score":0.34950000047683716},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.34709998965263367},{"id":"https://openalex.org/C127220857","wikidata":"https://www.wikidata.org/wiki/Q2719318","display_name":"Audio signal processing","level":4,"score":0.33880001306533813},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.3370000123977661},{"id":"https://openalex.org/C58489278","wikidata":"https://www.wikidata.org/wiki/Q1172284","display_name":"Data set","level":2,"score":0.33480000495910645},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.2896000146865845},{"id":"https://openalex.org/C64922751","wikidata":"https://www.wikidata.org/wiki/Q4650799","display_name":"Audio signal","level":3,"score":0.2759000062942505},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.27549999952316284},{"id":"https://openalex.org/C169903167","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Test set","level":2,"score":0.27300000190734863},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2685999870300293},{"id":"https://openalex.org/C160372630","wikidata":"https://www.wikidata.org/wiki/Q4819855","display_name":"Audio analyzer","level":5,"score":0.2680000066757202},{"id":"https://openalex.org/C88485024","wikidata":"https://www.wikidata.org/wiki/Q1054571","display_name":"Cepstrum","level":2,"score":0.2630000114440918}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2601.15083","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.15083","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2601.15083","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.15083","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.7429959774017334,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Bangla":[0,45,89,184],"music":[1,7,12,46,61,82,156,185],"is":[2,15,33,49,112],"enrich":[3],"in":[4,23,27,128],"its":[5],"own":[6],"cultures.":[8],"Now":[9],"a":[10,57,80,99,106,125,145,167],"days":[11],"genre":[13,48,66,157],"classification":[14,67,158,168],"very":[16],"significant":[17],"because":[18],"of":[19,88,94,150,170,183],"the":[20,92,116,120,173,181],"exponential":[21],"increase":[22],"available":[24],"music,":[25],"both":[26],"digital":[28],"and":[29,59,118,147,179],"physical":[30],"formats.":[31],"It":[32],"necessary":[34],"to":[35,39,114,139,177],"index":[36],"them":[37],"accordingly":[38],"facilitate":[40],"improved":[41],"retrieval.":[42],"Automatically":[43],"classifying":[44],"by":[47,159],"essential":[50],"for":[51,65],"efficiently":[52],"locating":[53],"specific":[54],"pieces":[55],"within":[56],"vast":[58],"diverse":[60],"library.":[62],"Prevailing":[63],"methods":[64],"predominantly":[68],"employ":[69],"conventional":[70],"machine":[71],"learning":[72,75],"or":[73],"deep":[74],"approaches.":[76],"This":[77,132],"work":[78],"introduces":[79],"novel":[81],"dataset":[83],"comprising":[84],"ten":[85],"distinct":[86],"genres":[87],"music.":[90],"For":[91],"task":[93],"audio":[95,129,142],"classification,":[96],"we":[97],"utilize":[98],"recurrent":[100],"neural":[101],"network":[102,111],"(RNN)":[103],"architecture.":[104],"Specifically,":[105],"Long":[107],"Short-Term":[108],"Memory":[109],"(LSTM)":[110],"implemented":[113],"train":[115],"model":[117],"perform":[119],"classification.":[121],"Feature":[122],"extraction":[123],"represents":[124],"foundational":[126],"stage":[127],"data":[130],"processing.":[131],"study":[133],"utilizes":[134],"Mel-Frequency":[135],"Cepstral":[136],"Coefficients":[137],"(MFCCs)":[138],"transform":[140],"raw":[141],"waveforms":[143],"into":[144],"compact":[146],"representative":[148],"set":[149],"features.":[151,163],"The":[152],"proposed":[153],"framework":[154],"facilitates":[155],"leveraging":[160],"these":[161],"extracted":[162],"Experimental":[164],"results":[165],"demonstrate":[166],"accuracy":[169],"78%,":[171],"indicating":[172],"system's":[174],"strong":[175],"potential":[176],"enhance":[178],"streamline":[180],"organization":[182],"genres.":[186]},"counts_by_year":[],"updated_date":"2026-07-01T06:00:48.157686","created_date":"2026-01-23T00:00:00"}
