{"id":"https://openalex.org/W2947738045","doi":"https://doi.org/10.1109/spcom.2018.8724420","title":"Classification of story-telling and poem recitation using head gesture of the talker","display_name":"Classification of story-telling and poem recitation using head gesture of the talker","publication_year":2018,"publication_date":"2018-07-01","ids":{"openalex":"https://openalex.org/W2947738045","doi":"https://doi.org/10.1109/spcom.2018.8724420","mag":"2947738045"},"language":"en","primary_location":{"id":"doi:10.1109/spcom.2018.8724420","is_oa":false,"landing_page_url":"https://doi.org/10.1109/spcom.2018.8724420","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 International Conference on Signal Processing and Communications (SPCOM)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5003478442","display_name":"C. A. Valliappan","orcid":null},"institutions":[{"id":"https://openalex.org/I59270414","display_name":"Indian Institute of Science Bangalore","ror":"https://ror.org/04dese585","country_code":"IN","type":"education","lineage":["https://openalex.org/I59270414"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"C.A. Valliappan","raw_affiliation_strings":["Department of Electrical Engineering, Indian Institute of Science, Bangalore, India"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, Indian Institute of Science, Bangalore, India","institution_ids":["https://openalex.org/I59270414"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110452392","display_name":"Anurag Das","orcid":"https://orcid.org/0009-0007-9800-0699"},"institutions":[{"id":"https://openalex.org/I59270414","display_name":"Indian Institute of Science Bangalore","ror":"https://ror.org/04dese585","country_code":"IN","type":"education","lineage":["https://openalex.org/I59270414"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Anurag Das","raw_affiliation_strings":["Department of Electrical Engineering, Indian Institute of Science, Bangalore, India"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, Indian Institute of Science, Bangalore, India","institution_ids":["https://openalex.org/I59270414"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5046000500","display_name":"Prasanta Ghosh","orcid":"https://orcid.org/0000-0002-2925-1802"},"institutions":[{"id":"https://openalex.org/I59270414","display_name":"Indian Institute of Science Bangalore","ror":"https://ror.org/04dese585","country_code":"IN","type":"education","lineage":["https://openalex.org/I59270414"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Prasanta Kumar Ghosh","raw_affiliation_strings":["Department of Electrical Engineering, Indian Institute of Science, Bangalore, India"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, Indian Institute of Science, Bangalore, India","institution_ids":["https://openalex.org/I59270414"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5003478442"],"corresponding_institution_ids":["https://openalex.org/I59270414"],"apc_list":null,"apc_paid":null,"fwci":0.2191,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.66242591,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"15","issue":null,"first_page":"36","last_page":"40"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10403","display_name":"Phonetics and Phonology Research","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10403","display_name":"Phonetics and Phonology Research","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/gesture","display_name":"Gesture","score":0.8625158071517944},{"id":"https://openalex.org/keywords/head","display_name":"Head (geology)","score":0.6414462327957153},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5645676255226135},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5641345977783203},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.509323239326477},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4536556303501129},{"id":"https://openalex.org/keywords/poetry","display_name":"Poetry","score":0.4363757371902466},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.32383662462234497},{"id":"https://openalex.org/keywords/art","display_name":"Art","score":0.16302302479743958},{"id":"https://openalex.org/keywords/literature","display_name":"Literature","score":0.08244714140892029}],"concepts":[{"id":"https://openalex.org/C207347870","wikidata":"https://www.wikidata.org/wiki/Q371174","display_name":"Gesture","level":2,"score":0.8625158071517944},{"id":"https://openalex.org/C2780312720","wikidata":"https://www.wikidata.org/wiki/Q5689100","display_name":"Head (geology)","level":2,"score":0.6414462327957153},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5645676255226135},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5641345977783203},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.509323239326477},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4536556303501129},{"id":"https://openalex.org/C164913051","wikidata":"https://www.wikidata.org/wiki/Q482","display_name":"Poetry","level":2,"score":0.4363757371902466},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.32383662462234497},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.16302302479743958},{"id":"https://openalex.org/C124952713","wikidata":"https://www.wikidata.org/wiki/Q8242","display_name":"Literature","level":1,"score":0.08244714140892029},{"id":"https://openalex.org/C114793014","wikidata":"https://www.wikidata.org/wiki/Q52109","display_name":"Geomorphology","level":1,"score":0.0},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/spcom.2018.8724420","is_oa":false,"landing_page_url":"https://doi.org/10.1109/spcom.2018.8724420","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 International Conference on Signal Processing and Communications (SPCOM)","raw_type":"proceedings-article"},{"id":"pmh:oai::75484","is_oa":false,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4306401429","display_name":"ePrints@IISc (Indian Institute of Science)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I59270414","host_organization_name":"Indian Institute of Science Bangalore","host_organization_lineage":["https://openalex.org/I59270414"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":"","raw_type":"Conference Paper"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6399999856948853,"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W106576909","https://openalex.org/W198720948","https://openalex.org/W1524333225","https://openalex.org/W1836465849","https://openalex.org/W1988874269","https://openalex.org/W1996543588","https://openalex.org/W2030695833","https://openalex.org/W2054721804","https://openalex.org/W2084133839","https://openalex.org/W2095705004","https://openalex.org/W2104259291","https://openalex.org/W2118004237","https://openalex.org/W2124399597","https://openalex.org/W2144961093","https://openalex.org/W2151369449","https://openalex.org/W2157777396","https://openalex.org/W2167636130","https://openalex.org/W2288315699","https://openalex.org/W2747228564","https://openalex.org/W4253024038","https://openalex.org/W6608075110","https://openalex.org/W6631362777","https://openalex.org/W6638667902","https://openalex.org/W6674330103"],"related_works":["https://openalex.org/W4387497383","https://openalex.org/W3183948672","https://openalex.org/W3173606202","https://openalex.org/W3110381201","https://openalex.org/W2948807893","https://openalex.org/W2935909890","https://openalex.org/W2778153218","https://openalex.org/W2758277628","https://openalex.org/W2748952813","https://openalex.org/W1531601525"],"abstract_inverted_index":{"In":[0],"this":[1],"work,":[2],"we":[3,47],"investigate":[4],"the":[5,72,136,163,182,198,253,259,263],"nature":[6],"of":[7,41,53,95,106,119,129,173,179,191],"head":[8,25,82,130,165,205,237,254],"gestures":[9,26,131,166,206,238,255],"in":[10,15,19,39,168,185],"spontaneous":[11,42],"speech":[12],"during":[13,27,142,148],"story-telling":[14,60,155],"comparison":[16],"to":[17,37,146,258],"that":[18,24,135,147,162,197,252],"poem":[20,28,62,126,143,157],"recitation.":[21,127],"We":[22,56],"hypothesize":[23],"recitation":[29,63,144,158],"would":[30],"be":[31],"more":[32,208],"repetitive":[33],"and":[34,88,102,125,156,175,189,193,216,239,248],"structured":[35],"compared":[36,145],"those":[38,221],"case":[40],"speech.":[43],"To":[44],"quantify":[45],"this,":[46],"proposed":[48],"a":[49,59,93,103,243],"measure":[50],"called":[51],"degree":[52],"repetition":[54],"(DoR).":[55],"also":[57],"perform":[58],"vs":[61],"classification":[64,152,171,264],"experiment":[65,153],"using":[66,92,132,159,226],"deep":[67],"neural":[68],"network":[69],"(DNN).":[70],"For":[71],"classification,":[73],"both":[74],"DoR":[75,133,183,211],"as":[76,78,230],"well":[77],"context":[79],"dependent":[80],"raw":[81,164,204,236],"gesture":[83],"data":[84,118],"are":[85,90,207,218,256],"used.":[86],"Analysis":[87,128],"experiments":[89],"performed":[91],"database":[94],"24":[96],"subjects":[97,108],"each":[98,109],"telling":[99,124],"five":[100],"stories":[101],"different":[104],"set":[105],"10":[107],"reciting":[110],"20":[111],"poems,":[112],"three":[113],"times":[114],"each,":[115],"thus":[116],"having":[117],"comparable":[120],"durations":[121],"for":[122,262],"story":[123],"reveals":[134],"DoR,":[137],"on":[138],"average,":[139],"is":[140],"higher":[141,244],"story-telling.":[149],"A":[150],"four-fold":[151],"between":[154],"DNN":[160,202],"demonstrates":[161],"result":[167],"an":[169,176,186],"average":[170,177,187,245],"accuracy":[172,188,215,246],"85.79%":[174],"F-score":[178,190,217,249],"89.05%":[180],"while":[181],"results":[184],"80.59%":[192],"82.30%":[194],"respectively":[195],"indicating":[196,251],"features":[199,261],"learnt":[200],"by":[201],"from":[203],"discriminative":[209],"than":[210,220],"features.":[212],"While":[213],"these":[214],"less":[219],"(94.67%":[222],"&":[223],"95.60%)":[224],"obtained":[225],"acoustic":[227,260],"feature":[228],"such":[229],"Mel":[231],"frequency":[232],"cepstral":[233],"coefficients":[234],"(MFCCs),":[235],"MFCCs":[240],"together":[241],"yield":[242],"(98.62%)":[247],"(98.92%),":[250],"complementary":[257],"task.":[265]},"counts_by_year":[{"year":2020,"cited_by_count":1}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
