{"id":"https://openalex.org/W4380926695","doi":"https://doi.org/10.1145/3581791.3597375","title":"Poster: VoCopilot: Enabling Voice-Activated Tracking for Everyday Interactions","display_name":"Poster: VoCopilot: Enabling Voice-Activated Tracking for Everyday Interactions","publication_year":2023,"publication_date":"2023-06-16","ids":{"openalex":"https://openalex.org/W4380926695","doi":"https://doi.org/10.1145/3581791.3597375"},"language":"en","primary_location":{"id":"doi:10.1145/3581791.3597375","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3581791.3597375","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 21st Annual International Conference on Mobile Systems, Applications and Services","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5092187110","display_name":"Goh Sheen An","orcid":"https://orcid.org/0009-0002-1378-0192"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":true,"raw_author_name":"Goh Sheen An","raw_affiliation_strings":["National University of Singapore, Singapore, Singapore"],"raw_orcid":"https://orcid.org/0009-0002-1378-0192","affiliations":[{"raw_affiliation_string":"National University of Singapore, Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5017722360","display_name":"Ambuj Varshney","orcid":"https://orcid.org/0000-0002-9282-4108"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Ambuj Varshney","raw_affiliation_strings":["National University of Singapore, Singapore, Singapore"],"raw_orcid":"https://orcid.org/0000-0002-9282-4108","affiliations":[{"raw_affiliation_string":"National University of Singapore, Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5092187110"],"corresponding_institution_ids":["https://openalex.org/I165932596"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.05800062,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"579","last_page":"580"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9689000248908997,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9689000248908997,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.95660001039505,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/automatic-summarization","display_name":"Automatic summarization","score":0.8490244150161743},{"id":"https://openalex.org/keywords/firmware","display_name":"Firmware","score":0.8258329629898071},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7840923070907593},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.5492319464683533},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.5430389046669006},{"id":"https://openalex.org/keywords/voice-command-device","display_name":"Voice command device","score":0.5022153854370117},{"id":"https://openalex.org/keywords/tracking","display_name":"Tracking (education)","score":0.47658297419548035},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.3569335639476776},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.26711124181747437},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.24808666110038757},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.14471864700317383},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.11196652054786682}],"concepts":[{"id":"https://openalex.org/C170858558","wikidata":"https://www.wikidata.org/wiki/Q1394144","display_name":"Automatic summarization","level":2,"score":0.8490244150161743},{"id":"https://openalex.org/C67212190","wikidata":"https://www.wikidata.org/wiki/Q104851","display_name":"Firmware","level":2,"score":0.8258329629898071},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7840923070907593},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.5492319464683533},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.5430389046669006},{"id":"https://openalex.org/C178718744","wikidata":"https://www.wikidata.org/wiki/Q2350070","display_name":"Voice command device","level":2,"score":0.5022153854370117},{"id":"https://openalex.org/C2775936607","wikidata":"https://www.wikidata.org/wiki/Q466845","display_name":"Tracking (education)","level":2,"score":0.47658297419548035},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.3569335639476776},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.26711124181747437},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.24808666110038757},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.14471864700317383},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.11196652054786682},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C19417346","wikidata":"https://www.wikidata.org/wiki/Q7922","display_name":"Pedagogy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3581791.3597375","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3581791.3597375","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 21st Annual International Conference on Mobile Systems, Applications and Services","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4300000071525574,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2366403280","https://openalex.org/W1495108544","https://openalex.org/W4389238932","https://openalex.org/W2582981600","https://openalex.org/W2091301346","https://openalex.org/W3148229873","https://openalex.org/W2150160875","https://openalex.org/W4242223894","https://openalex.org/W4387467152","https://openalex.org/W3010413952"],"abstract_inverted_index":{"Voice":[0],"plays":[1],"a":[2,18,40,74,101],"crucial":[3],"role":[4],"in":[5],"our":[6,15,31,36,124],"daily":[7,77],"lives,":[8],"enabling":[9],"communication,":[10],"conveying":[11],"emotions,":[12],"and":[13,60,79,97,120,131],"indicating":[14],"health.":[16],"As":[17],"result,":[19],"tracking":[20],"vocal":[21,49],"interactions":[22],"can":[23,56,71],"provide":[24,151],"valuable":[25],"insights":[26],"into":[27],"various":[28,48],"aspects":[29],"of":[30,104,135],"lives.":[32],"This":[33,112],"poster":[34],"presents":[35],"preliminary":[37],"work":[38],"for":[39,138],"novel":[41],"voice":[42,117],"tracker":[43,55,106],"(VoCopilot)":[44],"that":[45],"effectively":[46],"tracks":[47],"interactions.":[50],"For":[51],"example,":[52],"the":[53],"VoCopilot":[54,105,128,144],"help":[57],"document":[58],"meetings":[59],"generate":[61],"notes,":[62],"even":[63],"when":[64],"participants":[65],"speak":[66],"different":[67],"languages.":[68],"Additionally,":[69],"it":[70],"serve":[72],"as":[73],"life-logger,":[75],"monitoring":[76],"conversations":[78],"extracting":[80],"key":[81],"points":[82],"to":[83,88,154],"summarize":[84],"their":[85],"content.":[86],"Central":[87],"VoCopilot's":[89],"design":[90,130],"is":[91],"an":[92],"energy-efficient,":[93],"co-developed":[94],"acoustic":[95],"hardware":[96,129],"firmware":[98],"combined":[99],"with":[100,107],"comprehensive":[102],"integration":[103,114],"advanced":[108],"machine":[109],"learning":[110],"systems.":[111],"harmonious":[113],"ensures":[115],"precise":[116],"transcription,":[118],"summarization,":[119],"analysis.":[121],"We":[122,142],"present":[123],"early":[125,133,152],"thoughts":[126,153],"on":[127],"share":[132],"results":[134],"utilizing":[136],"Whisper":[137],"efficient":[139],"multilingual":[140],"transcribing.":[141],"acknowledge":[143],"may":[145],"raise":[146],"privacy":[147],"issues;":[148],"therefore,":[149],"we":[150],"address":[155],"these":[156],"concerns.":[157]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
