{"id":"https://openalex.org/W7133528933","doi":"https://doi.org/10.48550/arxiv.2603.02569","title":"An LLM-Assisted Toolkit for Inspectable Multimodal Emotion Data Annotation","display_name":"An LLM-Assisted Toolkit for Inspectable Multimodal Emotion Data Annotation","publication_year":2026,"publication_date":"2026-03-03","ids":{"openalex":"https://openalex.org/W7133528933","doi":"https://doi.org/10.48550/arxiv.2603.02569"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.02569","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.02569","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.02569","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5110093418","display_name":"Zheyuan Kuang","orcid":"https://orcid.org/0009-0009-0184-6159"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Kuang, Zheyuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128073257","display_name":"Weiwei Jiang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiang, Weiwei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024247430","display_name":"Nicholas A. Koemel","orcid":"https://orcid.org/0000-0002-5463-6894"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Koemel, Nicholas","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122911376","display_name":"Matthew N. Ahmadi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ahmadi, Matthew","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128046106","display_name":"Emmanuel Stamatakis","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Stamatakis, Emmanuel","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128066103","display_name":"Benjamin Tag","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tag, Benjamin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047568623","display_name":"Anusha Withana","orcid":"https://orcid.org/0000-0001-6587-1278"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Withana, Anusha","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5024805223","display_name":"Zhanna Sarsenbayeva","orcid":"https://orcid.org/0000-0002-1247-6036"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sarsenbayeva, Zhanna","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5110093418"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9793000221252441,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9793000221252441,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.002300000051036477,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.0010999999940395355,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.699400007724762},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.6546000242233276},{"id":"https://openalex.org/keywords/event","display_name":"Event (particle physics)","score":0.5910999774932861},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.5285000205039978},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.4456000030040741},{"id":"https://openalex.org/keywords/multimodality","display_name":"Multimodality","score":0.4442000091075897},{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.4309999942779541}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8334000110626221},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.699400007724762},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.6546000242233276},{"id":"https://openalex.org/C2779662365","wikidata":"https://www.wikidata.org/wiki/Q5416694","display_name":"Event (particle physics)","level":2,"score":0.5910999774932861},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.5285000205039978},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.4456000030040741},{"id":"https://openalex.org/C2780910867","wikidata":"https://www.wikidata.org/wiki/Q1952416","display_name":"Multimodality","level":2,"score":0.4442000091075897},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.43810001015663147},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.4309999942779541},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.3806000053882599},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.37860000133514404},{"id":"https://openalex.org/C2777438025","wikidata":"https://www.wikidata.org/wiki/Q1339090","display_name":"Emotion recognition","level":2,"score":0.33059999346733093},{"id":"https://openalex.org/C48677424","wikidata":"https://www.wikidata.org/wiki/Q6888088","display_name":"Mode (computer interface)","level":2,"score":0.3230000138282776},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.3167000114917755},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.2989000082015991},{"id":"https://openalex.org/C135641252","wikidata":"https://www.wikidata.org/wiki/Q738567","display_name":"Multimodal interaction","level":2,"score":0.2985000014305115},{"id":"https://openalex.org/C158379750","wikidata":"https://www.wikidata.org/wiki/Q214111","display_name":"Network packet","level":2,"score":0.2978000044822693},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.29660001397132874}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.02569","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.02569","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.02569","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.02569","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Multimodal":[0],"Emotion":[1],"Recognition":[2],"(MER)":[3],"increasingly":[4],"depends":[5],"on":[6,56,121],"fine":[7],"grained,":[8],"evidence":[9],"grounded":[10],"annotations,":[11],"yet":[12],"inspection":[13],"and":[14,25,49,61,78,82,105,115],"label":[15],"construction":[16],"are":[17,23],"hard":[18],"to":[19,91,108],"scale":[20],"when":[21],"cues":[22],"dynamic":[24],"misaligned":[26],"across":[27],"modalities.":[28],"We":[29,117],"present":[30],"an":[31,41,57,99],"LLM-assisted":[32],"toolkit":[33,47,97],"that":[34],"supports":[35],"multimodal":[36,122],"emotion":[37,124],"data":[38],"annotation":[39],"through":[40],"inspectable,":[42],"event":[43,86],"centered":[44],"workflow.":[45],"The":[46],"preprocesses":[48],"aligns":[50],"heterogeneous":[51],"recordings,":[52],"visualizes":[53],"all":[54],"modalities":[55],"interactive":[58],"shared":[59],"timeline,":[60],"renders":[62],"structured":[63,110],"signals":[64],"as":[65,85],"video":[66],"tracks":[67],"for":[68,112],"cross":[69],"modal":[70],"consistency":[71],"checks.":[72],"It":[73],"then":[74],"detects":[75],"candidate":[76],"events":[77],"packages":[79],"synchronized":[80],"keyframes":[81],"time":[83],"windows":[84],"packets":[87],"with":[88,101,126],"traceable":[89],"pointers":[90],"the":[92,96,119],"source":[93],"data.":[94],"Finally,":[95],"integrates":[98],"LLM":[100],"modality":[102],"specific":[103],"tools":[104],"prompt":[106],"templates":[107],"draft":[109],"annotations":[111],"analyst":[113],"verification":[114],"editing.":[116],"demonstrate":[118],"workflow":[120],"VR":[123],"recordings":[125],"representative":[127],"examples.":[128]},"counts_by_year":[],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2026-03-05T00:00:00"}
