{"id":"https://openalex.org/W4388624058","doi":"https://doi.org/10.1109/ro-man57019.2023.10309435","title":"I\u00b3: Interactive Iterative Improvement for Few-Shot Action Segmentation","display_name":"I\u00b3: Interactive Iterative Improvement for Few-Shot Action Segmentation","publication_year":2023,"publication_date":"2023-08-28","ids":{"openalex":"https://openalex.org/W4388624058","doi":"https://doi.org/10.1109/ro-man57019.2023.10309435"},"language":"en","primary_location":{"id":"doi:10.1109/ro-man57019.2023.10309435","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/ro-man57019.2023.10309435","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 32nd IEEE International Conference on Robot and Human Interactive Communication (RO-MAN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5093251756","display_name":"Martina Gassen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Martina Gassen","raw_affiliation_strings":["Interactive AI &#x0026; Cognitive Models for Human-AI Interaction (IKIDA),TU Darmstadt,Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Interactive AI &#x0026; Cognitive Models for Human-AI Interaction (IKIDA),TU Darmstadt,Germany","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5093251757","display_name":"Frederic Metzler","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Frederic Metzler","raw_affiliation_strings":["Interactive AI &#x0026; Cognitive Models for Human-AI Interaction (IKIDA),TU Darmstadt,Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Interactive AI &#x0026; Cognitive Models for Human-AI Interaction (IKIDA),TU Darmstadt,Germany","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5093251758","display_name":"Erik Prescher","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Erik Prescher","raw_affiliation_strings":["Interactive AI &#x0026; Cognitive Models for Human-AI Interaction (IKIDA),TU Darmstadt,Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Interactive AI &#x0026; Cognitive Models for Human-AI Interaction (IKIDA),TU Darmstadt,Germany","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082442455","display_name":"Lisa Scherf","orcid":"https://orcid.org/0009-0004-0950-5184"},"institutions":[{"id":"https://openalex.org/I31512782","display_name":"Technische Universit\u00e4t Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Lisa Scherf","raw_affiliation_strings":["Interactive AI &#x0026; Cognitive Models for Human-AI Interaction (IKIDA),TU Darmstadt,Germany","Centre for Cognitive Science, TU Darmstadt, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Interactive AI &#x0026; Cognitive Models for Human-AI Interaction (IKIDA),TU Darmstadt,Germany","institution_ids":[]},{"raw_affiliation_string":"Centre for Cognitive Science, TU Darmstadt, Germany","institution_ids":["https://openalex.org/I31512782"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024771523","display_name":"Vignesh Prasad","orcid":"https://orcid.org/0000-0002-9729-2454"},"institutions":[{"id":"https://openalex.org/I31512782","display_name":"Technische Universit\u00e4t Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Vignesh Prasad","raw_affiliation_strings":["Institute for Intelligent Autonomous Systems,Department of Computer Science,TU Darmstadt,Germany","Department of Computer Science, Institute for Intelligent Autonomous Systems, TU Darmstadt, Germany","Department of Law and Economics, Chair for Marketing and Human Resource Management, TU Darmstadt, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute for Intelligent Autonomous Systems,Department of Computer Science,TU Darmstadt,Germany","institution_ids":["https://openalex.org/I31512782"]},{"raw_affiliation_string":"Department of Computer Science, Institute for Intelligent Autonomous Systems, TU Darmstadt, Germany","institution_ids":["https://openalex.org/I31512782"]},{"raw_affiliation_string":"Department of Law and Economics, Chair for Marketing and Human Resource Management, TU Darmstadt, Germany","institution_ids":["https://openalex.org/I31512782"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114099285","display_name":"Felix Kaiser","orcid":null},"institutions":[{"id":"https://openalex.org/I31512782","display_name":"Technische Universit\u00e4t Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Felix Kaiser","raw_affiliation_strings":["Institute for Intelligent Autonomous Systems,Department of Computer Science,TU Darmstadt,Germany","Department of Computer Science, Institute for Intelligent Autonomous Systems, TU Darmstadt, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute for Intelligent Autonomous Systems,Department of Computer Science,TU Darmstadt,Germany","institution_ids":["https://openalex.org/I31512782"]},{"raw_affiliation_string":"Department of Computer Science, Institute for Intelligent Autonomous Systems, TU Darmstadt, Germany","institution_ids":["https://openalex.org/I31512782"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5063353075","display_name":"Dorothea Koert","orcid":"https://orcid.org/0000-0002-3571-6848"},"institutions":[{"id":"https://openalex.org/I31512782","display_name":"Technische Universit\u00e4t Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Dorothea Koert","raw_affiliation_strings":["Interactive AI &#x0026; Cognitive Models for Human-AI Interaction (IKIDA),TU Darmstadt,Germany","Centre for Cognitive Science, TU Darmstadt, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Interactive AI &#x0026; Cognitive Models for Human-AI Interaction (IKIDA),TU Darmstadt,Germany","institution_ids":[]},{"raw_affiliation_string":"Centre for Cognitive Science, TU Darmstadt, Germany","institution_ids":["https://openalex.org/I31512782"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.2246,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.52809809,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"378","last_page":"385"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8441104888916016},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.7722667455673218},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6607974767684937},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5926341414451599},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5300720930099487},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.4975791275501251},{"id":"https://openalex.org/keywords/labeled-data","display_name":"Labeled data","score":0.471383661031723},{"id":"https://openalex.org/keywords/hidden-markov-model","display_name":"Hidden Markov model","score":0.4269990921020508},{"id":"https://openalex.org/keywords/shot","display_name":"Shot (pellet)","score":0.41599711775779724},{"id":"https://openalex.org/keywords/modular-design","display_name":"Modular design","score":0.4145314693450928},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.32468798756599426}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8441104888916016},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.7722667455673218},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6607974767684937},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5926341414451599},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5300720930099487},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.4975791275501251},{"id":"https://openalex.org/C2776145971","wikidata":"https://www.wikidata.org/wiki/Q30673951","display_name":"Labeled data","level":2,"score":0.471383661031723},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.4269990921020508},{"id":"https://openalex.org/C2778344882","wikidata":"https://www.wikidata.org/wiki/Q278938","display_name":"Shot (pellet)","level":2,"score":0.41599711775779724},{"id":"https://openalex.org/C101468663","wikidata":"https://www.wikidata.org/wiki/Q1620158","display_name":"Modular design","level":2,"score":0.4145314693450928},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.32468798756599426},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ro-man57019.2023.10309435","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/ro-man57019.2023.10309435","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 32nd IEEE International Conference on Robot and Human Interactive Communication (RO-MAN)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321408","display_name":"Ministry of Education","ror":"https://ror.org/01p262204"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":48,"referenced_works":["https://openalex.org/W132147841","https://openalex.org/W2031688197","https://openalex.org/W2064675550","https://openalex.org/W2076618452","https://openalex.org/W2099614498","https://openalex.org/W2100993276","https://openalex.org/W2115733720","https://openalex.org/W2144656844","https://openalex.org/W2159799403","https://openalex.org/W2169551590","https://openalex.org/W2403890723","https://openalex.org/W2605907393","https://openalex.org/W2721233823","https://openalex.org/W2747141180","https://openalex.org/W2794079986","https://openalex.org/W2808912095","https://openalex.org/W2900410888","https://openalex.org/W2906270977","https://openalex.org/W2962916463","https://openalex.org/W2963150697","https://openalex.org/W2963524571","https://openalex.org/W2964199361","https://openalex.org/W2982335217","https://openalex.org/W2999889331","https://openalex.org/W3009622574","https://openalex.org/W3034942609","https://openalex.org/W3036954260","https://openalex.org/W3052825600","https://openalex.org/W3131362130","https://openalex.org/W3165641326","https://openalex.org/W3165867039","https://openalex.org/W3174700686","https://openalex.org/W3192495122","https://openalex.org/W4200578307","https://openalex.org/W4220783478","https://openalex.org/W4229052852","https://openalex.org/W4291653271","https://openalex.org/W4303647730","https://openalex.org/W4312982010","https://openalex.org/W4313118773","https://openalex.org/W6681389334","https://openalex.org/W6752846148","https://openalex.org/W6763446388","https://openalex.org/W6779442434","https://openalex.org/W6795951589","https://openalex.org/W6843180136","https://openalex.org/W6845924719","https://openalex.org/W6847353123"],"related_works":["https://openalex.org/W2074502265","https://openalex.org/W4214877189","https://openalex.org/W2773965352","https://openalex.org/W2381179799","https://openalex.org/W2980279061","https://openalex.org/W2334685461","https://openalex.org/W2364370872","https://openalex.org/W2053269318","https://openalex.org/W2366718574","https://openalex.org/W2025614924"],"abstract_inverted_index":{"Extracting":[0],"modular":[1],"segments":[2,38],"from":[3],"raw":[4],"video":[5],"demonstrations":[6],"of":[7,96,129,134,181,195,202,217],"high-level":[8],"actions":[9,46],"is":[10,151,166],"important":[11],"to":[12,69,79,146,211,228,234],"understand":[13],"the":[14,36,94,200,239],"underlying":[15,37],"building":[16],"blocks":[17],"for":[18,29,86,108,117,139,178,225],"different":[19,182],"tasks":[20,89,97],"in":[21,67,154,168,173],"human-robot":[22],"interaction.":[23],"While":[24],"(data-hungry)":[25],"supervised":[26],"learning":[27,204],"approaches":[28,62],"Action":[30,73,110],"Segmentation":[31],"show":[32],"good":[33,65],"performance":[34,42,66],"when":[35,44],"are":[39,47,54],"predefined,":[40],"their":[41],"degrades":[43],"unseen":[45,70],"introduced":[48],"on-the-go":[49],"as":[50,93],"new":[51,83],"data":[52,84,197],"samples":[53],"scarce.":[55],"In":[56,72,99],"this":[57,100],"regard,":[58],"Zero-and":[59],"Few-Shot":[60,109,124],"Learning":[61,119,125],"have":[63,235],"shown":[64],"generalizing":[68],"examples.":[71],"Segmentation,":[74,111],"where":[75],"each":[76],"frame":[77],"needs":[78],"be":[80,176],"labeled,":[81],"annotating":[82],"even":[85],"a":[87,112,135,144,163,169,179,192,214],"few":[88],"can":[90,175],"become":[91],"tedious":[92],"number":[95,180,216],"scale.":[98],"work,":[101],"we":[102],"propose":[103],"Interactive":[104,114],"Iterative":[105],"Improvement":[106],"$(I^{3})$":[107],"Semi-Supervised":[113],"Meta-Learning":[115],"approach":[116],"Zero-Shot":[118],"on":[120,126],"unlabeled":[121],"videos":[122],"and":[123],"small":[127],"amounts":[128],"labeled":[130,196],"videos.":[131],"$I^{3}$":[132],"consists":[133],"Prototypical":[136],"Network":[137],"model":[138,150,185],"frame-wise":[140],"prediction":[141],"coupled":[142],"with":[143],"Hidden-Semi-Markov-Model":[145],"prevent":[147],"over-segmentation.":[148],"The":[149],"iteratively":[152],"improved":[153],"an":[155],"interactive":[156],"manner":[157,171],"through":[158],"users\u2019":[159],"annotations":[160,231],"provided":[161],"via":[162],"webinterface.":[164],"This":[165],"done":[167],"task-agnostic":[170],"that,":[172],"theory,":[174],"reused":[177],"actions.":[183],"Our":[184],"provides":[186],"sequentially":[187],"accurate":[188],"segmentations":[189],"using":[190],"only":[191],"limited":[193],"amount":[194],"which":[198],"shows":[199],"efficacy":[201],"our":[203],"approach.":[205],"A":[206],"lower":[207,215],"edit":[208],"distance":[209],"compared":[210],"baselines":[212],"indicates":[213],"required":[218],"user":[219],"edits":[220],"making":[221],"it":[222],"well":[223],"suited":[224],"non-expert":[226],"users":[227],"smoothly":[229],"provide":[230],"enabling":[232],"them":[233],"more":[236],"control":[237],"over":[238],"learned":[240],"model.":[241]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
