{"id":"https://openalex.org/W7133336423","doi":"https://doi.org/10.48550/arxiv.2603.02004","title":"CHOP: Counterfactual Human Preference Labels Improve Obstacle Avoidance in Visuomotor Navigation Policies","display_name":"CHOP: Counterfactual Human Preference Labels Improve Obstacle Avoidance in Visuomotor Navigation Policies","publication_year":2026,"publication_date":"2026-03-02","ids":{"openalex":"https://openalex.org/W7133336423","doi":"https://doi.org/10.48550/arxiv.2603.02004"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.02004","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.02004","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.02004","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5108716741","display_name":"Gershom Seneviratne","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Seneviratne, Gershom","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060252105","display_name":"Jianyu An","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"An, Jianyu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127874523","display_name":"Vaibhav Shende","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shende, Vaibhav","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120717808","display_name":"Sahire Ellahy","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ellahy, Sahire","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128008129","display_name":"Yaxita Amin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Amin, Yaxita","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128030753","display_name":"Kondapi Manasanjani","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Manasanjani, Kondapi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127961907","display_name":"Samarth Chopra","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chopra, Samarth","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120697547","display_name":"Jonathan Deepak Kannan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kannan, Jonathan Deepak","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5127931835","display_name":"Dinesh Manocha","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Manocha, Dinesh","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5108716741"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10709","display_name":"Social Robot Interaction and HRI","score":0.20999999344348907,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10709","display_name":"Social Robot Interaction and HRI","score":0.20999999344348907,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.15690000355243683,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.09459999948740005,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/counterfactual-thinking","display_name":"Counterfactual thinking","score":0.8258000016212463},{"id":"https://openalex.org/keywords/obstacle-avoidance","display_name":"Obstacle avoidance","score":0.7706999778747559},{"id":"https://openalex.org/keywords/pairwise-comparison","display_name":"Pairwise comparison","score":0.5332000255584717},{"id":"https://openalex.org/keywords/preference","display_name":"Preference","score":0.4846999943256378},{"id":"https://openalex.org/keywords/obstacle","display_name":"Obstacle","score":0.4747999906539917},{"id":"https://openalex.org/keywords/preference-elicitation","display_name":"Preference elicitation","score":0.40799999237060547},{"id":"https://openalex.org/keywords/collision-avoidance","display_name":"Collision avoidance","score":0.39570000767707825},{"id":"https://openalex.org/keywords/safer","display_name":"SAFER","score":0.38589999079704285}],"concepts":[{"id":"https://openalex.org/C108650721","wikidata":"https://www.wikidata.org/wiki/Q1783253","display_name":"Counterfactual thinking","level":2,"score":0.8258000016212463},{"id":"https://openalex.org/C6683253","wikidata":"https://www.wikidata.org/wiki/Q7075535","display_name":"Obstacle avoidance","level":4,"score":0.7706999778747559},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6305999755859375},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5845999717712402},{"id":"https://openalex.org/C184898388","wikidata":"https://www.wikidata.org/wiki/Q1435712","display_name":"Pairwise comparison","level":2,"score":0.5332000255584717},{"id":"https://openalex.org/C2781249084","wikidata":"https://www.wikidata.org/wiki/Q908656","display_name":"Preference","level":2,"score":0.4846999943256378},{"id":"https://openalex.org/C2776650193","wikidata":"https://www.wikidata.org/wiki/Q264661","display_name":"Obstacle","level":2,"score":0.4747999906539917},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4713999927043915},{"id":"https://openalex.org/C2777868144","wikidata":"https://www.wikidata.org/wiki/Q7239817","display_name":"Preference elicitation","level":3,"score":0.40799999237060547},{"id":"https://openalex.org/C2780864053","wikidata":"https://www.wikidata.org/wiki/Q5147495","display_name":"Collision avoidance","level":3,"score":0.39570000767707825},{"id":"https://openalex.org/C2776654903","wikidata":"https://www.wikidata.org/wiki/Q2601463","display_name":"SAFER","level":2,"score":0.38589999079704285},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.3817000091075897},{"id":"https://openalex.org/C65909025","wikidata":"https://www.wikidata.org/wiki/Q1945033","display_name":"Monocular","level":2,"score":0.3790999948978424},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.37779998779296875},{"id":"https://openalex.org/C81074085","wikidata":"https://www.wikidata.org/wiki/Q366872","display_name":"Motion planning","level":3,"score":0.36410000920295715},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.34459999203681946},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.34060001373291016},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.33980000019073486},{"id":"https://openalex.org/C100609095","wikidata":"https://www.wikidata.org/wiki/Q1335050","display_name":"Embodied cognition","level":2,"score":0.32499998807907104},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.29980000853538513},{"id":"https://openalex.org/C132010649","wikidata":"https://www.wikidata.org/wiki/Q189222","display_name":"Intuition","level":2,"score":0.2806999981403351},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2766000032424927},{"id":"https://openalex.org/C127705205","wikidata":"https://www.wikidata.org/wiki/Q5748245","display_name":"Heuristics","level":2,"score":0.27320000529289246},{"id":"https://openalex.org/C3017944768","wikidata":"https://www.wikidata.org/wiki/Q1450463","display_name":"Poison control","level":2,"score":0.2727999985218048},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.2578999996185303},{"id":"https://openalex.org/C174348530","wikidata":"https://www.wikidata.org/wiki/Q188635","display_name":"Bridging (networking)","level":2,"score":0.25459998846054077}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.02004","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.02004","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.02004","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.02004","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Visuomotor":[0],"navigation":[1,17,41,70,111,129,209],"policies":[2,42,130,178,232],"have":[3,77],"shown":[4],"strong":[5],"perception-action":[6],"coupling":[7],"for":[8,55],"embodied":[9,236],"agents,":[10],"yet":[11],"they":[12],"often":[13],"struggle":[14],"with":[15,116,132],"safe":[16],"and":[18,48,99,146,194,199,233],"dynamic":[19],"obstacle":[20,49,149,188],"avoidance":[21,50],"in":[22,51,119,225],"complex":[23],"real-world":[24,168],"environments.":[25],"We":[26],"introduce":[27],"CHOP,":[28,54],"a":[29,66,171],"novel":[30],"approach":[31],"that":[32,127],"leverages":[33],"Counterfactual":[34],"Human":[35,82],"Preference":[36],"Labels":[37],"to":[38,108,160,167,212],"align":[39],"visuomotor":[40,110,128,231],"towards":[43],"human":[44,117],"intuition":[45],"of":[46,68,221],"safety":[47],"navigation.":[52,120,237],"In":[53],"each":[56],"visual":[57],"observation,":[58],"the":[59,74,123,219,227],"robot's":[60],"executed":[61],"trajectory":[62],"is":[63],"included":[64],"among":[65],"set":[67],"counterfactual":[69,222],"trajectories:":[71],"alternative":[72],"trajectories":[73,90,143],"robot":[75],"could":[76],"followed":[78],"under":[79],"identical":[80],"conditions.":[81],"annotators":[83],"provide":[84],"pairwise":[85],"preference":[86,223],"labels":[87],"over":[88],"these":[89],"based":[91],"on":[92,122,153,170,206],"anticipated":[93],"outcomes":[94],"such":[95],"as":[96],"collision":[97,193],"risk":[98],"path":[100,202],"efficiency.":[101],"These":[102,164],"aggregated":[103],"preferences":[104,118],"are":[105],"then":[106],"used":[107],"fine-tune":[109],"policies,":[112],"aligning":[113],"their":[114,161,213],"behavior":[115],"Experiments":[121],"SCAND":[124],"dataset":[125],"show":[126],"fine-tuned":[131],"CHOP":[133],"reduce":[134,192],"near-collision":[135],"events":[136,196],"by":[137,144,151,184,190,197,204],"49.7%,":[138],"decrease":[139],"deviation":[140],"from":[141],"human-preferred":[142],"45.0%,":[145],"increase":[147,186],"average":[148,154,180,207],"clearance":[150,189],"19.8%":[152],"across":[155,208],"multiple":[156],"state-of-the-art":[157],"models,":[158],"compared":[159,211],"pretrained":[162,214],"baselines.":[163,215],"improvements":[165],"transfer":[166],"deployments":[169],"Ghost":[172],"Robotics":[173],"Vision60":[174],"quadruped,":[175],"where":[176],"CHOP-aligned":[177],"improve":[179,200],"goal":[181],"success":[182],"rates":[183],"24.4%,":[185],"minimum":[187],"6.8%,":[191],"intervention":[195],"45.7%,":[198],"normalized":[201],"completion":[203],"38.6%":[205],"scenarios,":[210],"Our":[216],"results":[217],"highlight":[218],"value":[220],"supervision":[224],"bridging":[226],"gap":[228],"between":[229],"large-scale":[230],"human-aligned,":[234],"safety-aware":[235]},"counts_by_year":[],"updated_date":"2026-03-04T07:09:34.246503","created_date":"2026-03-04T00:00:00"}
