{"id":"https://openalex.org/W7138430712","doi":"https://doi.org/10.48550/arxiv.2603.15558","title":"Panoramic Affordance Prediction","display_name":"Panoramic Affordance Prediction","publication_year":2026,"publication_date":"2026-03-16","ids":{"openalex":"https://openalex.org/W7138430712","doi":"https://doi.org/10.48550/arxiv.2603.15558"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.15558","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.15558","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.15558","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5129681178","display_name":"Zixin Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zhang, Zixin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129001527","display_name":"Chenfei Liao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liao, Chenfei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128991438","display_name":"Hongfei Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Hongfei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129726175","display_name":"Harold Haodong Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Harold Haodong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129666072","display_name":"Kanghao Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Kanghao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129670970","display_name":"Zichen Wen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wen, Zichen","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129674786","display_name":"Litao Guo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guo, Litao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129742408","display_name":"Bin Ren","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ren, Bin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129744712","display_name":"Xu Zheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zheng, Xu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129738684","display_name":"Yinchuan Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Yinchuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129663223","display_name":"Xuming Hu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hu, Xuming","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129650669","display_name":"Nicu Sebe","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sebe, Nicu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5129654488","display_name":"Ying-cong Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Ying-Cong","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":13,"corresponding_author_ids":["https://openalex.org/A5129681178"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.3068000078201294,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.3068000078201294,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.13510000705718994,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.09489999711513519,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/affordance","display_name":"Affordance","score":0.9039999842643738},{"id":"https://openalex.org/keywords/perspective","display_name":"Perspective (graphical)","score":0.5194000005722046},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.5170999765396118},{"id":"https://openalex.org/keywords/perception","display_name":"Perception","score":0.48969998955726624},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.4690999984741211},{"id":"https://openalex.org/keywords/grid","display_name":"Grid","score":0.39739999175071716},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.38100001215934753},{"id":"https://openalex.org/keywords/embodied-cognition","display_name":"Embodied cognition","score":0.37290000915527344},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.3682999908924103}],"concepts":[{"id":"https://openalex.org/C194995250","wikidata":"https://www.wikidata.org/wiki/Q531136","display_name":"Affordance","level":2,"score":0.9039999842643738},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7505999803543091},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6783000230789185},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6078000068664551},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.5194000005722046},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.5170999765396118},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.48969998955726624},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.4690999984741211},{"id":"https://openalex.org/C187691185","wikidata":"https://www.wikidata.org/wiki/Q2020720","display_name":"Grid","level":2,"score":0.39739999175071716},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.39730000495910645},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.38100001215934753},{"id":"https://openalex.org/C100609095","wikidata":"https://www.wikidata.org/wiki/Q1335050","display_name":"Embodied cognition","level":2,"score":0.37290000915527344},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.3682999908924103},{"id":"https://openalex.org/C2779916870","wikidata":"https://www.wikidata.org/wiki/Q14467155","display_name":"Gaze","level":2,"score":0.36059999465942383},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.34040001034736633},{"id":"https://openalex.org/C126780896","wikidata":"https://www.wikidata.org/wiki/Q899871","display_name":"Distortion (music)","level":4,"score":0.33660000562667847},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.3357999920845032},{"id":"https://openalex.org/C179458375","wikidata":"https://www.wikidata.org/wiki/Q1020763","display_name":"Bundle adjustment","level":3,"score":0.3228999972343445},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.3192000091075897},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.31150001287460327},{"id":"https://openalex.org/C178253425","wikidata":"https://www.wikidata.org/wiki/Q162668","display_name":"Visual perception","level":3,"score":0.3095000088214874},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.3052999973297119},{"id":"https://openalex.org/C100776233","wikidata":"https://www.wikidata.org/wiki/Q2532492","display_name":"Bridge (graph theory)","level":2,"score":0.3052000105381012},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.30070000886917114},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.28049999475479126},{"id":"https://openalex.org/C171268870","wikidata":"https://www.wikidata.org/wiki/Q1486676","display_name":"GRASP","level":2,"score":0.2669999897480011},{"id":"https://openalex.org/C2780719617","wikidata":"https://www.wikidata.org/wiki/Q1030752","display_name":"Salient","level":2,"score":0.2547999918460846}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.15558","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.15558","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.15558","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.15558","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.494440495967865,"display_name":"Life in Land","id":"https://metadata.un.org/sdg/15"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Affordance":[0,50],"prediction":[1,165],"serves":[2],"as":[3],"a":[4,73,101,148],"critical":[5,36],"bridge":[6],"between":[7],"perception":[8,205],"and":[9,31,60,94,117,146,176,198],"action":[10],"in":[11,121],"embodied":[12,208],"AI.":[13],"However,":[14],"existing":[15,163],"research":[16],"is":[17],"confined":[18],"to":[19,55,112,132,141,152,179],"pinhole":[20],"camera":[21],"models,":[22],"which":[23],"suffer":[24,172],"from":[25],"narrow":[26],"Fields":[27],"of":[28,183,203],"View":[29],"(FoV)":[30],"fragmented":[32],"observations,":[33],"often":[34],"missing":[35],"holistic":[37,61],"environmental":[38],"context.":[39],"In":[40,186],"this":[41,66],"paper,":[42],"we":[43,69,98],"present":[44],"the":[45,107,114,180,200],"first":[46,70],"exploration":[47],"into":[48],"Panoramic":[49],"Prediction,":[51],"utilizing":[52],"360-degree":[53],"imagery":[54],"capture":[56],"global":[57],"spatial":[58],"relationships":[59],"scene":[62],"understanding.":[63],"To":[64],"facilitate":[65],"novel":[67],"task,":[68],"introduce":[71],"PAP-12K,":[72],"large-scale":[74],"benchmark":[75],"dataset":[76],"containing":[77],"over":[78,88],"1,000":[79],"ultra-high-resolution":[80],"(12k,":[81],"11904":[82],"x":[83],"5952)":[84],"panoramic":[85,122,184,204],"images":[86,171],"with":[87],"12k":[89],"carefully":[90],"annotated":[91],"QA":[92],"pairs":[93],"affordance":[95,164],"masks.":[96,156],"Furthermore,":[97],"propose":[99],"PAP,":[100],"training-free,":[102],"coarse-to-fine":[103],"pipeline":[104,151],"inspired":[105],"by":[106],"human":[108],"foveal":[109],"visual":[110,127],"system":[111],"tackle":[113],"ultra-high":[115],"resolution":[116],"severe":[118,173],"distortion":[119],"inherent":[120],"images.":[123],"PAP":[124,188],"employs":[125],"recursive":[126],"routing":[128],"via":[129],"grid":[130],"prompting":[131],"progressively":[133],"locate":[134],"targets,":[135],"applies":[136],"an":[137],"adaptive":[138],"gaze":[139],"mechanism":[140],"rectify":[142],"local":[143],"geometric":[144],"distortions,":[145],"utilizes":[147],"cascaded":[149],"grounding":[150],"extract":[153],"precise":[154],"instance-level":[155],"Experimental":[157],"results":[158],"on":[159],"PAP-12K":[160],"reveal":[161],"that":[162],"methods":[166],"designed":[167],"for":[168,206],"standard":[169],"perspective":[170],"performance":[174],"degradation":[175],"fail":[177],"due":[178],"unique":[181],"challenges":[182],"vision.":[185],"contrast,":[187],"framework":[189],"effectively":[190],"overcomes":[191],"these":[192],"obstacles,":[193],"significantly":[194],"outperforming":[195],"state-of-the-art":[196],"baselines":[197],"highlighting":[199],"immense":[201],"potential":[202],"robust":[207],"intelligence.":[209]},"counts_by_year":[],"updated_date":"2026-03-18T06:31:55.123368","created_date":"2026-03-18T00:00:00"}
