{"id":"https://openalex.org/W7128723048","doi":"https://doi.org/10.48550/arxiv.2602.10551","title":"C^2ROPE: Causal Continuous Rotary Positional Encoding for 3D Large Multimodal-Models Reasoning","display_name":"C^2ROPE: Causal Continuous Rotary Positional Encoding for 3D Large Multimodal-Models Reasoning","publication_year":2026,"publication_date":"2026-02-11","ids":{"openalex":"https://openalex.org/W7128723048","doi":"https://doi.org/10.48550/arxiv.2602.10551"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.10551","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5085274223","display_name":"Guanting Ye","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Ye, Guanting","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125769167","display_name":"Qiyan Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Qiyan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125769479","display_name":"Wenhao Yu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yu, Wenhao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125754629","display_name":"Xiaofeng Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Xiaofeng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5098821261","display_name":"Jianmin Ji","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ji, Jianmin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125708551","display_name":"Yanyong Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Yanyong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5122304301","display_name":"Ka-Veng Yuen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yuen, Ka-Veng","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5085274223"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9940999746322632,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9940999746322632,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.0006000000284984708,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.00039999998989515007,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.6261000037193298},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.6116999983787537},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.5199000239372253},{"id":"https://openalex.org/keywords/locality","display_name":"Locality","score":0.5012000203132629},{"id":"https://openalex.org/keywords/visual-reasoning","display_name":"Visual reasoning","score":0.46549999713897705},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.4226999878883362},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.41130000352859497},{"id":"https://openalex.org/keywords/causal-reasoning","display_name":"Causal reasoning","score":0.40220001339912415},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.39739999175071716},{"id":"https://openalex.org/keywords/position","display_name":"Position (finance)","score":0.3783999979496002}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.730400025844574},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.6261000037193298},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.6116999983787537},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5995000004768372},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.5199000239372253},{"id":"https://openalex.org/C2779808786","wikidata":"https://www.wikidata.org/wiki/Q6664603","display_name":"Locality","level":2,"score":0.5012000203132629},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4674000144004822},{"id":"https://openalex.org/C2777508537","wikidata":"https://www.wikidata.org/wiki/Q7936620","display_name":"Visual reasoning","level":2,"score":0.46549999713897705},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.4226999878883362},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.41130000352859497},{"id":"https://openalex.org/C115086926","wikidata":"https://www.wikidata.org/wiki/Q17004651","display_name":"Causal reasoning","level":3,"score":0.40220001339912415},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.39739999175071716},{"id":"https://openalex.org/C198082294","wikidata":"https://www.wikidata.org/wiki/Q3399648","display_name":"Position (finance)","level":2,"score":0.3783999979496002},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.3756999969482422},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.35830000042915344},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.35740000009536743},{"id":"https://openalex.org/C194226119","wikidata":"https://www.wikidata.org/wiki/Q161779","display_name":"Spatial reference system","level":2,"score":0.3537999987602234},{"id":"https://openalex.org/C2780103172","wikidata":"https://www.wikidata.org/wiki/Q1309721","display_name":"Visual Objects","level":3,"score":0.3084000051021576},{"id":"https://openalex.org/C2780910867","wikidata":"https://www.wikidata.org/wiki/Q1952416","display_name":"Multimodality","level":2,"score":0.2976999878883362},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.29440000653266907},{"id":"https://openalex.org/C178253425","wikidata":"https://www.wikidata.org/wiki/Q162668","display_name":"Visual perception","level":3,"score":0.2892000079154968},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.28529998660087585},{"id":"https://openalex.org/C16345878","wikidata":"https://www.wikidata.org/wiki/Q107472979","display_name":"Orientation (vector space)","level":2,"score":0.2791000008583069},{"id":"https://openalex.org/C11671645","wikidata":"https://www.wikidata.org/wiki/Q5054567","display_name":"Causal model","level":2,"score":0.2784000039100647},{"id":"https://openalex.org/C53051483","wikidata":"https://www.wikidata.org/wiki/Q861555","display_name":"Cube (algebra)","level":2,"score":0.27160000801086426},{"id":"https://openalex.org/C155911833","wikidata":"https://www.wikidata.org/wiki/Q3817354","display_name":"Spatial intelligence","level":2,"score":0.26579999923706055},{"id":"https://openalex.org/C178278151","wikidata":"https://www.wikidata.org/wiki/Q7936607","display_name":"Visual memory","level":3,"score":0.2624000012874603},{"id":"https://openalex.org/C105842133","wikidata":"https://www.wikidata.org/wiki/Q1899679","display_name":"Visual communication","level":2,"score":0.2619999945163727},{"id":"https://openalex.org/C159620131","wikidata":"https://www.wikidata.org/wiki/Q1938983","display_name":"Spatial analysis","level":2,"score":0.2597000002861023},{"id":"https://openalex.org/C171268870","wikidata":"https://www.wikidata.org/wiki/Q1486676","display_name":"GRASP","level":2,"score":0.25870001316070557},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.25619998574256897},{"id":"https://openalex.org/C3073032","wikidata":"https://www.wikidata.org/wiki/Q15912075","display_name":"Information hiding","level":3,"score":0.25209999084472656},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.2515999972820282}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.10551","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.10551","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.10551","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.10551","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Recent":[0],"advances":[1],"in":[2,58,80,184],"3D":[3,19,193,197],"Large":[4,10],"Multimodal":[5],"Models":[6,12],"(LMMs)":[7],"built":[8],"on":[9],"Language":[11],"(LLMs)":[13],"have":[14],"established":[15],"the":[16,26,30,48,54,65,85,94,162,178],"alignment":[17],"of":[18,50,181],"visual":[20,51,91,119,130,198],"features":[21,52],"with":[22,138],"LLM":[23],"representations":[24],"as":[25,93],"dominant":[27],"paradigm.":[28],"However,":[29],"inherited":[31],"Rotary":[32],"Position":[33],"Embedding":[34],"(RoPE)":[35],"introduces":[36,122],"limitations":[37],"for":[38,118,129],"multimodal":[39],"processing.":[40,120],"Specifically,":[41],"applying":[42],"1D":[43,135],"temporal":[44,136],"positional":[45,126,147,159],"indices":[46],"disrupts":[47],"continuity":[49],"along":[53],"column":[55],"dimension,":[56],"resulting":[57],"spatial":[59,112,115,140],"locality":[60],"loss.":[61],"Moreover,":[62],"RoPE":[63,107],"follows":[64],"prior":[66],"that":[67,108],"temporally":[68],"closer":[69],"image":[70,182],"tokens":[71,92,183],"are":[72],"more":[73],"causally":[74],"related,":[75],"leading":[76],"to":[77,87,142,156],"long-term":[78],"decay":[79],"attention":[81],"allocation":[82,154],"and":[83,114,149,196],"causing":[84],"model":[86],"progressively":[88],"neglect":[89],"earlier":[90],"sequence":[95],"length":[96],"increases.":[97],"To":[98],"address":[99],"these":[100],"issues,":[101],"we":[102,167],"propose":[103],"C^2RoPE,":[104],"an":[105],"improved":[106],"explicitly":[109],"models":[110],"local":[111],"Continuity":[113],"Causal":[116,170],"relationships":[117],"C^2RoPE":[121],"a":[123,144,152],"spatio-temporal":[124,158],"continuous":[125],"embedding":[127],"mechanism":[128],"tokens.":[131],"It":[132],"first":[133],"integrates":[134],"positions":[137],"Cartesian-based":[139],"coordinates":[141],"construct":[143],"triplet":[145],"hybrid":[146],"index,":[148],"then":[150],"employs":[151],"frequency":[153],"strategy":[155],"encode":[157],"information":[160],"across":[161,189],"three":[163],"index":[164],"components.":[165],"Additionally,":[166],"introduce":[168],"Chebyshev":[169,179],"Masking,":[171],"which":[172],"determines":[173],"causal":[174],"dependencies":[175],"by":[176],"computing":[177],"distance":[180],"2D":[185],"space.":[186],"Evaluation":[187],"results":[188],"various":[190],"benchmarks,":[191],"including":[192],"scene":[194],"reasoning":[195],"question":[199],"answering,":[200],"demonstrate":[201],"C^2RoPE's":[202],"effectiveness.":[203],"The":[204],"code":[205],"is":[206],"be":[207],"available":[208],"at":[209],"https://github.com/ErikZ719/C2RoPE.":[210]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-13T00:00:00"}
