{"id":"https://openalex.org/W7129327785","doi":"https://doi.org/10.48550/arxiv.2602.13588","title":"Two-Stream Interactive Joint Learning of Scene Parsing and Geometric Vision Tasks","display_name":"Two-Stream Interactive Joint Learning of Scene Parsing and Geometric Vision Tasks","publication_year":2026,"publication_date":"2026-02-14","ids":{"openalex":"https://openalex.org/W7129327785","doi":"https://doi.org/10.48550/arxiv.2602.13588"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.13588","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113389034","display_name":"Guanfeng Tang","orcid":"https://orcid.org/0009-0002-5918-4775"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Tang, Guanfeng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126249256","display_name":"Hongbo Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Hongbo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126182875","display_name":"Ziwei Long","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Long, Ziwei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100603319","display_name":"Jiayao Li","orcid":"https://orcid.org/0009-0002-9505-7343"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Jiayao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126234160","display_name":"Bohong Xiao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiao, Bohong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126263146","display_name":"Wei Ye","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ye, Wei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126228708","display_name":"Hanli Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Hanli","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5126194577","display_name":"Rui Fan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fan, Rui","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5113389034"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.2596000134944916,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.2596000134944916,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.21310000121593475,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.0908999964594841,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/parsing","display_name":"Parsing","score":0.77920001745224},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5849000215530396},{"id":"https://openalex.org/keywords/joint","display_name":"Joint (building)","score":0.5282999873161316},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.4575999975204468},{"id":"https://openalex.org/keywords/visual-space","display_name":"Visual space","score":0.392300009727478},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.39079999923706055},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.34360000491142273},{"id":"https://openalex.org/keywords/data-stream-mining","display_name":"Data stream mining","score":0.31540000438690186},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.3111000061035156}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8338000178337097},{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.77920001745224},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6826000213623047},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5849000215530396},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5807999968528748},{"id":"https://openalex.org/C18555067","wikidata":"https://www.wikidata.org/wiki/Q8375051","display_name":"Joint (building)","level":2,"score":0.5282999873161316},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.4575999975204468},{"id":"https://openalex.org/C207363949","wikidata":"https://www.wikidata.org/wiki/Q462915","display_name":"Visual space","level":3,"score":0.392300009727478},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.39079999923706055},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.34360000491142273},{"id":"https://openalex.org/C89198739","wikidata":"https://www.wikidata.org/wiki/Q3079880","display_name":"Data stream mining","level":2,"score":0.31540000438690186},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.3111000061035156},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.30970001220703125},{"id":"https://openalex.org/C181095308","wikidata":"https://www.wikidata.org/wiki/Q1541599","display_name":"Geometric primitive","level":2,"score":0.2937999963760376},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.29260000586509705},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.28110000491142273},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.2809999883174896},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.27320000529289246},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.2603999972343445},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.26010000705718994},{"id":"https://openalex.org/C2164484","wikidata":"https://www.wikidata.org/wiki/Q5170150","display_name":"Core (optical fiber)","level":2,"score":0.25519999861717224},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2542000114917755},{"id":"https://openalex.org/C193611912","wikidata":"https://www.wikidata.org/wiki/Q4677596","display_name":"Active vision","level":2,"score":0.25119999051094055},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.25049999356269836}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.13588","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.13588","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.13588","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.13588","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Inspired":[0],"by":[1],"the":[2,54,61,71,80,106,126,148],"human":[3],"visual":[4],"system,":[5],"which":[6,49,94,124],"operates":[7],"on":[8,108,143],"two":[9],"parallel":[10],"yet":[11],"interactive":[12],"streams":[13],"for":[14,84],"contextual":[15,51,81],"and":[16,38,132,154],"spatial":[17],"understanding,":[18],"this":[19],"article":[20],"presents":[21],"Two":[22],"Interactive":[23],"Streams":[24],"(TwInS),":[25],"a":[26,44,90,119],"novel":[27,91],"bio-inspired":[28],"joint":[29],"learning":[30],"framework":[31],"capable":[32],"of":[33,128,150],"simultaneously":[34],"performing":[35],"scene":[36,55,102],"parsing":[37,56],"geometric":[39,62,75,98],"vision":[40,63],"tasks.":[41],"TwInS":[42,114],"adopts":[43],"unified,":[45],"general-purpose":[46],"architecture":[47],"in":[48],"multi-level":[50],"features":[52,76],"from":[53],"stream":[57,64],"are":[58,77],"infused":[59],"into":[60,79],"to":[65,100],"guide":[66],"its":[67,156],"iterative":[68],"refinement.":[69],"In":[70],"reverse":[72],"direction,":[73],"decoded":[74],"projected":[78],"feature":[82,87],"space":[83],"selective":[85],"heterogeneous":[86],"fusion":[88],"via":[89],"cross-task":[92],"adapter,":[93],"leverages":[95],"rich":[96],"cross-view":[97],"cues":[99],"enhance":[101],"parsing.":[103],"To":[104],"eliminate":[105],"dependence":[107],"costly":[109],"human-annotated":[110],"correspondence":[111],"ground":[112],"truth,":[113],"is":[115],"further":[116],"equipped":[117],"with":[118],"tailored":[120],"semi-supervised":[121],"training":[122],"strategy,":[123],"unleashes":[125],"potential":[127],"large-scale":[129],"multi-view":[130],"data":[131],"enables":[133],"continuous":[134],"self-evolution":[135],"without":[136],"requiring":[137],"ground-truth":[138],"correspondences.":[139],"Extensive":[140],"experiments":[141],"conducted":[142],"three":[144],"public":[145],"datasets":[146],"validate":[147],"effectiveness":[149],"TwInS's":[151],"core":[152],"components":[153],"demonstrate":[155],"superior":[157],"performance":[158],"over":[159],"existing":[160],"state-of-the-art":[161],"approaches.":[162],"The":[163],"source":[164],"code":[165],"will":[166],"be":[167],"made":[168],"publicly":[169],"available":[170],"upon":[171],"publication.":[172]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-18T00:00:00"}
