{"id":"https://openalex.org/W7148356481","doi":"https://doi.org/10.48550/arxiv.2604.00363","title":"A Dual-Stream Transformer Architecture for Illumination-Invariant TIR-LiDAR Person Tracking","display_name":"A Dual-Stream Transformer Architecture for Illumination-Invariant TIR-LiDAR Person Tracking","publication_year":2026,"publication_date":"2026-04-01","ids":{"openalex":"https://openalex.org/W7148356481","doi":"https://doi.org/10.48550/arxiv.2604.00363"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.00363","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.00363","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.00363","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5120788633","display_name":"Yuki Minase","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Minase, Yuki","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5030913821","display_name":"Kanji Tanaka","orcid":"https://orcid.org/0000-0001-5584-3521"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tanaka, Kanji","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5120788633"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.8912000060081482,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.8912000060081482,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.01850000023841858,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12740","display_name":"Gait Recognition and Analysis","score":0.015200000256299973,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robotics","display_name":"Robotics","score":0.5662000179290771},{"id":"https://openalex.org/keywords/suite","display_name":"Suite","score":0.5223000049591064},{"id":"https://openalex.org/keywords/tracking","display_name":"Tracking (education)","score":0.49779999256134033},{"id":"https://openalex.org/keywords/prior-probability","display_name":"Prior probability","score":0.43549999594688416},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.4203999936580658},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.4020000100135803}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7293999791145325},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5963000059127808},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.5662000179290771},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5400999784469604},{"id":"https://openalex.org/C79581498","wikidata":"https://www.wikidata.org/wiki/Q1367530","display_name":"Suite","level":2,"score":0.5223000049591064},{"id":"https://openalex.org/C2775936607","wikidata":"https://www.wikidata.org/wiki/Q466845","display_name":"Tracking (education)","level":2,"score":0.49779999256134033},{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.43549999594688416},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.4203999936580658},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.4020000100135803},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.37400001287460327},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.3294999897480011},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.3181000053882599},{"id":"https://openalex.org/C154586513","wikidata":"https://www.wikidata.org/wiki/Q4420972","display_name":"Tracking system","level":3,"score":0.3165000081062317},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.3046000003814697},{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.2922999858856201},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.29030001163482666},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.2635999917984009}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.00363","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.00363","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.00363","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.00363","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/8","score":0.5686915516853333,"display_name":"Decent work and economic growth"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Robust":[0],"person":[1],"tracking":[2,19,52,73],"is":[3,74],"a":[4,46,86,96,106,155,171],"critical":[5],"capability":[6],"for":[7,176],"autonomous":[8],"mobile":[9],"robots":[10],"operating":[11],"in":[12,71,179],"diverse":[13],"and":[14,49,65,154,165,173],"unpredictable":[15],"environments.":[16],"While":[17],"RGB-D":[18],"has":[20],"shown":[21],"high":[22],"precision,":[23],"its":[24],"performance":[25],"severely":[26],"degrades":[27],"under":[28],"challenging":[29],"illumination":[30],"conditions,":[31],"such":[32],"as":[33,114],"total":[34],"darkness":[35],"or":[36],"intense":[37],"backlighting.":[38],"To":[39,81],"achieve":[40],"all-weather":[41,180],"robustness,":[42],"this":[43],"paper":[44],"proposes":[45],"novel":[47],"Thermal-Infrared":[48],"Depth":[50],"(TIR-D)":[51],"architecture":[53],"that":[54,91,139],"leverages":[55],"the":[56,75,101],"standard":[57],"sensor":[58],"suite":[59],"of":[60,77,152,159],"SLAM-capable":[61],"robots,":[62],"namely":[63],"LiDAR":[64],"TIR":[66],"cameras.":[67],"A":[68],"major":[69],"challenge":[70],"TIR-D":[72,102,142],"scarcity":[76],"annotated":[78],"multi-modal":[79],"datasets.":[80],"address":[82],"this,":[83],"we":[84,121],"introduce":[85],"sequential":[87],"knowledge":[88],"transfer":[89],"strategy":[90,110],"evolves":[92],"structural":[93],"priors":[94],"from":[95],"large-scale":[97],"thermal-trained":[98],"model":[99],"into":[100],"domain.":[103],"By":[104],"employing":[105],"differential":[107],"learning":[108],"rate":[109],"--":[111,120],"referred":[112],"to":[113,132],"``Fine-grained":[115],"Differential":[116],"Learning":[117],"Rate":[118,157],"Strategy''":[119],"effectively":[122],"preserve":[123],"pre-trained":[124],"feature":[125],"extraction":[126],"capabilities":[127],"while":[128],"enabling":[129],"rapid":[130],"adaptation":[131],"geometric":[133],"depth":[134],"cues.":[135],"Experimental":[136],"results":[137],"demonstrate":[138],"our":[140],"proposed":[141],"tracker":[143],"achieves":[144],"superior":[145],"performance,":[146],"with":[147],"an":[148],"Average":[149],"Overlap":[150],"(AO)":[151],"0.700":[153],"Success":[156],"(SR)":[158],"58.7\\%,":[160],"significantly":[161],"outperforming":[162],"conventional":[163],"RGB-transfer":[164],"single-modality":[166],"baselines.":[167],"Our":[168],"approach":[169],"provides":[170],"practical":[172],"resource-efficient":[174],"solution":[175],"robust":[177],"human-following":[178],"robotics":[181],"applications.":[182]},"counts_by_year":[],"updated_date":"2026-04-03T16:44:17.987007","created_date":"2026-04-03T00:00:00"}
