{"id":"https://openalex.org/W7134038225","doi":"https://doi.org/10.3233/faia260017","title":"Multi-Stage Learning for Visually Similar Road User Detection and Tracking","display_name":"Multi-Stage Learning for Visually Similar Road User Detection and Tracking","publication_year":2026,"publication_date":"2026-03-04","ids":{"openalex":"https://openalex.org/W7134038225","doi":"https://doi.org/10.3233/faia260017"},"language":null,"primary_location":{"id":"doi:10.3233/faia260017","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia260017","pdf_url":null,"source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.3233/faia260017","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100989543","display_name":"Young Chul Lim","orcid":"https://orcid.org/0009-0003-5229-360X"},"institutions":[{"id":"https://openalex.org/I193352282","display_name":"Daegu Gyeongbuk Institute of Science and Technology","ror":"https://ror.org/03frjya69","country_code":"KR","type":"education","lineage":["https://openalex.org/I193352282"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Young Chul Lim","raw_affiliation_strings":["Division of Mobility Technology, Daegu Gyeongbuk Institute of Science & Technology, Korea"],"raw_orcid":"https://orcid.org/0009-0003-5229-360X","affiliations":[{"raw_affiliation_string":"Division of Mobility Technology, Daegu Gyeongbuk Institute of Science & Technology, Korea","institution_ids":["https://openalex.org/I193352282"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5128222091","display_name":"Minsung Kang","orcid":null},"institutions":[{"id":"https://openalex.org/I193352282","display_name":"Daegu Gyeongbuk Institute of Science and Technology","ror":"https://ror.org/03frjya69","country_code":"KR","type":"education","lineage":["https://openalex.org/I193352282"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Minsung Kang","raw_affiliation_strings":["Division of Mobility Technology, Daegu Gyeongbuk Institute of Science & Technology, Korea"],"raw_orcid":"https://orcid.org/0000-0003-4018-8514","affiliations":[{"raw_affiliation_string":"Division of Mobility Technology, Daegu Gyeongbuk Institute of Science & Technology, Korea","institution_ids":["https://openalex.org/I193352282"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5100989543"],"corresponding_institution_ids":["https://openalex.org/I193352282"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.58904773,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.7634999752044678,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.7634999752044678,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.13779999315738678,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.039000000804662704,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.6482999920845032},{"id":"https://openalex.org/keywords/video-tracking","display_name":"Video tracking","score":0.5282999873161316},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5188000202178955},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.503600001335144},{"id":"https://openalex.org/keywords/identity","display_name":"Identity (music)","score":0.45100000500679016},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.44029998779296875},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.43939998745918274},{"id":"https://openalex.org/keywords/tracking","display_name":"Tracking (education)","score":0.4372999966144562},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.4359999895095825}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.8004999756813049},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7753000259399414},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.6482999920845032},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6065999865531921},{"id":"https://openalex.org/C202474056","wikidata":"https://www.wikidata.org/wiki/Q1931635","display_name":"Video tracking","level":3,"score":0.5282999873161316},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5188000202178955},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.503600001335144},{"id":"https://openalex.org/C2778355321","wikidata":"https://www.wikidata.org/wiki/Q17079427","display_name":"Identity (music)","level":2,"score":0.45100000500679016},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.44029998779296875},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.43939998745918274},{"id":"https://openalex.org/C2775936607","wikidata":"https://www.wikidata.org/wiki/Q466845","display_name":"Tracking (education)","level":2,"score":0.4372999966144562},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.4359999895095825},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.4165000021457672},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.3840000033378601},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.35199999809265137},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.35179999470710754},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.3508000075817108},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.3504999876022339},{"id":"https://openalex.org/C71681937","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object-class detection","level":5,"score":0.3456000089645386},{"id":"https://openalex.org/C18555067","wikidata":"https://www.wikidata.org/wiki/Q8375051","display_name":"Joint (building)","level":2,"score":0.3174999952316284},{"id":"https://openalex.org/C83248878","wikidata":"https://www.wikidata.org/wiki/Q344000","display_name":"Active appearance model","level":3,"score":0.29739999771118164},{"id":"https://openalex.org/C56461940","wikidata":"https://www.wikidata.org/wiki/Q970687","display_name":"Eye tracking","level":2,"score":0.2915000021457672},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.2888000011444092},{"id":"https://openalex.org/C142853389","wikidata":"https://www.wikidata.org/wiki/Q744778","display_name":"Association (psychology)","level":2,"score":0.28349998593330383},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.2793000042438507},{"id":"https://openalex.org/C154586513","wikidata":"https://www.wikidata.org/wiki/Q4420972","display_name":"Tracking system","level":3,"score":0.2784999907016754},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.2750999927520752},{"id":"https://openalex.org/C89992363","wikidata":"https://www.wikidata.org/wiki/Q5961558","display_name":"Track (disk drive)","level":2,"score":0.26809999346733093},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.25099998712539673}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.3233/faia260017","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia260017","pdf_url":null,"source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"}],"best_oa_location":{"id":"doi:10.3233/faia260017","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia260017","pdf_url":null,"source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"This":[0],"paper":[1],"presents":[2],"a":[3,58,63,76,91],"unified":[4,109],"deep":[5],"learning":[6,66,79],"framework":[7],"for":[8,68,81],"multi-class":[9],"detection":[10,52,71,103,139],"and":[11,30,42,53,72,89,104,116,140],"tracking":[12,142],"of":[13],"visually":[14],"similar":[15,46],"road":[16,20,33],"users":[17],"in":[18,136],"complex":[19],"environments.":[21],"The":[22,108],"proposed":[23,131],"system":[24],"is":[25],"designed":[26],"to":[27,94],"accurately":[28],"distinguish":[29],"track":[31],"various":[32],"entities\u2014such":[34],"as":[35],"cars,":[36],"buses,":[37],"trucks,":[38],"bicycles,":[39],"motorcycles,":[40],"pedestrians,":[41],"riders\u2014which":[43],"often":[44],"exhibit":[45],"visual":[47],"features.":[48],"To":[49],"achieve":[50],"robust":[51],"instance-aware":[54],"tracking,":[55],"we":[56],"adopt":[57],"three-stage":[59],"training":[60],"strategy:":[61],"(1)":[62],"supervised":[64],"multi-task":[65],"stage":[67,80,93],"joint":[69],"object":[70,96,113],"class":[73],"identification,":[74],"(2)":[75],"self-supervised":[77],"contrastive":[78],"extracting":[82],"instance-level":[83],"feature":[84,105],"embeddings":[85],"without":[86],"identity":[87,121],"labels,":[88],"(3)":[90],"fine-tuning":[92],"improve":[95],"identification":[97],"accuracy":[98],"by":[99],"refining":[100],"both":[101,137],"the":[102,130],"embedding":[106],"heads.":[107],"network":[110],"simultaneously":[111],"outputs":[112],"classes,":[114],"locations,":[115],"appearance":[117],"embeddings,":[118],"enabling":[119],"consistent":[120],"association":[122],"across":[123],"video":[124],"frames.":[125],"Experimental":[126],"results":[127],"demonstrate":[128],"that":[129],"method":[132],"outperforms":[133],"existing":[134],"approaches":[135],"fine-grained":[138],"multi-object":[141],"accuracy.":[143]},"counts_by_year":[],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2026-03-07T00:00:00"}
