{"id":"https://openalex.org/W3204321269","doi":"https://doi.org/10.1145/3458380.3458399","title":"Siamese Networks with Distance-IoU Loss for Real-time Visual Tracking","display_name":"Siamese Networks with Distance-IoU Loss for Real-time Visual Tracking","publication_year":2021,"publication_date":"2021-02-26","ids":{"openalex":"https://openalex.org/W3204321269","doi":"https://doi.org/10.1145/3458380.3458399","mag":"3204321269"},"language":"en","primary_location":{"id":"doi:10.1145/3458380.3458399","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3458380.3458399","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 5th International Conference on Digital Signal Processing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100449786","display_name":"Shan Liu","orcid":"https://orcid.org/0000-0001-8997-0908"},"institutions":[{"id":"https://openalex.org/I151727225","display_name":"Harbin Engineering University","ror":"https://ror.org/03x80pn82","country_code":"CN","type":"education","lineage":["https://openalex.org/I151727225"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shan Liu","raw_affiliation_strings":["Harbin Engineering University, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Harbin Engineering University, China","institution_ids":["https://openalex.org/I151727225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060643741","display_name":"Lilian Huang","orcid":"https://orcid.org/0000-0002-3589-285X"},"institutions":[{"id":"https://openalex.org/I151727225","display_name":"Harbin Engineering University","ror":"https://ror.org/03x80pn82","country_code":"CN","type":"education","lineage":["https://openalex.org/I151727225"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lilian Huang","raw_affiliation_strings":["Harbin Engineering University, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Harbin Engineering University, China","institution_ids":["https://openalex.org/I151727225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061580251","display_name":"Xu Shi","orcid":"https://orcid.org/0000-0002-6353-5470"},"institutions":[{"id":"https://openalex.org/I151727225","display_name":"Harbin Engineering University","ror":"https://ror.org/03x80pn82","country_code":"CN","type":"education","lineage":["https://openalex.org/I151727225"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xu Shi","raw_affiliation_strings":["Harbin Engineering University, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Harbin Engineering University, China","institution_ids":["https://openalex.org/I151727225"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101577180","display_name":"Yi Sun","orcid":"https://orcid.org/0000-0002-6124-4127"},"institutions":[{"id":"https://openalex.org/I151727225","display_name":"Harbin Engineering University","ror":"https://ror.org/03x80pn82","country_code":"CN","type":"education","lineage":["https://openalex.org/I151727225"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yi Sun","raw_affiliation_strings":["Harbin Engineering University, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Harbin Engineering University, China","institution_ids":["https://openalex.org/I151727225"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.097,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.40809019,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"109","last_page":"115"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11019","display_name":"Image Enhancement Techniques","score":0.9599000215530396,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.9442999958992004,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/subnetwork","display_name":"Subnetwork","score":0.8109264373779297},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7670122385025024},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.703183114528656},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6754745244979858},{"id":"https://openalex.org/keywords/minimum-bounding-box","display_name":"Minimum bounding box","score":0.642314612865448},{"id":"https://openalex.org/keywords/fuse","display_name":"Fuse (electrical)","score":0.5511649250984192},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.5481250882148743},{"id":"https://openalex.org/keywords/backbone-network","display_name":"Backbone network","score":0.5188485383987427},{"id":"https://openalex.org/keywords/video-tracking","display_name":"Video tracking","score":0.49741676449775696},{"id":"https://openalex.org/keywords/tracking","display_name":"Tracking (education)","score":0.4858834147453308},{"id":"https://openalex.org/keywords/bounding-overwatch","display_name":"Bounding overwatch","score":0.4582395553588867},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.4556080400943756},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.41069281101226807},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4092980623245239},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.22747066617012024},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.18288081884384155},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.09294062852859497}],"concepts":[{"id":"https://openalex.org/C2780186347","wikidata":"https://www.wikidata.org/wiki/Q11414","display_name":"Subnetwork","level":2,"score":0.8109264373779297},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7670122385025024},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.703183114528656},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6754745244979858},{"id":"https://openalex.org/C147037132","wikidata":"https://www.wikidata.org/wiki/Q6865426","display_name":"Minimum bounding box","level":3,"score":0.642314612865448},{"id":"https://openalex.org/C141353440","wikidata":"https://www.wikidata.org/wiki/Q182221","display_name":"Fuse (electrical)","level":2,"score":0.5511649250984192},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.5481250882148743},{"id":"https://openalex.org/C88796919","wikidata":"https://www.wikidata.org/wiki/Q1142907","display_name":"Backbone network","level":2,"score":0.5188485383987427},{"id":"https://openalex.org/C202474056","wikidata":"https://www.wikidata.org/wiki/Q1931635","display_name":"Video tracking","level":3,"score":0.49741676449775696},{"id":"https://openalex.org/C2775936607","wikidata":"https://www.wikidata.org/wiki/Q466845","display_name":"Tracking (education)","level":2,"score":0.4858834147453308},{"id":"https://openalex.org/C63584917","wikidata":"https://www.wikidata.org/wiki/Q333286","display_name":"Bounding overwatch","level":2,"score":0.4582395553588867},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4556080400943756},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.41069281101226807},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4092980623245239},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.22747066617012024},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.18288081884384155},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.09294062852859497},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C19417346","wikidata":"https://www.wikidata.org/wiki/Q7922","display_name":"Pedagogy","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3458380.3458399","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3458380.3458399","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 5th International Conference on Digital Signal Processing","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/17","score":0.4099999964237213,"display_name":"Partnerships for the goals"}],"awards":[{"id":"https://openalex.org/G2700002112","display_name":null,"funder_award_id":"No. F201220","funder_id":"https://openalex.org/F4320323085","funder_display_name":"Natural Science Foundation of Heilongjiang Province"},{"id":"https://openalex.org/G5201504206","display_name":null,"funder_award_id":"No. 61203004","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320323085","display_name":"Natural Science Foundation of Heilongjiang Province","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W1955741794","https://openalex.org/W2034803354","https://openalex.org/W2089961441","https://openalex.org/W2117539524","https://openalex.org/W2127589108","https://openalex.org/W2158592639","https://openalex.org/W2613718673","https://openalex.org/W2885238544","https://openalex.org/W2892241171","https://openalex.org/W2915935370","https://openalex.org/W2920338184","https://openalex.org/W2963074722","https://openalex.org/W3039148474","https://openalex.org/W4234552385","https://openalex.org/W4301409532"],"related_works":["https://openalex.org/W4237171675","https://openalex.org/W3036286480","https://openalex.org/W4287027631","https://openalex.org/W3192357901","https://openalex.org/W2387360586","https://openalex.org/W2952736415","https://openalex.org/W3209723314","https://openalex.org/W3205398323","https://openalex.org/W2883297582","https://openalex.org/W4390524233"],"abstract_inverted_index":{"The":[0,75,100,161],"combination":[1],"of":[2,13,21,34,60,96,102,119,142,188],"siamese":[3,35,66],"networks":[4,8,67],"and":[5,29,37,46,80,158,172,177],"region":[6],"proposal":[7],"(RPN)":[9],"has":[10],"drawn":[11],"attention":[12],"a":[14],"great":[15],"many":[16],"scholars":[17],"in":[18,174],"the":[19,42,56,61,65,82,88,97,112,116,120,126,131,140,155,186,189],"field":[20],"visual":[22,73],"object":[23],"tracking":[24,58,143,152,170],"with":[25,68,149],"its":[26],"balanced":[27],"speed":[28],"accuracy.":[30],"SiamRPN":[31],"is":[32,77],"composed":[33],"subnetwork":[36],"RPN":[38],"subnetwork.":[39],"It":[40],"abandons":[41],"traditional":[43],"multi-scale":[44],"testing":[45],"online":[47],"tracking,":[48],"which":[49,137,184],"greatly":[50,138],"meets":[51],"real-time":[52,72],"requirements.":[53],"Aiming":[54],"at":[55,179],"limited":[57],"accuracy":[59,171],"SiamRPN,":[62,136],"we":[63,124],"propose":[64],"Distance-IoU":[69,127],"Loss":[70],"for":[71],"tracking.":[74],"first":[76],"to":[78,92,129],"crop":[79],"fuse":[81],"multi-layer":[83,98],"feature":[84,89],"maps":[85],"extracted":[86],"by":[87,107,135],"extraction":[90],"network":[91,108],"make":[93],"full":[94],"use":[95],"features.":[99],"weights":[101],"weighted":[103],"fusion":[104],"are":[105],"obtained":[106],"learning":[109],"rather":[110],"than":[111],"manual":[113],"setting.":[114],"For":[115],"loss":[117,128,133],"function":[118],"bounding":[121],"box":[122],"regression,":[123],"choose":[125],"replace":[130],"Smooth":[132],"adopted":[134],"improves":[139],"performance":[141],"algorithm.":[144,190],"We":[145],"compare":[146],"our":[147,166],"algorithm":[148,167],"other":[150],"state-of-the-art":[151],"algorithms":[153],"on":[154],"VOT2016,":[156],"VOT2018,":[157],"UAV123":[159],"datasets.":[160],"experimental":[162],"results":[163],"show":[164],"that":[165],"shows":[168],"better":[169],"robustness":[173],"various":[175],"scenarios":[176],"works":[178],"154":[180],"frames":[181],"per":[182],"second,":[183],"verifies":[185],"effectiveness":[187]},"counts_by_year":[{"year":2023,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
