{"id":"https://openalex.org/W2765837117","doi":"https://doi.org/10.1145/3123266.3123321","title":"Sketch Recognition with Deep Visual-Sequential Fusion Model","display_name":"Sketch Recognition with Deep Visual-Sequential Fusion Model","publication_year":2017,"publication_date":"2017-10-19","ids":{"openalex":"https://openalex.org/W2765837117","doi":"https://doi.org/10.1145/3123266.3123321","mag":"2765837117"},"language":"en","primary_location":{"id":"doi:10.1145/3123266.3123321","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3123266.3123321","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 25th ACM international conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5026022705","display_name":"Jun-Yan He","orcid":"https://orcid.org/0000-0002-6628-6924"},"institutions":[{"id":"https://openalex.org/I4800084","display_name":"Southwest Jiaotong University","ror":"https://ror.org/00hn7w693","country_code":"CN","type":"education","lineage":["https://openalex.org/I4800084"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jun-Yan He","raw_affiliation_strings":["Southwest Jiaotong University, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"Southwest Jiaotong University, Chengdu, China","institution_ids":["https://openalex.org/I4800084"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011680564","display_name":"Xiao Wu","orcid":"https://orcid.org/0000-0002-8322-8558"},"institutions":[{"id":"https://openalex.org/I4800084","display_name":"Southwest Jiaotong University","ror":"https://ror.org/00hn7w693","country_code":"CN","type":"education","lineage":["https://openalex.org/I4800084"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiao Wu","raw_affiliation_strings":["Southwest Jiaotong University, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"Southwest Jiaotong University, Chengdu, China","institution_ids":["https://openalex.org/I4800084"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047962986","display_name":"Yu\u2013Gang Jiang","orcid":"https://orcid.org/0000-0002-1907-8567"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yu-Gang Jiang","raw_affiliation_strings":["Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103114339","display_name":"Bo Zhao","orcid":"https://orcid.org/0000-0002-2120-2571"},"institutions":[{"id":"https://openalex.org/I4800084","display_name":"Southwest Jiaotong University","ror":"https://ror.org/00hn7w693","country_code":"CN","type":"education","lineage":["https://openalex.org/I4800084"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bo Zhao","raw_affiliation_strings":["Southwest Jiaotong University, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"Southwest Jiaotong University, Chengdu, China","institution_ids":["https://openalex.org/I4800084"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5053836350","display_name":"Qiang Peng","orcid":"https://orcid.org/0000-0002-0536-2313"},"institutions":[{"id":"https://openalex.org/I4800084","display_name":"Southwest Jiaotong University","ror":"https://ror.org/00hn7w693","country_code":"CN","type":"education","lineage":["https://openalex.org/I4800084"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qiang Peng","raw_affiliation_strings":["Southwest Jiaotong University, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"Southwest Jiaotong University, Chengdu, China","institution_ids":["https://openalex.org/I4800084"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5026022705"],"corresponding_institution_ids":["https://openalex.org/I4800084"],"apc_list":null,"apc_paid":null,"fwci":1.3845,"has_fulltext":false,"cited_by_count":35,"citation_normalized_percentile":{"value":0.89027417,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":93,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"448","last_page":"456"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.9930999875068665,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9896000027656555,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8364089727401733},{"id":"https://openalex.org/keywords/sketch","display_name":"Sketch","score":0.7465684413909912},{"id":"https://openalex.org/keywords/sketch-recognition","display_name":"Sketch recognition","score":0.6878141164779663},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6797454953193665},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.654051661491394},{"id":"https://openalex.org/keywords/residual","display_name":"Residual","score":0.6449447870254517},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.557647705078125},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5126670598983765},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.5045024156570435},{"id":"https://openalex.org/keywords/fusion","display_name":"Fusion","score":0.43705254793167114},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.11297783255577087}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8364089727401733},{"id":"https://openalex.org/C2779231336","wikidata":"https://www.wikidata.org/wiki/Q7534724","display_name":"Sketch","level":2,"score":0.7465684413909912},{"id":"https://openalex.org/C132900626","wikidata":"https://www.wikidata.org/wiki/Q7534733","display_name":"Sketch recognition","level":4,"score":0.6878141164779663},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6797454953193665},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.654051661491394},{"id":"https://openalex.org/C155512373","wikidata":"https://www.wikidata.org/wiki/Q287450","display_name":"Residual","level":2,"score":0.6449447870254517},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.557647705078125},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5126670598983765},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.5045024156570435},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.43705254793167114},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.11297783255577087},{"id":"https://openalex.org/C207347870","wikidata":"https://www.wikidata.org/wiki/Q371174","display_name":"Gesture","level":2,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C159437735","wikidata":"https://www.wikidata.org/wiki/Q1519524","display_name":"Gesture recognition","level":3,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3123266.3123321","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3123266.3123321","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 25th ACM international conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/14","score":0.5199999809265137,"display_name":"Life below water"}],"awards":[{"id":"https://openalex.org/G5763239087","display_name":null,"funder_award_id":"61373121 and 61622204","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":37,"referenced_works":["https://openalex.org/W1488163396","https://openalex.org/W1923404803","https://openalex.org/W1933349210","https://openalex.org/W1972420097","https://openalex.org/W1976664910","https://openalex.org/W1977841709","https://openalex.org/W1983556963","https://openalex.org/W2026019603","https://openalex.org/W2034136097","https://openalex.org/W2064675550","https://openalex.org/W2066562438","https://openalex.org/W2097117768","https://openalex.org/W2116435618","https://openalex.org/W2121604810","https://openalex.org/W2141345255","https://openalex.org/W2148357922","https://openalex.org/W2149481809","https://openalex.org/W2161565164","https://openalex.org/W2187089797","https://openalex.org/W2189070436","https://openalex.org/W2194775991","https://openalex.org/W2251228688","https://openalex.org/W2267126114","https://openalex.org/W2401231614","https://openalex.org/W2471581439","https://openalex.org/W2472970127","https://openalex.org/W2618530766","https://openalex.org/W2949218037","https://openalex.org/W2950166981","https://openalex.org/W2950761309","https://openalex.org/W2952320381","https://openalex.org/W2952453038","https://openalex.org/W2962835968","https://openalex.org/W2962974137","https://openalex.org/W2963843052","https://openalex.org/W2963954913","https://openalex.org/W3118608800"],"related_works":["https://openalex.org/W2294900353","https://openalex.org/W2411243951","https://openalex.org/W2151314278","https://openalex.org/W13629514","https://openalex.org/W1971224820","https://openalex.org/W2963977451","https://openalex.org/W2098836165","https://openalex.org/W1976890290","https://openalex.org/W1573697454","https://openalex.org/W2966897482"],"abstract_inverted_index":{"In":[0],"this":[1],"paper,":[2],"a":[3,35,138],"deep":[4,48],"end-to-end":[5],"network":[6,120],"for":[7],"sketch":[8,151],"recognition,":[9],"named":[10],"Deep":[11],"Visual-Sequential":[12],"Fusion":[13],"model":[14,19],"(DVSF)":[15],"is":[16,39],"proposed":[17,72,159],"to":[18,42,59,73,92,141],"the":[20,26,30,44,54,75,80,94,101,119,126,132,143,149,155,158,163],"visual":[21,45,55,68,127],"and":[22,56,62,88,96,128],"sequential":[23,57,106,129],"patterns":[24,77,102],"of":[25,33,103,131,157],"strokes.":[27],"To":[28,99],"capture":[29,60],"intermediate":[31],"states":[32],"sketches,":[34],"three-way":[36],"representation":[37],"learner":[38],"first":[40],"utilized":[41],"extract":[43],"features.":[46],"These":[47],"features":[49],"are":[50,70,108,134],"simultaneously":[51],"fed":[52],"into":[53],"networks":[58,69,107],"spatial":[61],"temporal":[63],"properties,":[64],"respectively.":[65],"More":[66],"specifically,":[67],"novelly":[71],"learn":[74,100],"stroke":[76,104],"by":[78,110,122],"stacking":[79],"Residual":[81,111],"Fully-Connected":[82],"(R-FC)":[83],"layers,":[84],"which":[85,117,161],"integrate":[86],"ReLU":[87],"Tanh":[89],"activation":[90],"functions":[91],"achieve":[93],"sparsity":[95],"generalization":[97],"ability.":[98],"order,":[105],"constructed":[109],"Long":[112],"Short-Term":[113],"Memory":[114],"(R-LSTM)":[115],"units,":[116],"optimize":[118],"architecture":[121],"skip":[123],"connection.":[124],"Finally,":[125],"representations":[130],"sketches":[133],"seamlessly":[135],"integrated":[136],"with":[137],"fusion":[139],"layer":[140],"obtain":[142],"final":[144],"results.":[145],"Experiments":[146],"conducted":[147],"on":[148],"benchmark":[150],"dataset":[152],"TU-Berlin":[153],"demonstrate":[154],"effectiveness":[156],"method,":[160],"outperforms":[162],"state-of-the-art":[164],"approaches.":[165]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":6},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":7},{"year":2019,"cited_by_count":5},{"year":2018,"cited_by_count":3}],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-10T00:00:00"}
