{"id":"https://openalex.org/W2793987571","doi":"https://doi.org/10.5220/0006544001770184","title":"Simultaneous Object Classification and Viewpoint Estimation using Deep Multi-task Convolutional Neural Network","display_name":"Simultaneous Object Classification and Viewpoint Estimation using Deep Multi-task Convolutional Neural Network","publication_year":2018,"publication_date":"2018-01-01","ids":{"openalex":"https://openalex.org/W2793987571","doi":"https://doi.org/10.5220/0006544001770184","mag":"2793987571"},"language":"en","primary_location":{"id":"doi:10.5220/0006544001770184","is_oa":true,"landing_page_url":"https://doi.org/10.5220/0006544001770184","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 13th International Joint Conference on Computer Vision, Imaging and Computer Graphics Theory and Applications","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.5220/0006544001770184","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5039719067","display_name":"Ahmed J. Afifi","orcid":"https://orcid.org/0000-0001-6782-6753"},"institutions":[{"id":"https://openalex.org/I4577782","display_name":"Technische Universit\u00e4t Berlin","ror":"https://ror.org/03v4gjf40","country_code":"DE","type":"education","lineage":["https://openalex.org/I4577782"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Ahmed J. Afifi","raw_affiliation_strings":["Technische Universit\u00e4t Berlin, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Technische Universit\u00e4t Berlin, Germany","institution_ids":["https://openalex.org/I4577782"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081055268","display_name":"Olaf Hellwich","orcid":"https://orcid.org/0000-0002-2871-9266"},"institutions":[{"id":"https://openalex.org/I4577782","display_name":"Technische Universit\u00e4t Berlin","ror":"https://ror.org/03v4gjf40","country_code":"DE","type":"education","lineage":["https://openalex.org/I4577782"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Olaf Hellwich","raw_affiliation_strings":["Technische Universit\u00e4t Berlin, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Technische Universit\u00e4t Berlin, Germany","institution_ids":["https://openalex.org/I4577782"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5012087887","display_name":"Toufique Ahmed Soomro","orcid":"https://orcid.org/0000-0001-7191-6356"},"institutions":[{"id":"https://openalex.org/I153230381","display_name":"Charles Sturt University","ror":"https://ror.org/00wfvh315","country_code":"AU","type":"education","lineage":["https://openalex.org/I153230381"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Toufique A. Soomro","raw_affiliation_strings":["Charles Sturt University, Australia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Charles Sturt University, Australia","institution_ids":["https://openalex.org/I153230381"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.53,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.70307514,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"177","last_page":"184"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.8116000294685364,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.8116000294685364,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12111","display_name":"Industrial Vision Systems and Defect Detection","score":0.8050000071525574,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.8328068256378174},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8096444606781006},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.711359441280365},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6285496950149536},{"id":"https://openalex.org/keywords/estimation","display_name":"Estimation","score":0.5823310017585754},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.540305495262146},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5026311874389648},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.49006664752960205},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.473058819770813},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.4342181086540222},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4260816276073456},{"id":"https://openalex.org/keywords/deep-neural-networks","display_name":"Deep neural networks","score":0.4231211543083191},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.06700319051742554}],"concepts":[{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.8328068256378174},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8096444606781006},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.711359441280365},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6285496950149536},{"id":"https://openalex.org/C96250715","wikidata":"https://www.wikidata.org/wiki/Q965330","display_name":"Estimation","level":2,"score":0.5823310017585754},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.540305495262146},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5026311874389648},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.49006664752960205},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.473058819770813},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.4342181086540222},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4260816276073456},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.4231211543083191},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.06700319051742554},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.5220/0006544001770184","is_oa":true,"landing_page_url":"https://doi.org/10.5220/0006544001770184","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 13th International Joint Conference on Computer Vision, Imaging and Computer Graphics Theory and Applications","raw_type":"proceedings-article"},{"id":"pmh:oai:pure.atira.dk:publications/71ea3614-7155-45a9-b539-758962730d3e","is_oa":true,"landing_page_url":"https://researchoutput.csu.edu.au/en/publications/71ea3614-7155-45a9-b539-758962730d3e","pdf_url":null,"source":{"id":"https://openalex.org/S7407055442","display_name":"Charles Sturt University Research Output (CRO)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Afifi, A J, Hellwich, O & Soomro, T A 2018, Simultaneous object classification and viewpoint estimation using deep multi-task convolutional neural network. in F Imai, A Tremeau & J Braz (eds), Proceedings of the 13th International Joint Conference on Computer Vision, Imaging and Computer Graphics Theory and Applications : Volume 5: VISAPP. vol. 5, Scitepress, Portugal, pp. 177-184, 13th International Joint Conference on Computer Vision, Imaging and Computer Graphics Theory and Applications, VISIGRAPP 2018, Funchal, Portugal, 27/01/18. https://doi.org/10.5220/0006544001770184","raw_type":"info:eu-repo/semantics/publishedVersion"}],"best_oa_location":{"id":"doi:10.5220/0006544001770184","is_oa":true,"landing_page_url":"https://doi.org/10.5220/0006544001770184","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 13th International Joint Conference on Computer Vision, Imaging and Computer Graphics Theory and Applications","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4226493464","https://openalex.org/W4312417841","https://openalex.org/W3133861977","https://openalex.org/W2951211570","https://openalex.org/W3103566983","https://openalex.org/W3167935049","https://openalex.org/W3029198973","https://openalex.org/W2949096641","https://openalex.org/W2970686063","https://openalex.org/W2969228573"],"abstract_inverted_index":{"Convolutional":[0],"Neural":[1],"Networks":[2],"(CNNs)":[3],"have":[4],"shown":[5],"an":[6],"impressive":[7],"performance":[8],"in":[9,48,196],"many":[10],"computer":[11],"vision":[12],"tasks.":[13,186],"Most":[14],"of":[15,36,50,72,101,203,211],"the":[16,34,70,73,76,102,107,111,128,133,163,165,177,201,209,212],"CNN":[17,30,88,103],"architectures":[18],"were":[19],"proposed":[20,134,147,166],"to":[21,32,58,117,126,131,144,162,180,193,199,207],"solve":[22,118,200],"a":[23,29,86,152,170],"single":[24],"task.":[25],"This":[26,79],"paper":[27],"proposes":[28],"model":[31,167],"tackle":[33],"problem":[35,83],"object":[37,54,92,156],"classification":[38,55,93],"and":[39,94,110,158,206],"viewpoint":[40,60,63,74,95,159],"estimation":[41,64,96],"simultaneously,":[42],"where":[43,173],"these":[44],"problems":[45],"are":[46,124],"opposite":[47],"terms":[49],"feature":[51],"representation.":[52],"While":[53],"task":[56,65,120],"aims":[57],"learn":[59],"invariant":[61],"features,":[62],"requires":[66],"features":[67,183],"that":[68,90],"capture":[69],"variations":[71],"for":[75,155,184],"same":[77],"object.":[78],"study":[80],"addresses":[81],"this":[82],"by":[84],"introducing":[85],"multi-task":[87,171],"architecture":[89],"performs":[91,168],"simultaneously.":[97],"The":[98],"first":[99],"part":[100,113],"is":[104,114,142,151],"shared":[105,178],"between":[106],"two":[108,115],"tasks,":[109],"second":[112],"subnetworks":[116],"each":[119],"separately.":[121],"Synthetic":[122],"images":[123,195],"used":[125,143,192],"increase":[127],"training":[129,204,210],"dataset":[130,141,154],"train":[132],"model.":[135],"To":[136],"evaluate":[137],"our":[138,146],"model,":[139,148,172],"PASCAL3D+":[140],"test":[145],"as":[149,169],"it":[150],"challenging":[153],"detection":[157],"estimation.":[160],"According":[161],"results,":[164],"we":[174],"can":[175,190],"exploit":[176],"layers":[179],"feed":[181],"their":[182],"different":[185,197],"Moreover,":[187],"3D":[188],"models":[189],"be":[191],"render":[194],"conditions":[198],"lack":[202],"data":[205],"enhance":[208],"CNNs.":[213]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
