{"id":"https://openalex.org/W4392824587","doi":"https://doi.org/10.1145/3638584.3638633","title":"Towards Discrete Object Representations in Vision Transformers with Tensor Products","display_name":"Towards Discrete Object Representations in Vision Transformers with Tensor Products","publication_year":2023,"publication_date":"2023-12-08","ids":{"openalex":"https://openalex.org/W4392824587","doi":"https://doi.org/10.1145/3638584.3638633"},"language":"en","primary_location":{"id":"doi:10.1145/3638584.3638633","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3638584.3638633","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3638584.3638633","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2023 7th International Conference on Computer Science and Artificial Intelligence","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3638584.3638633","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5027826572","display_name":"Wei Yuen Teh","orcid":"https://orcid.org/0000-0002-2719-6870"},"institutions":[{"id":"https://openalex.org/I11662577","display_name":"Monash University Malaysia","ror":"https://ror.org/00yncr324","country_code":"MY","type":"education","lineage":["https://openalex.org/I11662577"]}],"countries":["MY"],"is_corresponding":true,"raw_author_name":"Wei Yuen Teh","raw_affiliation_strings":["School of Information Technology, Monash University Malaysia, Malaysia"],"affiliations":[{"raw_affiliation_string":"School of Information Technology, Monash University Malaysia, Malaysia","institution_ids":["https://openalex.org/I11662577"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031567819","display_name":"Chern Hong Lim","orcid":"https://orcid.org/0000-0003-4754-6724"},"institutions":[{"id":"https://openalex.org/I11662577","display_name":"Monash University Malaysia","ror":"https://ror.org/00yncr324","country_code":"MY","type":"education","lineage":["https://openalex.org/I11662577"]}],"countries":["MY"],"is_corresponding":false,"raw_author_name":"Chern Hong Lim","raw_affiliation_strings":["School of Information Technology, Monash University Malaysia, Malaysia"],"affiliations":[{"raw_affiliation_string":"School of Information Technology, Monash University Malaysia, Malaysia","institution_ids":["https://openalex.org/I11662577"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046137969","display_name":"Mei Kuan Lim","orcid":"https://orcid.org/0000-0001-8834-9933"},"institutions":[{"id":"https://openalex.org/I11662577","display_name":"Monash University Malaysia","ror":"https://ror.org/00yncr324","country_code":"MY","type":"education","lineage":["https://openalex.org/I11662577"]}],"countries":["MY"],"is_corresponding":false,"raw_author_name":"Mei Kuan Lim","raw_affiliation_strings":["School of Information Technology, Monash University Malaysia, Malaysia"],"affiliations":[{"raw_affiliation_string":"School of Information Technology, Monash University Malaysia, Malaysia","institution_ids":["https://openalex.org/I11662577"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5035077941","display_name":"Ian K. T. Tan","orcid":"https://orcid.org/0000-0003-1474-8717"},"institutions":[{"id":"https://openalex.org/I4210085930","display_name":"Heriot-Watt University Malaysia","ror":"https://ror.org/0059w0420","country_code":"MY","type":"education","lineage":["https://openalex.org/I4210085930"]}],"countries":["MY"],"is_corresponding":false,"raw_author_name":"Ian K.T. Tan","raw_affiliation_strings":["Heriot-Watt University Malaysia, Malaysia"],"affiliations":[{"raw_affiliation_string":"Heriot-Watt University Malaysia, Malaysia","institution_ids":["https://openalex.org/I4210085930"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5027826572"],"corresponding_institution_ids":["https://openalex.org/I11662577"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.20903615,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"190","last_page":"194"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.5701953172683716},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5384924411773682},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.5232683420181274},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.47608843445777893},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.12806853652000427},{"id":"https://openalex.org/keywords/electrical-engineering","display_name":"Electrical engineering","score":0.0851794183254242}],"concepts":[{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5701953172683716},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5384924411773682},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.5232683420181274},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.47608843445777893},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.12806853652000427},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0851794183254242},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3638584.3638633","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3638584.3638633","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3638584.3638633","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2023 7th International Conference on Computer Science and Artificial Intelligence","raw_type":"proceedings-article"},{"id":"pmh:oai:monash.edu:openaire/c314acde-0c80-4f54-9c61-534f46f6c838","is_oa":true,"landing_page_url":"https://research.monash.edu/en/publications/c314acde-0c80-4f54-9c61-534f46f6c838","pdf_url":"https://researchmgt.monash.edu/ws/files/609284930/541582214_oa.pdf","source":{"id":"https://openalex.org/S4306402625","display_name":"Monash University Research Portal (Monash University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I56590836","host_organization_name":"Monash University","host_organization_lineage":["https://openalex.org/I56590836"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Teh, W Y, Lim, C H, Lim, M K & Tan, I K T 2023, Towards Discrete Object Representations in Vision Transformers with Tensor Products. in E Jiang, Y Sun, Y Liu, R Cheng & S Huang (eds), CSAI 2023, 2023 International Conference on Computer Science and Artificial Intelligence. Association for Computing Machinery (ACM), New York NY USA, pp. 190-194, International Conference on Computer Science and Artificial Intelligence 2023, Beijing, China, 8/12/23. https://doi.org/10.1145/3638584.3638633","raw_type":"contributionToPeriodical"}],"best_oa_location":{"id":"doi:10.1145/3638584.3638633","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3638584.3638633","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3638584.3638633","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2023 7th International Conference on Computer Science and Artificial Intelligence","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4392824587.pdf","grobid_xml":"https://content.openalex.org/works/W4392824587.grobid-xml"},"referenced_works_count":5,"referenced_works":["https://openalex.org/W2966661","https://openalex.org/W2108598243","https://openalex.org/W2618530766","https://openalex.org/W2898526707","https://openalex.org/W3121523901"],"related_works":["https://openalex.org/W2058170566","https://openalex.org/W2755342338","https://openalex.org/W2772917594","https://openalex.org/W2775347418","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2951359407","https://openalex.org/W2079911747","https://openalex.org/W1969923398"],"abstract_inverted_index":{"In":[0],"this":[1],"work,":[2],"we":[3,74],"explore":[4],"the":[5,35,65,83,89],"use":[6,84],"of":[7,43,68,85,91],"Tensor":[8,36],"Product":[9,37],"Representations":[10],"(TPRs)":[11],"in":[12,29],"a":[13,30,44,101],"Vision":[14,38,45,103],"Transformer":[15,39,46],"model":[16],"to":[17,60,100],"form":[18],"image":[19],"representations":[20,97],"that":[21,47,54,82],"can":[22],"later":[23],"be":[24],"used":[25],"for":[26,88],"symbolic":[27],"manipulation":[28],"neurosymbolic":[31],"model.":[32],"We":[33],"propose":[34],"(TP-ViT),":[40],"an":[41,50],"enhancement":[42],"incorporates":[48],"TPRs,":[49],"object":[51,96],"representation":[52],"methodology":[53],"utilizes":[55],"filler":[56],"and":[57,73,77,94],"role":[58],"vectors":[59],"represent":[61],"objects.":[62],"TP-ViT":[63],"is":[64],"first":[66],"application":[67],"TPRs":[69,86],"on":[70],"visual":[71],"input,":[72],"report":[75],"qualitative":[76],"quantitative":[78],"results":[79],"which":[80],"show":[81],"allows":[87],"formation":[90],"more":[92],"targeted":[93],"diverse":[95],"when":[98],"compared":[99],"standard":[102],"Transformer.":[104]},"counts_by_year":[],"updated_date":"2026-03-10T16:38:18.471706","created_date":"2025-10-10T00:00:00"}
