{"id":"https://openalex.org/W4360605045","doi":"https://doi.org/10.1109/icaiic57133.2023.10067104","title":"Semantic Similarity-based Visual Reasoning without Language Information","display_name":"Semantic Similarity-based Visual Reasoning without Language Information","publication_year":2023,"publication_date":"2023-02-20","ids":{"openalex":"https://openalex.org/W4360605045","doi":"https://doi.org/10.1109/icaiic57133.2023.10067104"},"language":"en","primary_location":{"id":"doi:10.1109/icaiic57133.2023.10067104","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/icaiic57133.2023.10067104","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 International Conference on Artificial Intelligence in Information and Communication (ICAIIC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5026718067","display_name":"Chang-Su Choi","orcid":null},"institutions":[{"id":"https://openalex.org/I145808223","display_name":"Hanbat National University","ror":"https://ror.org/00x514t95","country_code":"KR","type":"education","lineage":["https://openalex.org/I145808223"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"ChangSu Choi","raw_affiliation_strings":["Hanbat National University,Department of Computer Engineering,Daejeon,South Korea","Department of Computer Engineering, Hanbat National University, Daejeon, South Korea"],"affiliations":[{"raw_affiliation_string":"Hanbat National University,Department of Computer Engineering,Daejeon,South Korea","institution_ids":["https://openalex.org/I145808223"]},{"raw_affiliation_string":"Department of Computer Engineering, Hanbat National University, Daejeon, South Korea","institution_ids":["https://openalex.org/I145808223"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056276165","display_name":"HyeonSeok Lim","orcid":null},"institutions":[{"id":"https://openalex.org/I145808223","display_name":"Hanbat National University","ror":"https://ror.org/00x514t95","country_code":"KR","type":"education","lineage":["https://openalex.org/I145808223"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"HyeonSeok Lim","raw_affiliation_strings":["Hanbat National University,Department of Computer Engineering,Daejeon,South Korea","Department of Computer Engineering, Hanbat National University, Daejeon, South Korea"],"affiliations":[{"raw_affiliation_string":"Hanbat National University,Department of Computer Engineering,Daejeon,South Korea","institution_ids":["https://openalex.org/I145808223"]},{"raw_affiliation_string":"Department of Computer Engineering, Hanbat National University, Daejeon, South Korea","institution_ids":["https://openalex.org/I145808223"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101745581","display_name":"Ha-Young Jang","orcid":"https://orcid.org/0000-0002-5640-0287"},"institutions":[{"id":"https://openalex.org/I4210148772","display_name":"Helixmith (South Korea)","ror":"https://ror.org/05n9nsw73","country_code":"KR","type":"company","lineage":["https://openalex.org/I4210148772"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Hayoung Jang","raw_affiliation_strings":["Surromind Co., Ltd.,Seoul,South Korea","Surromind Co., Ltd., Seoul, South Korea"],"affiliations":[{"raw_affiliation_string":"Surromind Co., Ltd.,Seoul,South Korea","institution_ids":["https://openalex.org/I4210148772"]},{"raw_affiliation_string":"Surromind Co., Ltd., Seoul, South Korea","institution_ids":["https://openalex.org/I4210148772"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041412501","display_name":"Juhan Park","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Juhan Park","raw_affiliation_strings":["Euclidsoft Co., Ltd.,Daejeon,South Korea","Euclidsoft Co., Ltd., Daejeon, South Korea"],"affiliations":[{"raw_affiliation_string":"Euclidsoft Co., Ltd.,Daejeon,South Korea","institution_ids":[]},{"raw_affiliation_string":"Euclidsoft Co., Ltd., Daejeon, South Korea","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100616087","display_name":"Eunkyung Kim","orcid":"https://orcid.org/0000-0003-3558-7086"},"institutions":[{"id":"https://openalex.org/I145808223","display_name":"Hanbat National University","ror":"https://ror.org/00x514t95","country_code":"KR","type":"education","lineage":["https://openalex.org/I145808223"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Eunkyung Kim","raw_affiliation_strings":["Hanbat National University,Department of AI Software,Daejeon,South Korea","Department of AI Software, Hanbat National University, Daejeon, South Korea"],"affiliations":[{"raw_affiliation_string":"Hanbat National University,Department of AI Software,Daejeon,South Korea","institution_ids":["https://openalex.org/I145808223"]},{"raw_affiliation_string":"Department of AI Software, Hanbat National University, Daejeon, South Korea","institution_ids":["https://openalex.org/I145808223"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5003224328","display_name":"KyungTae Lim","orcid":"https://orcid.org/0000-0002-5818-1161"},"institutions":[{"id":"https://openalex.org/I145808223","display_name":"Hanbat National University","ror":"https://ror.org/00x514t95","country_code":"KR","type":"education","lineage":["https://openalex.org/I145808223"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"KyungTae Lim","raw_affiliation_strings":["Hanbat National University,Department of Computer Engineering,Daejeon,South Korea","Department of Computer Engineering, Hanbat National University, Daejeon, South Korea"],"affiliations":[{"raw_affiliation_string":"Hanbat National University,Department of Computer Engineering,Daejeon,South Korea","institution_ids":["https://openalex.org/I145808223"]},{"raw_affiliation_string":"Department of Computer Engineering, Hanbat National University, Daejeon, South Korea","institution_ids":["https://openalex.org/I145808223"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5026718067"],"corresponding_institution_ids":["https://openalex.org/I145808223"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.018398,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"07461","issue":null,"first_page":"107","last_page":"111"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9904000163078308,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9889000058174133,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7910692691802979},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.702441930770874},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6419258117675781},{"id":"https://openalex.org/keywords/visual-reasoning","display_name":"Visual reasoning","score":0.6419047713279724},{"id":"https://openalex.org/keywords/semantic-similarity","display_name":"Semantic similarity","score":0.5543811917304993},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5259739756584167},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.49607619643211365},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4434930980205536},{"id":"https://openalex.org/keywords/cognitive-neuroscience-of-visual-object-recognition","display_name":"Cognitive neuroscience of visual object recognition","score":0.443334698677063},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.417675256729126},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.3472091555595398},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.1973731517791748}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7910692691802979},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.702441930770874},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6419258117675781},{"id":"https://openalex.org/C2777508537","wikidata":"https://www.wikidata.org/wiki/Q7936620","display_name":"Visual reasoning","level":2,"score":0.6419047713279724},{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.5543811917304993},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5259739756584167},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.49607619643211365},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4434930980205536},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.443334698677063},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.417675256729126},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.3472091555595398},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.1973731517791748},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icaiic57133.2023.10067104","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/icaiic57133.2023.10067104","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 International Conference on Artificial Intelligence in Information and Communication (ICAIIC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.6700000166893005}],"awards":[{"id":"https://openalex.org/G5804139154","display_name":null,"funder_award_id":"2021RIS-004,2021RIFIAI063474","funder_id":"https://openalex.org/F4320311649","funder_display_name":"Ministry of Education"}],"funders":[{"id":"https://openalex.org/F4320311649","display_name":"Ministry of Education","ror":"https://ror.org/036nq5137"},{"id":"https://openalex.org/F4320337337","display_name":"National Institute on Aging","ror":"https://ror.org/049v75w11"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":14,"referenced_works":["https://openalex.org/W2006500696","https://openalex.org/W2088589173","https://openalex.org/W2168983113","https://openalex.org/W2228826686","https://openalex.org/W2489434015","https://openalex.org/W2618530766","https://openalex.org/W2741631785","https://openalex.org/W2799054028","https://openalex.org/W2912371042","https://openalex.org/W2923014074","https://openalex.org/W2963690694","https://openalex.org/W3094502228","https://openalex.org/W3162296828","https://openalex.org/W4312502942"],"related_works":["https://openalex.org/W2974225181","https://openalex.org/W4288108740","https://openalex.org/W4287890973","https://openalex.org/W2153717697","https://openalex.org/W3018936175","https://openalex.org/W2180017908","https://openalex.org/W2289318896","https://openalex.org/W3107290838","https://openalex.org/W4281690070","https://openalex.org/W2131253837"],"abstract_inverted_index":{"In":[0],"this":[1,31,85,92],"research,":[2],"we":[3,47,111],"propose":[4,75],"new":[5],"training":[6,37,69],"data":[7],"for":[8,96,117],"the":[9,25,34,81,107,113],"visual":[10,50,77],"reasoning":[11,121],"task":[12],"based":[13],"on":[14,40,106],"semantic":[15],"similarity":[16],"and":[17,70,101,122],"proposed":[18],"a":[19,41,49,58,60,76],"deep":[20],"learning":[21],"model":[22,79,89,116],"that":[23],"utilizes":[24],"data.":[26,38,56,72],"The":[27,87],"first":[28],"contribution":[29,83],"of":[30,36,43,62,84],"study":[32,93],"is":[33],"construction":[35],"Based":[39,105],"total":[42,61],"40":[44],"object":[45],"attributes,":[46],"created":[48],"inference":[51,78,88],"problem":[52],"using":[53,99],"only":[54],"image":[55],"As":[57],"result,":[59],"6,000":[63],"datasets":[64],"were":[65],"built":[66],"to":[67],"create":[68],"test":[71],"We":[73],"also":[74],"as":[80],"second":[82],"work.":[86],"shown":[90],"in":[91],"was":[94],"evaluated":[95],"two":[97],"tasks":[98],"ResNet50":[100],"Vision":[102],"Transformer,":[103],"respectively.":[104,125],"experimental":[108],"evaluation":[109],"results,":[110],"investigated":[112],"suitable":[114],"pre-trained":[115],"both":[118],"single-choice":[119],"binary":[120],"multiple-selection":[123],"reasoning,":[124]},"counts_by_year":[],"updated_date":"2025-12-24T23:09:58.560324","created_date":"2025-10-10T00:00:00"}
