{"id":"https://openalex.org/W3132408188","doi":"https://doi.org/10.5220/0010261301460156","title":"Few-shot Linguistic Grounding of Visual Attributes and Relations using Gaussian Kernels","display_name":"Few-shot Linguistic Grounding of Visual Attributes and Relations using Gaussian Kernels","publication_year":2021,"publication_date":"2021-01-01","ids":{"openalex":"https://openalex.org/W3132408188","doi":"https://doi.org/10.5220/0010261301460156","mag":"3132408188"},"language":"en","primary_location":{"id":"doi:10.5220/0010261301460156","is_oa":true,"landing_page_url":"https://doi.org/10.5220/0010261301460156","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 16th International Joint Conference on Computer Vision, Imaging and Computer Graphics Theory and Applications","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.5220/0010261301460156","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5029529703","display_name":"Daniel Koudouna","orcid":null},"institutions":[{"id":"https://openalex.org/I16835326","display_name":"University of St Andrews","ror":"https://ror.org/02wn5qz54","country_code":"GB","type":"education","lineage":["https://openalex.org/I16835326"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Daniel Koudouna","raw_affiliation_strings":["School of Computer Science, University of St Andrews, U.K., --- Select a Country ---"],"affiliations":[{"raw_affiliation_string":"School of Computer Science, University of St Andrews, U.K., --- Select a Country ---","institution_ids":["https://openalex.org/I16835326"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5053472065","display_name":"Kasim Terzi\u0107","orcid":"https://orcid.org/0000-0001-6692-209X"},"institutions":[{"id":"https://openalex.org/I16835326","display_name":"University of St Andrews","ror":"https://ror.org/02wn5qz54","country_code":"GB","type":"education","lineage":["https://openalex.org/I16835326"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Kasim Terzi\u0107","raw_affiliation_strings":["School of Computer Science, University of St Andrews, U.K., --- Select a Country ---"],"affiliations":[{"raw_affiliation_string":"School of Computer Science, University of St Andrews, U.K., --- Select a Country ---","institution_ids":["https://openalex.org/I16835326"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5029529703"],"corresponding_institution_ids":["https://openalex.org/I16835326"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.01988562,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"146","last_page":"156"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6695429086685181},{"id":"https://openalex.org/keywords/shot","display_name":"Shot (pellet)","score":0.640743613243103},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5735132694244385},{"id":"https://openalex.org/keywords/ground","display_name":"Ground","score":0.5724835395812988},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5374053120613098},{"id":"https://openalex.org/keywords/gaussian","display_name":"Gaussian","score":0.48833534121513367},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.3922763466835022},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.10090300440788269},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.1000501811504364},{"id":"https://openalex.org/keywords/philosophy","display_name":"Philosophy","score":0.087289959192276},{"id":"https://openalex.org/keywords/electrical-engineering","display_name":"Electrical engineering","score":0.056490927934646606}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6695429086685181},{"id":"https://openalex.org/C2778344882","wikidata":"https://www.wikidata.org/wiki/Q278938","display_name":"Shot (pellet)","level":2,"score":0.640743613243103},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5735132694244385},{"id":"https://openalex.org/C168993435","wikidata":"https://www.wikidata.org/wiki/Q6501125","display_name":"Ground","level":2,"score":0.5724835395812988},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5374053120613098},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.48833534121513367},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.3922763466835022},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.10090300440788269},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.1000501811504364},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.087289959192276},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.056490927934646606},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.5220/0010261301460156","is_oa":true,"landing_page_url":"https://doi.org/10.5220/0010261301460156","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 16th International Joint Conference on Computer Vision, Imaging and Computer Graphics Theory and Applications","raw_type":"proceedings-article"},{"id":"pmh:oai:research-repository.st-andrews.ac.uk:10023/21653","is_oa":true,"landing_page_url":"https://hdl.handle.net/10023/21653","pdf_url":null,"source":{"id":"https://openalex.org/S4306400230","display_name":"St Andrews Research Repository (St Andrews Research Repository)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I16835326","host_organization_name":"University of St Andrews","host_organization_lineage":["https://openalex.org/I16835326"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Conference item"}],"best_oa_location":{"id":"doi:10.5220/0010261301460156","is_oa":true,"landing_page_url":"https://doi.org/10.5220/0010261301460156","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 16th International Joint Conference on Computer Vision, Imaging and Computer Graphics Theory and Applications","raw_type":"proceedings-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","score":0.4699999988079071,"display_name":"Reduced inequalities"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320309480","display_name":"Nvidia","ror":"https://ror.org/03jdj4y14"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":33,"referenced_works":["https://openalex.org/W56479147","https://openalex.org/W290564607","https://openalex.org/W1746737644","https://openalex.org/W1796264214","https://openalex.org/W2010239981","https://openalex.org/W2013335841","https://openalex.org/W2016429292","https://openalex.org/W2111807093","https://openalex.org/W2144209400","https://openalex.org/W2479423890","https://openalex.org/W2555897561","https://openalex.org/W2583360688","https://openalex.org/W2607855566","https://openalex.org/W2740962769","https://openalex.org/W2766324327","https://openalex.org/W2789177853","https://openalex.org/W2795378892","https://openalex.org/W2962716332","https://openalex.org/W2962737704","https://openalex.org/W2962837320","https://openalex.org/W2963143606","https://openalex.org/W2963518342","https://openalex.org/W2963650529","https://openalex.org/W2969047925","https://openalex.org/W2972771158","https://openalex.org/W2981707695","https://openalex.org/W2982147439","https://openalex.org/W3020712669","https://openalex.org/W3090098073","https://openalex.org/W3096492486","https://openalex.org/W3100307207","https://openalex.org/W3100749323","https://openalex.org/W4293584584"],"related_works":["https://openalex.org/W2074502265","https://openalex.org/W4214877189","https://openalex.org/W2773965352","https://openalex.org/W2381179799","https://openalex.org/W2980279061","https://openalex.org/W2334685461","https://openalex.org/W2366718574","https://openalex.org/W2359774528","https://openalex.org/W4298312966","https://openalex.org/W2325697621"],"abstract_inverted_index":{"Understanding":[0],"complex":[1],"visual":[2,26,87],"scenes":[3],"is":[4,17,118,130,161],"one":[5],"of":[6,24,32,38,64,89,115,126,150,167,187],"fundamental":[7],"problems":[8],"in":[9,14,107,143,173],"computer":[10],"vision,":[11],"but":[12],"learning":[13,62,86],"this":[15,78,171],"domain":[16],"challenging":[18],"due":[19],"to":[20,42,69,74,132,135,163],"the":[21,25,29,39,59,148,154,165,168,175],"inherent":[22],"richness":[23],"world":[27],"and":[28,52,66,96,129,177],"vast":[30],"number":[31,125],"possible":[33],"scene":[34,43],"configurations.":[35,145],"Current":[36],"state":[37,166],"art":[40,169],"approaches":[41],"understanding":[44],"often":[45],"employ":[46],"deep":[47],"networks":[48],"which":[49],"require":[50],"large":[51],"densely":[53],"annotated":[54],"datasets.":[55],"This":[56],"goes":[57],"against":[58],"seemingly":[60],"intuitive":[61],"abilities":[63],"humans":[65],"our":[67,116,151],"ability":[68],"generalise":[70],"from":[71],"few":[72],"examples":[73],"unseen":[75,136],"situations.":[76],"In":[77],"paper,":[79],"we":[80],"propose":[81],"a":[82,108,123,183],"unified":[83,110],"framework":[84],"for":[85],"representation":[88],"words":[90],"denoting":[91],"attributes":[92],"such":[93,98,138],"as":[94,99,139],"\u201cblue\u201d":[95],"relations":[97,142],"\u201cleft":[100],"of\u201d":[101],"based":[102],"on":[103,153,170,182],"Gaussian":[104],"models":[105],"operating":[106],"simple,":[109],"feature":[111],"space.":[112],"The":[113],"strength":[114],"model":[117,152,160],"that":[119],"it":[120],"only":[121],"requires":[122],"small":[124],"weak":[127],"annotations":[128],"able":[131,162],"generalize":[133],"easily":[134],"situations":[137],"recognizing":[140],"object":[141],"unusual":[144],"We":[146],"demonstrate":[147],"effectiveness":[149],"pr":[155],"edicate":[156],"detection":[157],"task.":[158],"Our":[159],"outperform":[164],"task":[172],"both":[174],"normal":[176],"zero-shot":[178],"scenarios,":[179],"while":[180],"training":[181],"dataset":[184],"an":[185],"order":[186],"magnitude":[188],"smaller.":[189],"(Less)":[190]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
