{"id":"https://openalex.org/W2101818040","doi":"https://doi.org/10.1145/1647314.1647369","title":"Grounding spatial prepositions for video search","display_name":"Grounding spatial prepositions for video search","publication_year":2009,"publication_date":"2009-11-02","ids":{"openalex":"https://openalex.org/W2101818040","doi":"https://doi.org/10.1145/1647314.1647369","mag":"2101818040"},"language":"en","primary_location":{"id":"doi:10.1145/1647314.1647369","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1647314.1647369","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2009 international conference on Multimodal interfaces","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://hdl.handle.net/1721.1/65868","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5059273574","display_name":"Stefanie Tellex","orcid":"https://orcid.org/0000-0002-2905-4075"},"institutions":[{"id":"https://openalex.org/I4210142372","display_name":"Human Media","ror":"https://ror.org/04072nk43","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I4210142372"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Stefanie Tellex","raw_affiliation_strings":["MIT Media Lab, Cambridge, MA, USA"],"affiliations":[{"raw_affiliation_string":"MIT Media Lab, Cambridge, MA, USA","institution_ids":["https://openalex.org/I4210142372"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5004281470","display_name":"Deb Roy","orcid":"https://orcid.org/0000-0002-2780-4768"},"institutions":[{"id":"https://openalex.org/I4210142372","display_name":"Human Media","ror":"https://ror.org/04072nk43","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I4210142372"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Deb Roy","raw_affiliation_strings":["MIT Media Lab, Cambridge, MA, USA"],"affiliations":[{"raw_affiliation_string":"MIT Media Lab, Cambridge, MA, USA","institution_ids":["https://openalex.org/I4210142372"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5059273574"],"corresponding_institution_ids":["https://openalex.org/I4210142372"],"apc_list":null,"apc_paid":null,"fwci":2.2963,"has_fulltext":false,"cited_by_count":14,"citation_normalized_percentile":{"value":0.89554014,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"253","last_page":"260"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9943000078201294,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9864000082015991,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8545875549316406},{"id":"https://openalex.org/keywords/clips","display_name":"CLIPS","score":0.790229320526123},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.6678531169891357},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.569443941116333},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5390177965164185},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.5115512013435364},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4950372278690338},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.47209876775741577},{"id":"https://openalex.org/keywords/meaning","display_name":"Meaning (existential)","score":0.4629005193710327},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.45797890424728394},{"id":"https://openalex.org/keywords/natural-language-user-interface","display_name":"Natural language user interface","score":0.44023704528808594}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8545875549316406},{"id":"https://openalex.org/C2778739407","wikidata":"https://www.wikidata.org/wiki/Q165372","display_name":"CLIPS","level":2,"score":0.790229320526123},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.6678531169891357},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.569443941116333},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5390177965164185},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.5115512013435364},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4950372278690338},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.47209876775741577},{"id":"https://openalex.org/C2780876879","wikidata":"https://www.wikidata.org/wiki/Q3054749","display_name":"Meaning (existential)","level":2,"score":0.4629005193710327},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.45797890424728394},{"id":"https://openalex.org/C174252522","wikidata":"https://www.wikidata.org/wiki/Q3816772","display_name":"Natural language user interface","level":3,"score":0.44023704528808594},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C542102704","wikidata":"https://www.wikidata.org/wiki/Q183257","display_name":"Psychotherapist","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1145/1647314.1647369","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1647314.1647369","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2009 international conference on Multimodal interfaces","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.148.2939","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.148.2939","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.media.mit.edu/cogmac/publications/stefie10-icmi2009-2.pdf","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.151.2342","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.151.2342","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://web.media.mit.edu/~dkroy/papers/pdf/stefie10-icmi2009.pdf","raw_type":"text"},{"id":"pmh:oai:dspace.mit.edu:1721.1/65868","is_oa":true,"landing_page_url":"http://hdl.handle.net/1721.1/65868","pdf_url":null,"source":{"id":"https://openalex.org/S4306400425","display_name":"DSpace@MIT (Massachusetts Institute of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I63966007","host_organization_name":"Massachusetts Institute of Technology","host_organization_lineage":["https://openalex.org/I63966007"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"MIT web domain","raw_type":"http://purl.org/eprint/type/ConferencePaper"}],"best_oa_location":{"id":"pmh:oai:dspace.mit.edu:1721.1/65868","is_oa":true,"landing_page_url":"http://hdl.handle.net/1721.1/65868","pdf_url":null,"source":{"id":"https://openalex.org/S4306400425","display_name":"DSpace@MIT (Massachusetts Institute of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I63966007","host_organization_name":"Massachusetts Institute of Technology","host_organization_lineage":["https://openalex.org/I63966007"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"MIT web domain","raw_type":"http://purl.org/eprint/type/ConferencePaper"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.7900000214576721,"display_name":"Quality Education"}],"awards":[{"id":"https://openalex.org/G5767131270","display_name":null,"funder_award_id":"MURI N00014-07-1-0749","funder_id":"https://openalex.org/F4320337345","funder_display_name":"Office of Naval Research"},{"id":"https://openalex.org/G8876996369","display_name":null,"funder_award_id":"N00014","funder_id":"https://openalex.org/F4320337345","funder_display_name":"Office of Naval Research"}],"funders":[{"id":"https://openalex.org/F4320333591","display_name":"Multidisciplinary University Research Initiative","ror":null},{"id":"https://openalex.org/F4320337345","display_name":"Office of Naval Research","ror":"https://ror.org/00rk2pe57"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W172019652","https://openalex.org/W1239985160","https://openalex.org/W1548185736","https://openalex.org/W1576271470","https://openalex.org/W1964338286","https://openalex.org/W1987038030","https://openalex.org/W2009973286","https://openalex.org/W2014687206","https://openalex.org/W2020549735","https://openalex.org/W2021121433","https://openalex.org/W2032846947","https://openalex.org/W2039561763","https://openalex.org/W2060599709","https://openalex.org/W2061997612","https://openalex.org/W2089150756","https://openalex.org/W2099604484","https://openalex.org/W2101906254","https://openalex.org/W2111644456","https://openalex.org/W2121458419","https://openalex.org/W2123987305","https://openalex.org/W2132195693","https://openalex.org/W2147191817","https://openalex.org/W2148613815","https://openalex.org/W2167851108","https://openalex.org/W2474463024","https://openalex.org/W2481295655","https://openalex.org/W2492390975","https://openalex.org/W2528951757","https://openalex.org/W6634526646","https://openalex.org/W6723158049"],"related_works":["https://openalex.org/W2112751186","https://openalex.org/W1968262010","https://openalex.org/W3036268427","https://openalex.org/W3158218201","https://openalex.org/W1550490297","https://openalex.org/W2605168037","https://openalex.org/W2401646948","https://openalex.org/W3134925693","https://openalex.org/W2099417110","https://openalex.org/W2032694873"],"abstract_inverted_index":{"Spatial":[0],"language":[1,20,31,91,103,116,153],"video":[2,44,82,111,154],"retrieval":[3,155],"is":[4],"an":[5],"important":[6],"real-world":[7],"problem":[8],"that":[9,34,41,50,74,157],"forms":[10],"a":[11,52,57,70,81,89,99,151],"test":[12,127],"bed":[13],"for":[14,18,59,129],"evaluating":[15],"semantic":[16],"structures":[17,40],"natural":[19,30,90,102],"descriptions":[21,104],"of":[22,63,72,101,108,132],"motion":[23,107],"on":[24,43,85],"naturalistic":[25],"data.":[26],"Video":[27],"search":[28],"by":[29],"query":[32],"requires":[33],"linguistic":[35],"input":[36],"be":[37,76,147],"converted":[38],"into":[39],"operate":[42],"in":[45,66,110,118],"order":[46],"to":[47,78,124,149],"find":[48],"clips":[49,159],"match":[51],"query.":[53,92],"This":[54],"paper":[55],"describes":[56],"framework":[58],"grounding":[60],"the":[61,106,115,119,130,133,165],"meaning":[62],"spatial":[64,134,152],"prepositions":[65,135],"video.":[67],"We":[68,113],"present":[69],"library":[71],"features":[73],"can":[75,146],"used":[77,117,148],"automatically":[79],"classify":[80],"clip":[83],"based":[84],"whether":[86],"it":[87,123],"matches":[88],"To":[93],"evaluate":[94],"these":[95],"features,":[96],"we":[97],"collected":[98],"corpus":[100],"about":[105],"people":[109],"clips.":[112],"characterize":[114],"corpus,":[120],"and":[121,126,142],"use":[122],"train":[125],"models":[128],"meanings":[131],"\"to,\"":[136],"\"across,\"":[137],"\"through,\"":[138],"\"out,\"":[139],"\"along,\"":[140],"\"towards,\"":[141],"\"around.\"":[143],"The":[144],"classifiers":[145],"build":[150],"system":[156],"finds":[158],"matching":[160],"queries":[161],"such":[162],"as":[163],"\"across":[164],"kitchen.\"":[166]},"counts_by_year":[{"year":2022,"cited_by_count":2},{"year":2020,"cited_by_count":1},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":1},{"year":2013,"cited_by_count":1},{"year":2012,"cited_by_count":1}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
