{"id":"https://openalex.org/W2134455794","doi":"https://doi.org/10.1109/cvpr.2007.383223","title":"Multi-modal Clustering for Multimedia Collections","display_name":"Multi-modal Clustering for Multimedia Collections","publication_year":2007,"publication_date":"2007-06-01","ids":{"openalex":"https://openalex.org/W2134455794","doi":"https://doi.org/10.1109/cvpr.2007.383223","mag":"2134455794"},"language":"en","primary_location":{"id":"doi:10.1109/cvpr.2007.383223","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvpr.2007.383223","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2007 IEEE Conference on Computer Vision and Pattern Recognition","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5005515091","display_name":"Ron Bekkerman","orcid":"https://orcid.org/0000-0001-5636-694X"},"institutions":[{"id":"https://openalex.org/I24603500","display_name":"University of Massachusetts Amherst","ror":"https://ror.org/0072zz521","country_code":"US","type":"education","lineage":["https://openalex.org/I24603500"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Ron Bekkerman","raw_affiliation_strings":["Center for Intelligent Information Retrieval, University of Massachusetts, Amherst, USA","University of Massachusetts: Amherst#TAB#"],"affiliations":[{"raw_affiliation_string":"Center for Intelligent Information Retrieval, University of Massachusetts, Amherst, USA","institution_ids":["https://openalex.org/I24603500"]},{"raw_affiliation_string":"University of Massachusetts: Amherst#TAB#","institution_ids":["https://openalex.org/I24603500"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5023139653","display_name":"Jiwoon Jeon","orcid":"https://orcid.org/0009-0001-1493-4408"},"institutions":[{"id":"https://openalex.org/I24603500","display_name":"University of Massachusetts Amherst","ror":"https://ror.org/0072zz521","country_code":"US","type":"education","lineage":["https://openalex.org/I24603500"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jiwoon Jeon","raw_affiliation_strings":["Center for Intelligent Information Retrieval, University of Massachusetts, Amherst, USA","University of Massachusetts: Amherst#TAB#"],"affiliations":[{"raw_affiliation_string":"Center for Intelligent Information Retrieval, University of Massachusetts, Amherst, USA","institution_ids":["https://openalex.org/I24603500"]},{"raw_affiliation_string":"University of Massachusetts: Amherst#TAB#","institution_ids":["https://openalex.org/I24603500"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5005515091"],"corresponding_institution_ids":["https://openalex.org/I24603500"],"apc_list":null,"apc_paid":null,"fwci":3.8948,"has_fulltext":false,"cited_by_count":76,"citation_normalized_percentile":{"value":0.93956174,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8293026685714722},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.6151440739631653},{"id":"https://openalex.org/keywords/flexibility","display_name":"Flexibility (engineering)","score":0.5910431742668152},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.5902114510536194},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.5739102363586426},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4989793300628662},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.4860968589782715},{"id":"https://openalex.org/keywords/markov-random-field","display_name":"Markov random field","score":0.4746946692466736},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4742114841938019},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.4570690393447876},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4308062195777893},{"id":"https://openalex.org/keywords/histogram","display_name":"Histogram","score":0.421661376953125},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3675881624221802},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.2395378053188324},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.1483522653579712}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8293026685714722},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.6151440739631653},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.5910431742668152},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.5902114510536194},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.5739102363586426},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4989793300628662},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.4860968589782715},{"id":"https://openalex.org/C2778045648","wikidata":"https://www.wikidata.org/wiki/Q176827","display_name":"Markov random field","level":4,"score":0.4746946692466736},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4742114841938019},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.4570690393447876},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4308062195777893},{"id":"https://openalex.org/C53533937","wikidata":"https://www.wikidata.org/wiki/Q185020","display_name":"Histogram","level":3,"score":0.421661376953125},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3675881624221802},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.2395378053188324},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.1483522653579712},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cvpr.2007.383223","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvpr.2007.383223","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2007 IEEE Conference on Computer Vision and Pattern Recognition","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320332180","display_name":"Defense Advanced Research Projects Agency","ror":"https://ror.org/02caytj08"},{"id":"https://openalex.org/F4320332815","display_name":"Advanced Research Projects Agency","ror":"https://ror.org/02caytj08"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W98391849","https://openalex.org/W1498355188","https://openalex.org/W1544067897","https://openalex.org/W1666447063","https://openalex.org/W1686946872","https://openalex.org/W1934863104","https://openalex.org/W1964937891","https://openalex.org/W1966957716","https://openalex.org/W2111048828","https://openalex.org/W2114220616","https://openalex.org/W2117848638","https://openalex.org/W2125323310","https://openalex.org/W2133576408","https://openalex.org/W2137918516","https://openalex.org/W2152818382","https://openalex.org/W2156336347","https://openalex.org/W2156919418","https://openalex.org/W2162491758","https://openalex.org/W2283195891","https://openalex.org/W2293605478","https://openalex.org/W2979454998","https://openalex.org/W6603954642","https://openalex.org/W6637108112","https://openalex.org/W6637249095","https://openalex.org/W6677388911","https://openalex.org/W6682532325"],"related_works":["https://openalex.org/W17155033","https://openalex.org/W3207760230","https://openalex.org/W1496222301","https://openalex.org/W4312814274","https://openalex.org/W1590307681","https://openalex.org/W2536018345","https://openalex.org/W4285370786","https://openalex.org/W2296488620","https://openalex.org/W2358353312","https://openalex.org/W2353836703"],"abstract_inverted_index":{"Most":[0],"of":[1,33,59,70,104,119,147,167,178],"the":[2,30,49,55,77,96,148,179],"online":[3],"multimedia":[4,34,60],"collections,":[5],"such":[6],"as":[7],"picture":[8,83],"galleries":[9],"or":[10,67],"video":[11],"archives,":[12],"are":[13,87,112],"categorized":[14],"in":[15,82,132],"a":[16,92,144,165,198],"fully":[17],"manual":[18],"process,":[19],"which":[20,71,136],"is":[21,143],"very":[22],"expensive":[23],"and":[24,116,170],"may":[25],"soon":[26],"be":[27],"infeasible":[28],"with":[29,197],"rapid":[31],"growth":[32],"repositories.":[35],"In":[36],"this":[37,46],"paper,":[38],"we":[39],"present":[40],"an":[41,161,172],"effective":[42],"method":[43],"for":[44,175],"automating":[45],"process":[47],"within":[48],"unsupervised":[50],"learning":[51],"framework.":[52],"We":[53,156],"exploit":[54],"truly":[56],"multi-modal":[57,133],"nature":[58],"collections":[61],"-":[62],"they":[63],"have":[64],"multiple":[65],"views,":[66],"modalities,":[68],"each":[69],"contributes":[72],"its":[73],"own":[74],"perspective":[75],"to":[76,159],"collection's":[78],"organization.":[79],"For":[80],"example,":[81],"galleries,":[84],"image":[85,188],"captions":[86],"often":[88],"provided":[89],"that":[90],"form":[91,107],"separate":[93],"view":[94],"on":[95,185],"collection.":[97],"Color":[98],"histograms":[99],"(or":[100],"any":[101],"other":[102,117],"set":[103],"global":[105],"features)":[106],"another":[108],"view.":[109],"Additional":[110],"views":[111,131],"blobs,":[113],"interest":[114],"points":[115],"sets":[118],"local":[120],"features.":[121],"Our":[122],"model,":[123],"called":[124],"Comraf*":[125,142,168,181],"(pronounced":[126],"Comraf-Star),":[127],"efficiently":[128],"incorporates":[129],"various":[130],"clustering,":[134],"by":[135],"it":[137,190],"allows":[138],"great":[139],"modeling":[140],"flexibility.":[141],"light-weight":[145],"version":[146],"recently":[149],"introduced":[150],"combinatorial":[151],"Markov":[152],"random":[153],"field":[154],"(Comraf).":[155],"show":[157],"how":[158],"translate":[160],"arbitrary":[162],"Comraf":[163],"into":[164],"series":[166],"models,":[169],"give":[171],"empirical":[173],"evidence":[174],"comparable":[176],"effectiveness":[177],"two.":[180],"demonstrates":[182],"excellent":[183],"results":[184],"two":[186],"real-world":[187],"galleries:":[189],"obtains":[191],"2.5-3":[192],"times":[193],"higher":[194],"accuracy":[195],"compared":[196],"uni-modal":[199],"k-means.":[200]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2021,"cited_by_count":2},{"year":2019,"cited_by_count":5},{"year":2018,"cited_by_count":2},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":5},{"year":2015,"cited_by_count":10},{"year":2014,"cited_by_count":7},{"year":2013,"cited_by_count":12},{"year":2012,"cited_by_count":9}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
