{"id":"https://openalex.org/W2742295456","doi":"https://doi.org/10.1109/bigdata.2017.8258016","title":"Fishing in the stream: Similarity search over endless data","display_name":"Fishing in the stream: Similarity search over endless data","publication_year":2017,"publication_date":"2017-12-01","ids":{"openalex":"https://openalex.org/W2742295456","doi":"https://doi.org/10.1109/bigdata.2017.8258016","mag":"2742295456"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata.2017.8258016","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata.2017.8258016","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/1708.02062","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5109890838","display_name":"Naama Kraus","orcid":null},"institutions":[{"id":"https://openalex.org/I174306211","display_name":"Technion \u2013 Israel Institute of Technology","ror":"https://ror.org/03qryx823","country_code":"IL","type":"education","lineage":["https://openalex.org/I174306211"]}],"countries":["IL"],"is_corresponding":true,"raw_author_name":"Naama Kraus","raw_affiliation_strings":["Technion IIT, Haifa, Israel","Technion-IIT, Haifa, Israel"],"affiliations":[{"raw_affiliation_string":"Technion IIT, Haifa, Israel","institution_ids":["https://openalex.org/I174306211"]},{"raw_affiliation_string":"Technion-IIT, Haifa, Israel","institution_ids":["https://openalex.org/I174306211"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103324615","display_name":"David Carmel","orcid":"https://orcid.org/0000-0003-1161-7084"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"David Carmel","raw_affiliation_strings":["Yahoo Research, Haifa, Israel","Yahoo! research, Haifa, Israel"],"affiliations":[{"raw_affiliation_string":"Yahoo Research, Haifa, Israel","institution_ids":[]},{"raw_affiliation_string":"Yahoo! research, Haifa, Israel","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5059238786","display_name":"Idit Keidar","orcid":"https://orcid.org/0000-0002-6417-1250"},"institutions":[{"id":"https://openalex.org/I174306211","display_name":"Technion \u2013 Israel Institute of Technology","ror":"https://ror.org/03qryx823","country_code":"IL","type":"education","lineage":["https://openalex.org/I174306211"]}],"countries":["IL"],"is_corresponding":false,"raw_author_name":"Idit Keidar","raw_affiliation_strings":["Technion IIT and Yahoo Research, Haifa, Israel"],"affiliations":[{"raw_affiliation_string":"Technion IIT and Yahoo Research, Haifa, Israel","institution_ids":["https://openalex.org/I174306211"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5109890838"],"corresponding_institution_ids":["https://openalex.org/I174306211"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.10010648,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"964","last_page":"969"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7261789441108704},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.6971930861473083},{"id":"https://openalex.org/keywords/nearest-neighbor-search","display_name":"Nearest neighbor search","score":0.6423842906951904},{"id":"https://openalex.org/keywords/data-stream","display_name":"Data stream","score":0.6379013657569885},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5617496967315674},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5356853008270264},{"id":"https://openalex.org/keywords/index","display_name":"Index (typography)","score":0.5305963754653931},{"id":"https://openalex.org/keywords/popularity","display_name":"Popularity","score":0.4741484522819519},{"id":"https://openalex.org/keywords/data-stream-mining","display_name":"Data stream mining","score":0.4531453549861908},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.4478864073753357},{"id":"https://openalex.org/keywords/bounded-function","display_name":"Bounded function","score":0.43512266874313354},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.43357178568840027},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.21127614378929138},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.15836963057518005},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.12052622437477112},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.07414931058883667}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7261789441108704},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.6971930861473083},{"id":"https://openalex.org/C116738811","wikidata":"https://www.wikidata.org/wiki/Q608751","display_name":"Nearest neighbor search","level":2,"score":0.6423842906951904},{"id":"https://openalex.org/C2778484313","wikidata":"https://www.wikidata.org/wiki/Q1172540","display_name":"Data stream","level":2,"score":0.6379013657569885},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5617496967315674},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5356853008270264},{"id":"https://openalex.org/C2777382242","wikidata":"https://www.wikidata.org/wiki/Q6017816","display_name":"Index (typography)","level":2,"score":0.5305963754653931},{"id":"https://openalex.org/C2780586970","wikidata":"https://www.wikidata.org/wiki/Q1357284","display_name":"Popularity","level":2,"score":0.4741484522819519},{"id":"https://openalex.org/C89198739","wikidata":"https://www.wikidata.org/wiki/Q3079880","display_name":"Data stream mining","level":2,"score":0.4531453549861908},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.4478864073753357},{"id":"https://openalex.org/C34388435","wikidata":"https://www.wikidata.org/wiki/Q2267362","display_name":"Bounded function","level":2,"score":0.43512266874313354},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.43357178568840027},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.21127614378929138},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.15836963057518005},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.12052622437477112},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.07414931058883667},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/bigdata.2017.8258016","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata.2017.8258016","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:1708.02062","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1708.02062","pdf_url":"https://arxiv.org/pdf/1708.02062","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"mag:2742295456","is_oa":true,"landing_page_url":"https://arxiv.org/pdf/1708.02062.pdf","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"doi:10.48550/arxiv.1708.02062","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.1708.02062","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:1708.02062","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1708.02062","pdf_url":"https://arxiv.org/pdf/1708.02062","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/14","display_name":"Life below water","score":0.7900000214576721}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2742295456.pdf","grobid_xml":"https://content.openalex.org/works/W2742295456.grobid-xml"},"referenced_works_count":48,"referenced_works":["https://openalex.org/W642889137","https://openalex.org/W1502916507","https://openalex.org/W1541459201","https://openalex.org/W1602639018","https://openalex.org/W1984270672","https://openalex.org/W1987700483","https://openalex.org/W1995672491","https://openalex.org/W2012833704","https://openalex.org/W2020498246","https://openalex.org/W2037858832","https://openalex.org/W2055483934","https://openalex.org/W2071080574","https://openalex.org/W2071572981","https://openalex.org/W2076538837","https://openalex.org/W2079825698","https://openalex.org/W2081798681","https://openalex.org/W2101196063","https://openalex.org/W2102428892","https://openalex.org/W2107427524","https://openalex.org/W2110443819","https://openalex.org/W2112056172","https://openalex.org/W2123427850","https://openalex.org/W2125671345","https://openalex.org/W2140427797","https://openalex.org/W2140942692","https://openalex.org/W2144265691","https://openalex.org/W2147717514","https://openalex.org/W2153111836","https://openalex.org/W2160306106","https://openalex.org/W2164986850","https://openalex.org/W2171960770","https://openalex.org/W2222139048","https://openalex.org/W2225766585","https://openalex.org/W2238991082","https://openalex.org/W2251406078","https://openalex.org/W2271423210","https://openalex.org/W2296107147","https://openalex.org/W2346507211","https://openalex.org/W2441844958","https://openalex.org/W2949637668","https://openalex.org/W4230940751","https://openalex.org/W4250011483","https://openalex.org/W4285719527","https://openalex.org/W4300601563","https://openalex.org/W6629956336","https://openalex.org/W6664416897","https://openalex.org/W6688738766","https://openalex.org/W6844342457"],"related_works":["https://openalex.org/W2760646669","https://openalex.org/W646176396","https://openalex.org/W2125999281","https://openalex.org/W2564445937","https://openalex.org/W2051759953","https://openalex.org/W2897779003","https://openalex.org/W2009278541","https://openalex.org/W2151220608","https://openalex.org/W2520508208","https://openalex.org/W2507179043","https://openalex.org/W2075902498","https://openalex.org/W2111138483","https://openalex.org/W2980401592","https://openalex.org/W2080677175","https://openalex.org/W1981919843","https://openalex.org/W2612205558","https://openalex.org/W1992833820","https://openalex.org/W2613277090","https://openalex.org/W2144586885","https://openalex.org/W3124993569"],"abstract_inverted_index":{"Similarity":[0],"search":[1,26],"is":[2,45],"the":[3,21,68,89,100],"task":[4],"of":[5,24],"retrieving":[6],"data":[7,35],"items":[8,73,94],"that":[9,66,86],"are":[10,57],"similar":[11,93],"to":[12,42,50,75,91,96],"a":[13,62],"given":[14],"query.":[15],"In":[16],"this":[17],"paper,":[18],"we":[19],"introduce":[20],"time-sensitive":[22],"notion":[23],"similarity":[25],"over":[27],"endless":[28],"data-streams":[29],"(SSDS),":[30],"which":[31,115],"takes":[32],"into":[33],"account":[34],"quality":[36],"and":[37,79],"temporal":[38],"characteristics":[39],"in":[40],"addition":[41],"similarity.":[43],"SSDS":[44,64],"challenging":[46],"as":[47],"it":[48],"needs":[49],"process":[51],"unbounded":[52],"data,":[53],"while":[54],"computation":[55],"resources":[56],"bounded.":[58],"We":[59,83,104],"propose":[60],"Stream-LSH,":[61],"randomized":[63],"algorithm":[65],"bounds":[67],"index":[69],"size":[70],"by":[71],"retaining":[72],"according":[74],"their":[76],"freshness,":[77],"quality,":[78],"dynamic":[80],"popularity":[81],"attributes.":[82],"analytically":[84],"show":[85],"Stream-LSH":[87],"increases":[88],"probability":[90],"find":[92],"compared":[95],"alternative":[97],"approaches":[98],"using":[99,110],"same":[101],"space":[102],"capacity.":[103],"further":[105],"conduct":[106],"an":[107],"empirical":[108],"study":[109],"real":[111],"world":[112],"stream":[113],"datasets,":[114],"confirms":[116],"our":[117],"theoretical":[118],"results.":[119]},"counts_by_year":[],"updated_date":"2026-02-09T09:26:11.010843","created_date":"2025-10-10T00:00:00"}
