{"id":"https://openalex.org/W2782583648","doi":"https://doi.org/10.1109/bigdata.2017.8257970","title":"High-performance geometric algorithms for sparse computation in big data analytics","display_name":"High-performance geometric algorithms for sparse computation in big data analytics","publication_year":2017,"publication_date":"2017-12-01","ids":{"openalex":"https://openalex.org/W2782583648","doi":"https://doi.org/10.1109/bigdata.2017.8257970","mag":"2782583648"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata.2017.8257970","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata.2017.8257970","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5072687277","display_name":"Philipp Baumann","orcid":"https://orcid.org/0000-0002-3286-4474"},"institutions":[{"id":"https://openalex.org/I118564535","display_name":"University of Bern","ror":"https://ror.org/02k7v4d05","country_code":"CH","type":"education","lineage":["https://openalex.org/I118564535"]}],"countries":["CH"],"is_corresponding":true,"raw_author_name":"Philipp Baumann","raw_affiliation_strings":["Department of Business Administration, University of Bern, Switzerland"],"affiliations":[{"raw_affiliation_string":"Department of Business Administration, University of Bern, Switzerland","institution_ids":["https://openalex.org/I118564535"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085640376","display_name":"Dorit S. Hochbaum","orcid":"https://orcid.org/0000-0002-2498-0512"},"institutions":[{"id":"https://openalex.org/I95457486","display_name":"University of California, Berkeley","ror":"https://ror.org/01an7q238","country_code":"US","type":"education","lineage":["https://openalex.org/I95457486"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Dorit S. Hochbaum","raw_affiliation_strings":["IEOR Department, University of California, Berkeley, USA"],"affiliations":[{"raw_affiliation_string":"IEOR Department, University of California, Berkeley, USA","institution_ids":["https://openalex.org/I95457486"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5032198398","display_name":"Quico Spaen","orcid":"https://orcid.org/0000-0003-2788-1904"},"institutions":[{"id":"https://openalex.org/I95457486","display_name":"University of California, Berkeley","ror":"https://ror.org/01an7q238","country_code":"US","type":"education","lineage":["https://openalex.org/I95457486"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Quico Spaen","raw_affiliation_strings":["IEOR Department, University of California, Berkeley, USA"],"affiliations":[{"raw_affiliation_string":"IEOR Department, University of California, Berkeley, USA","institution_ids":["https://openalex.org/I95457486"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5072687277"],"corresponding_institution_ids":["https://openalex.org/I118564535"],"apc_list":null,"apc_paid":null,"fwci":0.7462,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.73247974,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":96},"biblio":{"volume":"6","issue":null,"first_page":"546","last_page":"555"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11596","display_name":"Constraint Satisfaction and Optimization","score":0.9954000115394592,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6503701210021973},{"id":"https://openalex.org/keywords/pairwise-comparison","display_name":"Pairwise comparison","score":0.5978167653083801},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.5920006036758423},{"id":"https://openalex.org/keywords/python","display_name":"Python (programming language)","score":0.5548306703567505},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.4747132360935211},{"id":"https://openalex.org/keywords/enumeration","display_name":"Enumeration","score":0.4716041684150696},{"id":"https://openalex.org/keywords/data-structure","display_name":"Data structure","score":0.4555046558380127},{"id":"https://openalex.org/keywords/grid","display_name":"Grid","score":0.4411747455596924},{"id":"https://openalex.org/keywords/nearest-neighbor-search","display_name":"Nearest neighbor search","score":0.4245951175689697},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.39927056431770325},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.2659037411212921},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.22643664479255676},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.21983042359352112}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6503701210021973},{"id":"https://openalex.org/C184898388","wikidata":"https://www.wikidata.org/wiki/Q1435712","display_name":"Pairwise comparison","level":2,"score":0.5978167653083801},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.5920006036758423},{"id":"https://openalex.org/C519991488","wikidata":"https://www.wikidata.org/wiki/Q28865","display_name":"Python (programming language)","level":2,"score":0.5548306703567505},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4747132360935211},{"id":"https://openalex.org/C156340839","wikidata":"https://www.wikidata.org/wiki/Q2704791","display_name":"Enumeration","level":2,"score":0.4716041684150696},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.4555046558380127},{"id":"https://openalex.org/C187691185","wikidata":"https://www.wikidata.org/wiki/Q2020720","display_name":"Grid","level":2,"score":0.4411747455596924},{"id":"https://openalex.org/C116738811","wikidata":"https://www.wikidata.org/wiki/Q608751","display_name":"Nearest neighbor search","level":2,"score":0.4245951175689697},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.39927056431770325},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2659037411212921},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.22643664479255676},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.21983042359352112},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/bigdata.2017.8257970","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata.2017.8257970","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"},{"id":"pmh:oai:boris.unibe.ch:111909","is_oa":false,"landing_page_url":"https://boris.unibe.ch/111909/","pdf_url":null,"source":{"id":"https://openalex.org/S4306401086","display_name":"Bern Open Repository and Information System (University of Bern)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I118564535","host_organization_name":"University of Bern","host_organization_lineage":["https://openalex.org/I118564535"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Baumann, Philipp; Hochbaum, Dorit S.; Spaen, Quico (11 December 2017). High-performance geometric algorithms for sparse computation in big data analytics. In: Proceedings of the 2017 IEEE International Conference on Big Data. Boston. 11.-14.12.2017. 10.1109/BigData.2017.8257970 &lt;http://dx.doi.org/10.1109/BigData.2017.8257970&gt;","raw_type":"info:eu-repo/semantics/conferenceObject"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W1559060276","https://openalex.org/W1581656968","https://openalex.org/W1621799579","https://openalex.org/W1909224475","https://openalex.org/W2011529808","https://openalex.org/W2015627422","https://openalex.org/W2021404082","https://openalex.org/W2095885101","https://openalex.org/W2122792499","https://openalex.org/W2129575457","https://openalex.org/W2145065594","https://openalex.org/W2147758638","https://openalex.org/W2155319834","https://openalex.org/W2162006472","https://openalex.org/W2165558283","https://openalex.org/W2343765202","https://openalex.org/W2419180118","https://openalex.org/W2564022854","https://openalex.org/W2768149277","https://openalex.org/W2883966112","https://openalex.org/W3105014772","https://openalex.org/W3120740533","https://openalex.org/W4239510810","https://openalex.org/W4247777826","https://openalex.org/W4297795643","https://openalex.org/W6633301734","https://openalex.org/W6683152347","https://openalex.org/W6753046870"],"related_works":["https://openalex.org/W108845024","https://openalex.org/W57712237","https://openalex.org/W2578985712","https://openalex.org/W4300125793","https://openalex.org/W2406961474","https://openalex.org/W2143566611","https://openalex.org/W2013740965","https://openalex.org/W588267724","https://openalex.org/W2952598754","https://openalex.org/W4386291436"],"abstract_inverted_index":{"Several":[0],"leading":[1],"supervised":[2],"and":[3,120,229],"unsupervised":[4],"machine":[5],"learning":[6],"algorithms":[7,189,214,222,239],"require":[8],"as":[9,153,155],"input":[10],"similarities":[11,23,41,61,99],"between":[12],"objects":[13,91,122,140,209],"in":[14,94,103,127,219,225],"a":[15,79,83,144,216],"data":[16,31,44,77,167,202],"set.":[17],"Since":[18],"the":[19,27,30,59,69,76,89,104,114,128,177,192,212,237],"number":[20],"of":[21,29,50,63,139,179,181,236],"pairwise":[22,40,65],"grows":[24],"quadratically":[25],"with":[26,204],"size":[28],"set,":[32],"it":[33],"is":[34,85],"computationally":[35],"prohibitive":[36],"to":[37,176,194,206],"compute":[38],"all":[39,64,137],"for":[42],"large-scale":[43,226],"sets.":[45],"The":[46,97,221],"recently":[47],"introduced":[48],"methodology":[49],"\u201csparse":[51],"computation\u201d":[52],"resolves":[53],"this":[54,95,162],"issue":[55],"by":[56,112],"computing":[57],"only":[58],"relevant":[60,70,87,98],"instead":[62],"similarities.":[66],"To":[67],"identify":[68],"similarities,":[71],"sparse":[72,169],"computation":[73,108,170],"efficiently":[74],"projects":[75],"onto":[78],"low-dimensional":[80,115],"space":[81,116],"where":[82],"similarity":[84],"considered":[86],"if":[88,124],"corresponding":[90],"are":[92,100,142,151,159,240],"close":[93,110,123],"space.":[96,106],"then":[101],"computed":[102],"original":[105],"Sparse":[107],"identifies":[109],"pairs":[111,138,157,180],"partitioning":[113],"into":[117],"grid":[118,132],"blocks,":[119],"considering":[121],"they":[125],"fall":[126],"same":[129],"or":[130],"adjacent":[131,182,196],"blocks.":[133,183,197],"This":[134],"guarantees":[135],"that":[136,141,158,190,211],"within":[143,160],"specified":[145],"L":[146],"<sub":[147],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[148],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">\u221e</sub>":[149],"distance":[150],"identified":[152],"well":[154],"some":[156],"twice":[161],"distance.":[163],"For":[164],"very":[165],"large":[166],"sets,":[168],"can":[171],"have":[172,223],"high":[173],"runtime":[174],"due":[175],"enumeration":[178],"We":[184],"propose":[185],"here":[186],"new":[187,213],"geometric":[188],"eliminate":[191],"need":[193],"enumerate":[195],"Our":[198],"empirical":[199],"results":[200],"on":[201],"sets":[203],"up":[205],"10":[207],"million":[208],"show":[210],"achieve":[215],"significant":[217],"reduction":[218],"runtime.":[220],"applications":[224],"computational":[227],"geometry":[228],"(approximate)":[230],"nearest":[231],"neighbor":[232],"search.":[233],"Python":[234],"implementations":[235],"proposed":[238],"publicly":[241],"available.":[242]},"counts_by_year":[{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":2}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
