{"id":"https://openalex.org/W4409657479","doi":"https://doi.org/10.1145/3696410.3714890","title":"Linear-Time Algorithms for Representative Subset Selection From Data Streams","display_name":"Linear-Time Algorithms for Representative Subset Selection From Data Streams","publication_year":2025,"publication_date":"2025-04-22","ids":{"openalex":"https://openalex.org/W4409657479","doi":"https://doi.org/10.1145/3696410.3714890"},"language":"en","primary_location":{"id":"doi:10.1145/3696410.3714890","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3696410.3714890","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3696410.3714890","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Web Conference 2025","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3696410.3714890","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5043822784","display_name":"Shuang Cui","orcid":"https://orcid.org/0000-0001-6080-4850"},"institutions":[{"id":"https://openalex.org/I3923682","display_name":"Soochow University","ror":"https://ror.org/05t8y2r12","country_code":"CN","type":"education","lineage":["https://openalex.org/I3923682"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Shuang Cui","raw_affiliation_strings":["Soochow University, Suzhou, Jiangsu, China"],"affiliations":[{"raw_affiliation_string":"Soochow University, Suzhou, Jiangsu, China","institution_ids":["https://openalex.org/I3923682"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084367706","display_name":"Kai Han","orcid":"https://orcid.org/0000-0002-6302-5366"},"institutions":[{"id":"https://openalex.org/I3923682","display_name":"Soochow University","ror":"https://ror.org/05t8y2r12","country_code":"CN","type":"education","lineage":["https://openalex.org/I3923682"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kai Han","raw_affiliation_strings":["Soochow University, Suzhou, Jiangsu, China"],"affiliations":[{"raw_affiliation_string":"Soochow University, Suzhou, Jiangsu, China","institution_ids":["https://openalex.org/I3923682"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5077270486","display_name":"Jing Tang","orcid":"https://orcid.org/0000-0002-0785-707X"},"institutions":[{"id":"https://openalex.org/I200769079","display_name":"Hong Kong University of Science and Technology","ror":"https://ror.org/00q4vv597","country_code":"HK","type":"education","lineage":["https://openalex.org/I200769079"]},{"id":"https://openalex.org/I889458895","display_name":"University of Hong Kong","ror":"https://ror.org/02zhqgq86","country_code":"HK","type":"education","lineage":["https://openalex.org/I889458895"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Jing Tang","raw_affiliation_strings":["The Hong Kong University of Science and Technology (Guangzhou), Guangzhou, Guangdong, China and The Hong Kong University of Science and Technology, Kowloon, Hong Kong, China"],"affiliations":[{"raw_affiliation_string":"The Hong Kong University of Science and Technology (Guangzhou), Guangzhou, Guangdong, China and The Hong Kong University of Science and Technology, Kowloon, Hong Kong, China","institution_ids":["https://openalex.org/I200769079","https://openalex.org/I889458895"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5043822784"],"corresponding_institution_ids":["https://openalex.org/I3923682"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0356136,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"4710","last_page":"4721"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9909999966621399,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.986299991607666,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7498727440834045},{"id":"https://openalex.org/keywords/streams","display_name":"STREAMS","score":0.5466982126235962},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.5432850122451782},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.490386962890625},{"id":"https://openalex.org/keywords/data-stream-mining","display_name":"Data stream mining","score":0.476136714220047},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3000481128692627},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.20015859603881836},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.1256161630153656}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7498727440834045},{"id":"https://openalex.org/C42090638","wikidata":"https://www.wikidata.org/wiki/Q4048907","display_name":"STREAMS","level":2,"score":0.5466982126235962},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.5432850122451782},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.490386962890625},{"id":"https://openalex.org/C89198739","wikidata":"https://www.wikidata.org/wiki/Q3079880","display_name":"Data stream mining","level":2,"score":0.476136714220047},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3000481128692627},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.20015859603881836},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.1256161630153656}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3696410.3714890","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3696410.3714890","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3696410.3714890","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Web Conference 2025","raw_type":"proceedings-article"},{"id":"pmh:oai:repository.hkust.edu.hk:1783.1-159260","is_oa":false,"landing_page_url":"http://repository.hkust.edu.hk/ir/Record/1783.1-159260","pdf_url":null,"source":{"id":"https://openalex.org/S4306401796","display_name":"Rare & Special e-Zone (The Hong Kong University of Science and Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I200769079","host_organization_name":"Hong Kong University of Science and Technology","host_organization_lineage":["https://openalex.org/I200769079"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Conference paper"}],"best_oa_location":{"id":"doi:10.1145/3696410.3714890","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3696410.3714890","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3696410.3714890","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Web Conference 2025","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1231421488","display_name":null,"funder_award_id":"under","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G1477544716","display_name":null,"funder_award_id":"Guangdong","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G1560154075","display_name":null,"funder_award_id":"2024A03","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2087396116","display_name":null,"funder_award_id":"China","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2390730835","display_name":null,"funder_award_id":"2023A1515110131","funder_id":"https://openalex.org/F4320337111","funder_display_name":"Basic and Applied Basic Research Foundation of Guangdong Province"},{"id":"https://openalex.org/G3317480652","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G380298712","display_name":null,"funder_award_id":"U22B2060","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3845753876","display_name":null,"funder_award_id":"2023A03J0667","funder_id":"https://openalex.org/F4320330743","funder_display_name":"Guangzhou Municipal Science and Technology Bureau"},{"id":"https://openalex.org/G391238517","display_name":null,"funder_award_id":", and","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5939423041","display_name":null,"funder_award_id":"Technology","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5992379237","display_name":null,"funder_award_id":"62172384","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5994120800","display_name":null,"funder_award_id":"Natural","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6536786679","display_name":null,"funder_award_id":"A1515110","funder_id":"https://openalex.org/F4320337111","funder_display_name":"Basic and Applied Basic Research Foundation of Guangdong Province"},{"id":"https://openalex.org/G6639867748","display_name":null,"funder_award_id":"2023A03","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7723461095","display_name":null,"funder_award_id":"2023A151511","funder_id":"https://openalex.org/F4320337111","funder_display_name":"Basic and Applied Basic Research Foundation of Guangdong Province"},{"id":"https://openalex.org/G7726157001","display_name":null,"funder_award_id":"Grant No.","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320330743","display_name":"Guangzhou Municipal Science and Technology Bureau","ror":null},{"id":"https://openalex.org/F4320337111","display_name":"Basic and Applied Basic Research Foundation of Guangdong Province","ror":null}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4409657479.pdf","grobid_xml":"https://content.openalex.org/works/W4409657479.grobid-xml"},"referenced_works_count":52,"referenced_works":["https://openalex.org/W112063162","https://openalex.org/W398859631","https://openalex.org/W1503396090","https://openalex.org/W1586809440","https://openalex.org/W1801423597","https://openalex.org/W1989151913","https://openalex.org/W1997959284","https://openalex.org/W2026338082","https://openalex.org/W2033885045","https://openalex.org/W2052876922","https://openalex.org/W2053853578","https://openalex.org/W2061820396","https://openalex.org/W2063280781","https://openalex.org/W2080379754","https://openalex.org/W2109297205","https://openalex.org/W2109309418","https://openalex.org/W2110373679","https://openalex.org/W2145825677","https://openalex.org/W2179494254","https://openalex.org/W2527454481","https://openalex.org/W2540677289","https://openalex.org/W2626914210","https://openalex.org/W2729094633","https://openalex.org/W2745560456","https://openalex.org/W2757107770","https://openalex.org/W2759321404","https://openalex.org/W2944325705","https://openalex.org/W2953374984","https://openalex.org/W2974376984","https://openalex.org/W3012895300","https://openalex.org/W3038620866","https://openalex.org/W3048380211","https://openalex.org/W3105524178","https://openalex.org/W3130088724","https://openalex.org/W3131115866","https://openalex.org/W3134887725","https://openalex.org/W3165223799","https://openalex.org/W3172805627","https://openalex.org/W3181027293","https://openalex.org/W3208860981","https://openalex.org/W3211973203","https://openalex.org/W3213622323","https://openalex.org/W4230174951","https://openalex.org/W4231490457","https://openalex.org/W4246587691","https://openalex.org/W4290927726","https://openalex.org/W4292070111","https://openalex.org/W4294397379","https://openalex.org/W4318812107","https://openalex.org/W4367046887","https://openalex.org/W4385562547","https://openalex.org/W4401863396"],"related_works":["https://openalex.org/W4293083682","https://openalex.org/W2061507057","https://openalex.org/W807005383","https://openalex.org/W2182399080","https://openalex.org/W1501624740","https://openalex.org/W1984941792","https://openalex.org/W2369440580","https://openalex.org/W2106570241","https://openalex.org/W3144654663","https://openalex.org/W2109863941"],"abstract_inverted_index":{"Representative":[0],"subset":[1],"selection":[2],"from":[3],"data":[4,15,26,49,84,117,137,213],"streams":[5],"is":[6,33,61,168],"a":[7,38,44,66,97,183],"critical":[8],"problem":[9,32],"with":[10,192],"wide-ranging":[11],"applications":[12,209],"in":[13,51,104,225],"web":[14,212],"mining":[16,214],"and":[17,28,58,86,107,160,199,215,230],"machine":[18],"learning,":[19],"such":[20],"as":[21,36],"social":[22,216],"media":[23,217],"marketing,":[24],"big":[25],"summarization,":[27],"recommendation":[29],"systems.":[30],"This":[31],"often":[34],"framed":[35],"maximizing":[37],"monotone":[39],"submodular":[40],"function":[41],"subject":[42],"to":[43,62,69,182,211],"knapsack":[45],"constraint,":[46],"where":[47,166],"each":[48],"element":[50],"the":[52,59,81,93,124,136,169,190,220],"stream":[53],"has":[54],"an":[55,150],"associated":[56],"cost,":[57],"goal":[60],"select":[63],"elements":[64],"within":[65],"budget":[67,94],"B":[68],"maximize":[70],"revenue.":[71],"However,":[72],"existing":[73],"algorithms":[74,100,128,224],"typically":[75],"rely":[76],"on":[77,92,135],"restrictive":[78],"assumptions":[79,134],"about":[80],"costs":[82],"of":[83,153,172,222,227],"elements,":[85],"their":[87],"performance":[88],"bounds":[89],"heavily":[90],"depend":[91],"B.":[95],"As":[96],"result,":[98],"these":[99],"are":[101],"only":[102,186],"effective":[103],"limited":[105],"scenarios":[106],"have":[108],"super-linear":[109],"time":[110,158,197],"complexity,":[111,165],"making":[112],"them":[113],"unsuitable":[114],"for":[115,129],"large-scale":[116],"streams.":[118],"In":[119],"this":[120,130,181],"paper,":[121],"we":[122],"introduce":[123],"first":[125],"linear-time":[126],"streaming":[127,147,178],"problem,":[131],"without":[132],"any":[133,173],"stream,":[138,191],"while":[139],"also":[140],"minimizing":[141],"memory":[142],"usage.":[143],"Specifically,":[144],"our":[145,223],"single-pass":[146],"algorithm":[148,179],"achieves":[149],"approximation":[151],"ratio":[152],"1/8-\u03b5":[154],"under":[155],"O":[156,193],"(n)":[157],"complexity":[159,198],"O(k":[161],"log":[162,195,201],"1/\u03b5)":[163,196,202],"space":[164,203],"k":[167],"largest":[170],"cardinality":[171],"feasible":[174],"solution.":[175],"Our":[176],"multi-pass":[177],"improves":[180],"(1/2-\u03b5)-approximation":[184],"using":[185],"three":[187],"passes":[188],"over":[189],"(n/\u03b5":[194],"O(k/\u03b5":[200],"complexity.":[204],"Extensive":[205],"experiments":[206],"across":[207],"various":[208],"related":[210],"marketing":[218],"demonstrate":[219],"superiority":[221],"terms":[226],"both":[228],"effectiveness":[229],"efficiency.":[231]},"counts_by_year":[],"updated_date":"2026-04-13T07:58:08.660418","created_date":"2025-10-10T00:00:00"}
