{"id":"https://openalex.org/W4312385682","doi":"https://doi.org/10.1109/dsit55514.2022.9943820","title":"An Algorithmic View of Streaming Submodular Data Summarization with A Knapsack Constraint","display_name":"An Algorithmic View of Streaming Submodular Data Summarization with A Knapsack Constraint","publication_year":2022,"publication_date":"2022-07-22","ids":{"openalex":"https://openalex.org/W4312385682","doi":"https://doi.org/10.1109/dsit55514.2022.9943820"},"language":"en","primary_location":{"id":"doi:10.1109/dsit55514.2022.9943820","is_oa":false,"landing_page_url":"https://doi.org/10.1109/dsit55514.2022.9943820","pdf_url":null,"source":{"id":"https://openalex.org/S4363608293","display_name":"2022 5th International Conference on Data Science and Information Technology (DSIT)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 5th International Conference on Data Science and Information Technology (DSIT)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5052733753","display_name":"Enpei Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Enpei Zhang","raw_affiliation_strings":["University of Science and Technology of China,School of Computer Science and Technology,Hefei,China","School of Computer Science and Technology, University of Science and Technology of China, Hefei, China"],"affiliations":[{"raw_affiliation_string":"University of Science and Technology of China,School of Computer Science and Technology,Hefei,China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"School of Computer Science and Technology, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084367706","display_name":"Kai Han","orcid":"https://orcid.org/0000-0002-6302-5366"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210125878","display_name":"Suzhou Research Institute","ror":"https://ror.org/03ebk0c60","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210125878"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kai Han","raw_affiliation_strings":["University of Science and Technology of China,School of Computer Science and Technology,Hefei,China","Suzhou Research Institute, University of Science and Technology of China, Suzhou, China","School of Computer Science and Technology, University of Science and Technology of China, Hefei, China"],"affiliations":[{"raw_affiliation_string":"University of Science and Technology of China,School of Computer Science and Technology,Hefei,China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"Suzhou Research Institute, University of Science and Technology of China, Suzhou, China","institution_ids":["https://openalex.org/I4210125878"]},{"raw_affiliation_string":"School of Computer Science and Technology, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5012844835","display_name":"Benwei Wu","orcid":"https://orcid.org/0000-0002-5420-2455"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Benwei Wu","raw_affiliation_strings":["University of Science and Technology of China,School of Computer Science and Technology,Hefei,China","School of Computer Science and Technology, University of Science and Technology of China, Hefei, China"],"affiliations":[{"raw_affiliation_string":"University of Science and Technology of China,School of Computer Science and Technology,Hefei,China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"School of Computer Science and Technology, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5052733753"],"corresponding_institution_ids":["https://openalex.org/I126520041"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.16336634,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"5","issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10720","display_name":"Complexity and Algorithms in Graphs","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10720","display_name":"Complexity and Algorithms in Graphs","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10237","display_name":"Cryptography and Data Security","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/automatic-summarization","display_name":"Automatic summarization","score":0.9289142489433289},{"id":"https://openalex.org/keywords/submodular-set-function","display_name":"Submodular set function","score":0.9171895980834961},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7862769961357117},{"id":"https://openalex.org/keywords/knapsack-problem","display_name":"Knapsack problem","score":0.6746506690979004},{"id":"https://openalex.org/keywords/streaming-algorithm","display_name":"Streaming algorithm","score":0.5433119535446167},{"id":"https://openalex.org/keywords/redundancy","display_name":"Redundancy (engineering)","score":0.5190547108650208},{"id":"https://openalex.org/keywords/constraint","display_name":"Constraint (computer-aided design)","score":0.47127267718315125},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.449384868144989},{"id":"https://openalex.org/keywords/maximization","display_name":"Maximization","score":0.43169182538986206},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4229119122028351},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.33181124925613403},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.295793354511261},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.2387988567352295},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.22804686427116394},{"id":"https://openalex.org/keywords/upper-and-lower-bounds","display_name":"Upper and lower bounds","score":0.15330687165260315},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.10989227890968323}],"concepts":[{"id":"https://openalex.org/C170858558","wikidata":"https://www.wikidata.org/wiki/Q1394144","display_name":"Automatic summarization","level":2,"score":0.9289142489433289},{"id":"https://openalex.org/C178621042","wikidata":"https://www.wikidata.org/wiki/Q7631710","display_name":"Submodular set function","level":2,"score":0.9171895980834961},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7862769961357117},{"id":"https://openalex.org/C113138325","wikidata":"https://www.wikidata.org/wiki/Q864457","display_name":"Knapsack problem","level":2,"score":0.6746506690979004},{"id":"https://openalex.org/C187166803","wikidata":"https://www.wikidata.org/wiki/Q2835831","display_name":"Streaming algorithm","level":3,"score":0.5433119535446167},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.5190547108650208},{"id":"https://openalex.org/C2776036281","wikidata":"https://www.wikidata.org/wiki/Q48769818","display_name":"Constraint (computer-aided design)","level":2,"score":0.47127267718315125},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.449384868144989},{"id":"https://openalex.org/C2776330181","wikidata":"https://www.wikidata.org/wiki/Q18358244","display_name":"Maximization","level":2,"score":0.43169182538986206},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4229119122028351},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.33181124925613403},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.295793354511261},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2387988567352295},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.22804686427116394},{"id":"https://openalex.org/C77553402","wikidata":"https://www.wikidata.org/wiki/Q13222579","display_name":"Upper and lower bounds","level":2,"score":0.15330687165260315},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.10989227890968323},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/dsit55514.2022.9943820","is_oa":false,"landing_page_url":"https://doi.org/10.1109/dsit55514.2022.9943820","pdf_url":null,"source":{"id":"https://openalex.org/S4363608293","display_name":"2022 5th International Conference on Data Science and Information Technology (DSIT)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 5th International Conference on Data Science and Information Technology (DSIT)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","score":0.47999998927116394,"id":"https://metadata.un.org/sdg/9"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":34,"referenced_works":["https://openalex.org/W1498671329","https://openalex.org/W1503396090","https://openalex.org/W1680189815","https://openalex.org/W1997959284","https://openalex.org/W2055421030","https://openalex.org/W2100597616","https://openalex.org/W2110373679","https://openalex.org/W2130623086","https://openalex.org/W2143996311","https://openalex.org/W2144933361","https://openalex.org/W2158504911","https://openalex.org/W2473929617","https://openalex.org/W2745561525","https://openalex.org/W2809067649","https://openalex.org/W2950680139","https://openalex.org/W2964165521","https://openalex.org/W2974376984","https://openalex.org/W3090042385","https://openalex.org/W3094553672","https://openalex.org/W3165629504","https://openalex.org/W3213622323","https://openalex.org/W4288560659","https://openalex.org/W4364374016","https://openalex.org/W6629615516","https://openalex.org/W6679392573","https://openalex.org/W6681106510","https://openalex.org/W6720980371","https://openalex.org/W6742761132","https://openalex.org/W6752724758","https://openalex.org/W6761195460","https://openalex.org/W6762219430","https://openalex.org/W6762785454","https://openalex.org/W6783566758","https://openalex.org/W6784784755"],"related_works":["https://openalex.org/W2963844234","https://openalex.org/W2803250016","https://openalex.org/W2896347948","https://openalex.org/W4302557420","https://openalex.org/W2950500962","https://openalex.org/W2915041254","https://openalex.org/W2963443186","https://openalex.org/W4382197677","https://openalex.org/W3128830699","https://openalex.org/W4299680505"],"abstract_inverted_index":{"Data":[0],"summarization,":[1],"in":[2,127],"the":[3,34,44,54,72,108,136,149,173,185,199],"form":[4],"of":[5,43,56,75,110,123,157,203],"extracting":[6],"a":[7,11,15,40,57,61,143,178],"representative":[8],"subset":[9],"(i.e,":[10],"data":[12,17,24,76,80,95,168,194],"summary)":[13],"from":[14],"massive":[16,91],"set,":[18],"is":[19,153],"often":[20],"used":[21,126],"for":[22,148],"big":[23],"processing.":[25],"A":[26],"good":[27],"summary":[28,58],"can":[29,171],"not":[30],"only":[31],"significantly":[32],"reduce":[33],"information":[35],"redundancy,":[36],"but":[37],"also":[38,66],"provide":[39],"better":[41],"understanding":[42],"original":[45],"data.":[46],"The":[47],"utility":[48],"function":[49],"we":[50,117,140,187],"use":[51],"to":[52,71,88,103,107,197],"evaluate":[53],"quality":[55],"usually":[59],"has":[60,82],"natrual":[62],"diminishing":[63],"returns":[64],"property,":[65],"known":[67],"as":[68],"submodularity.":[69],"Due":[70],"rapid":[73],"growth":[74],"scale,":[77],"traditional":[78,158],"offline":[79],"processing":[81,96],"become":[83],"more":[84,86],"and":[85,93,164,181,201],"difficult":[87],"deal":[89],"with":[90,131,167],"data,":[92],"streaming":[94,128],"methods":[97,124],"that":[98],"require":[99],"less":[100],"space":[101,182],"start":[102],"attract":[104],"attention,":[105],"leading":[106],"emergence":[109],"many":[111],"related":[112],"studies.":[113],"In":[114],"this":[115],"paper,":[116],"first":[118],"make":[119],"an":[120,154],"algorithmic":[121],"view":[122],"widely":[125],"submodu-lar":[129],"maximization":[130],"knapsack":[132],"constraint.":[133],"After":[134],"analyzing":[135],"ideas":[137],"behind":[138],"them,":[139],"further":[141],"propose":[142],"new":[144],"algorithm,":[145],"called":[146],"RSStream,":[147],"same":[150],"problem.":[151],"RSStream":[152],"innovative":[155],"combination":[156],"sieve":[159],"approach,":[160],"multi-cadidate":[161],"set":[162],"method":[163],"augmentation":[165],"strategy":[166],"sampling.":[169],"It":[170],"achieve":[172],"state-of-the-art":[174],"approximation":[175],"ratio":[176],"within":[177],"near-linear":[179],"time":[180],"complexity.":[183],"At":[184],"end,":[186],"execute":[188],"our":[189],"algorithm":[190],"on":[191],"two":[192],"real":[193],"summarization":[195],"applications":[196],"demonstrate":[198],"effectiveness":[200],"efficiency":[202],"it.":[204]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
