{"id":"https://openalex.org/W4318187661","doi":"https://doi.org/10.1109/bigdata55660.2022.10021052","title":"A Crowd Source System for YouTube Big Data Analytics: Unpacking Values from Data Sprawl","display_name":"A Crowd Source System for YouTube Big Data Analytics: Unpacking Values from Data Sprawl","publication_year":2022,"publication_date":"2022-12-17","ids":{"openalex":"https://openalex.org/W4318187661","doi":"https://doi.org/10.1109/bigdata55660.2022.10021052"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata55660.2022.10021052","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/bigdata55660.2022.10021052","pdf_url":null,"source":{"id":"https://openalex.org/S4363607709","display_name":"2022 IEEE International Conference on Big Data (Big Data)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5112207879","display_name":"Jagan Mohan Reddy","orcid":null},"institutions":[{"id":"https://openalex.org/I63190737","display_name":"University at Buffalo, State University of New York","ror":"https://ror.org/01y64my43","country_code":"US","type":"education","lineage":["https://openalex.org/I63190737"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Jagan Mohan Reddy","raw_affiliation_strings":["University at Buffalo, SUNY,Institute for Artificial Intelligence and Data Science,New York,USA","Institute for Artificial Intelligence and Data Science, University at Buffalo, SUNY, New York, USA"],"affiliations":[{"raw_affiliation_string":"University at Buffalo, SUNY,Institute for Artificial Intelligence and Data Science,New York,USA","institution_ids":["https://openalex.org/I63190737"]},{"raw_affiliation_string":"Institute for Artificial Intelligence and Data Science, University at Buffalo, SUNY, New York, USA","institution_ids":["https://openalex.org/I63190737"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021929880","display_name":"Abhishek Attuluri","orcid":null},"institutions":[{"id":"https://openalex.org/I63190737","display_name":"University at Buffalo, State University of New York","ror":"https://ror.org/01y64my43","country_code":"US","type":"education","lineage":["https://openalex.org/I63190737"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Abhishek Attuluri","raw_affiliation_strings":["University at Buffalo, SUNY,Institute for Artificial Intelligence and Data Science,New York,USA","Institute for Artificial Intelligence and Data Science, University at Buffalo, SUNY, New York, USA"],"affiliations":[{"raw_affiliation_string":"University at Buffalo, SUNY,Institute for Artificial Intelligence and Data Science,New York,USA","institution_ids":["https://openalex.org/I63190737"]},{"raw_affiliation_string":"Institute for Artificial Intelligence and Data Science, University at Buffalo, SUNY, New York, USA","institution_ids":["https://openalex.org/I63190737"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080730479","display_name":"Abhinay Kolli","orcid":null},"institutions":[{"id":"https://openalex.org/I63190737","display_name":"University at Buffalo, State University of New York","ror":"https://ror.org/01y64my43","country_code":"US","type":"education","lineage":["https://openalex.org/I63190737"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Abhinay Kolli","raw_affiliation_strings":["University at Buffalo, SUNY,Institute for Artificial Intelligence and Data Science,New York,USA","Institute for Artificial Intelligence and Data Science, University at Buffalo, SUNY, New York, USA"],"affiliations":[{"raw_affiliation_string":"University at Buffalo, SUNY,Institute for Artificial Intelligence and Data Science,New York,USA","institution_ids":["https://openalex.org/I63190737"]},{"raw_affiliation_string":"Institute for Artificial Intelligence and Data Science, University at Buffalo, SUNY, New York, USA","institution_ids":["https://openalex.org/I63190737"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064445643","display_name":"Nazmus Sakib","orcid":"https://orcid.org/0000-0001-7671-9888"},"institutions":[{"id":"https://openalex.org/I172980758","display_name":"Kennesaw State University","ror":"https://ror.org/00jeqjx33","country_code":"US","type":"education","lineage":["https://openalex.org/I172980758"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Nazmus Sakib","raw_affiliation_strings":["Kennesaw State University,Department of Information Technology,Georgia,United States","Department of Information Technology, Kennesaw State University, Georgia, United States"],"affiliations":[{"raw_affiliation_string":"Kennesaw State University,Department of Information Technology,Georgia,United States","institution_ids":["https://openalex.org/I172980758"]},{"raw_affiliation_string":"Department of Information Technology, Kennesaw State University, Georgia, United States","institution_ids":["https://openalex.org/I172980758"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052820694","display_name":"Hossain Shahriar","orcid":"https://orcid.org/0000-0003-1021-7986"},"institutions":[{"id":"https://openalex.org/I172980758","display_name":"Kennesaw State University","ror":"https://ror.org/00jeqjx33","country_code":"US","type":"education","lineage":["https://openalex.org/I172980758"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hossain Shahriar","raw_affiliation_strings":["Kennesaw State University,Department of Information Technology,Georgia,United States","Department of Information Technology, Kennesaw State University, Georgia, United States"],"affiliations":[{"raw_affiliation_string":"Kennesaw State University,Department of Information Technology,Georgia,United States","institution_ids":["https://openalex.org/I172980758"]},{"raw_affiliation_string":"Department of Information Technology, Kennesaw State University, Georgia, United States","institution_ids":["https://openalex.org/I172980758"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5053225136","display_name":"Alfredo Cuzzocrea","orcid":"https://orcid.org/0000-0002-7104-6415"},"institutions":[{"id":"https://openalex.org/I45204951","display_name":"University of Calabria","ror":"https://ror.org/02rc97e94","country_code":"IT","type":"education","lineage":["https://openalex.org/I45204951"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Alfredo Cuzzocrea","raw_affiliation_strings":["University of Calabria,iDEA Lab,Rende,Italy","iDEA Lab, University of Calabria, Rende, Italy"],"affiliations":[{"raw_affiliation_string":"University of Calabria,iDEA Lab,Rende,Italy","institution_ids":["https://openalex.org/I45204951"]},{"raw_affiliation_string":"iDEA Lab, University of Calabria, Rende, Italy","institution_ids":["https://openalex.org/I45204951"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5112207879"],"corresponding_institution_ids":["https://openalex.org/I63190737"],"apc_list":null,"apc_paid":null,"fwci":0.2079,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.45852187,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":96},"biblio":{"volume":"3","issue":null,"first_page":"5451","last_page":"5457"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9864000082015991,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11165","display_name":"Image and Video Quality Assessment","score":0.9801999926567078,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/upload","display_name":"Upload","score":0.7851284742355347},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6794736385345459},{"id":"https://openalex.org/keywords/entertainment","display_name":"Entertainment","score":0.6776523590087891},{"id":"https://openalex.org/keywords/analytics","display_name":"Analytics","score":0.5561050772666931},{"id":"https://openalex.org/keywords/animation","display_name":"Animation","score":0.5537523031234741},{"id":"https://openalex.org/keywords/unpacking","display_name":"Unpacking","score":0.5195470452308655},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.4839661419391632},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.4838672876358032},{"id":"https://openalex.org/keywords/metadata","display_name":"Metadata","score":0.4310782253742218},{"id":"https://openalex.org/keywords/social-media","display_name":"Social media","score":0.41203126311302185},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.39575865864753723},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.3235568702220917},{"id":"https://openalex.org/keywords/computer-graphics","display_name":"Computer graphics (images)","score":0.220828115940094},{"id":"https://openalex.org/keywords/visual-arts","display_name":"Visual arts","score":0.10284900665283203},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.08999234437942505}],"concepts":[{"id":"https://openalex.org/C71901391","wikidata":"https://www.wikidata.org/wiki/Q7126699","display_name":"Upload","level":2,"score":0.7851284742355347},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6794736385345459},{"id":"https://openalex.org/C512170562","wikidata":"https://www.wikidata.org/wiki/Q173799","display_name":"Entertainment","level":2,"score":0.6776523590087891},{"id":"https://openalex.org/C79158427","wikidata":"https://www.wikidata.org/wiki/Q485396","display_name":"Analytics","level":2,"score":0.5561050772666931},{"id":"https://openalex.org/C502989409","wikidata":"https://www.wikidata.org/wiki/Q11425","display_name":"Animation","level":2,"score":0.5537523031234741},{"id":"https://openalex.org/C2777256151","wikidata":"https://www.wikidata.org/wiki/Q7897273","display_name":"Unpacking","level":2,"score":0.5195470452308655},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.4839661419391632},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.4838672876358032},{"id":"https://openalex.org/C93518851","wikidata":"https://www.wikidata.org/wiki/Q180160","display_name":"Metadata","level":2,"score":0.4310782253742218},{"id":"https://openalex.org/C518677369","wikidata":"https://www.wikidata.org/wiki/Q202833","display_name":"Social media","level":2,"score":0.41203126311302185},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.39575865864753723},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3235568702220917},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.220828115940094},{"id":"https://openalex.org/C153349607","wikidata":"https://www.wikidata.org/wiki/Q36649","display_name":"Visual arts","level":1,"score":0.10284900665283203},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.08999234437942505},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bigdata55660.2022.10021052","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/bigdata55660.2022.10021052","pdf_url":null,"source":{"id":"https://openalex.org/S4363607709","display_name":"2022 IEEE International Conference on Big Data (Big Data)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.4099999964237213,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W1905517526","https://openalex.org/W1970546327","https://openalex.org/W2019880039","https://openalex.org/W2055533652","https://openalex.org/W2064947852","https://openalex.org/W2131635820","https://openalex.org/W2326236514","https://openalex.org/W2360467051","https://openalex.org/W2486439025","https://openalex.org/W2566979091","https://openalex.org/W2608540862","https://openalex.org/W2806822625","https://openalex.org/W2964248614","https://openalex.org/W2972495354","https://openalex.org/W2979325626","https://openalex.org/W2982685870","https://openalex.org/W3010323204","https://openalex.org/W3096600429","https://openalex.org/W3134077353","https://openalex.org/W3160602257","https://openalex.org/W3196049610","https://openalex.org/W4213207641","https://openalex.org/W4300801802","https://openalex.org/W6639714453","https://openalex.org/W6731596640","https://openalex.org/W6736763614","https://openalex.org/W6746988035","https://openalex.org/W6767805426","https://openalex.org/W6774642716"],"related_works":["https://openalex.org/W2980032325","https://openalex.org/W2042188247","https://openalex.org/W2017714611","https://openalex.org/W4224995949","https://openalex.org/W1992482086","https://openalex.org/W2385797406","https://openalex.org/W2024662052","https://openalex.org/W2608610227","https://openalex.org/W2527888910","https://openalex.org/W2902937489"],"abstract_inverted_index":{"YouTube":[0,30],"has":[1],"emerged":[2],"as":[3],"the":[4,10,35,43,46,55,58,75,113,119,130,136,174],"most":[5],"popular":[6],"video":[7,77,109,116,121,133],"platform":[8],"across":[9],"world.":[11],"This":[12],"paper":[13],"proposes":[14],"a":[15],"system":[16,33],"for":[17,29,40,84,106],"stream":[18],"based":[19],"meta-data":[20,78],"analytics,":[21],"to":[22,57,67,70,95],"gain":[23],"insights":[24],"and":[25,49,61,64,161],"uncover":[26],"hidden":[27],"patterns,":[28],"videos.":[31],"The":[32,163],"reports":[34],"number":[36,138],"of":[37,123,139],"videos":[38,44,140,165],"uploaded":[39,167],"each":[41],"category,":[42,170],"with":[45,89,118,135],"highest":[47,50,137,164],"views":[48],"likes":[51],"etc.":[52],"It":[53],"crowd-sources":[54],"calls":[56],"YouTube\u2019s":[59],"search":[60],"data":[62,110],"APIs,":[63],"feeds":[65],"it":[66,98],"Kafka":[68],"Stream":[69],"process":[71],"using":[72],"PySpark.":[73],"Finally,":[74],"processed":[76],"in":[79,81],"stored":[80],"Apache":[82],"Cassandra":[83],"downstream":[85],"consumption.":[86],"By":[87],"experimenting":[88],"different":[90],"time":[91],"windows":[92],"from":[93],"5":[94],"30":[96,115,124],"minutes,":[97,125],"is":[99,104],"observed":[100,128],"that":[101,129],"15-minute":[102],"window":[103],"optimum":[105],"getting":[107],"adequate":[108],"de-duplication.":[111],"From":[112],"available":[114],"categories,":[117],"minimum":[120],"length":[122],"our":[126],"study":[127],"top":[131],"10":[132],"categories":[134],"are":[141,166],"Film":[142],"&":[143,146,151,155,159],"Animation,":[144],"Autos":[145],"Vehicles,":[147],"Music,":[148],"Sports,":[149],"Travel":[150],"Events,":[152],"Entertainment,":[153],"News":[154],"politics,":[156],"Documentary,":[157],"Science":[158],"Technology":[160],"Education.":[162],"under":[168],"Entertainment":[169],"which":[171],"clearly":[172],"captures":[173],"content":[175],"creator\u2019s":[176],"interest.":[177]},"counts_by_year":[{"year":2024,"cited_by_count":2}],"updated_date":"2025-12-21T01:58:51.020947","created_date":"2025-10-10T00:00:00"}
