{"id":"https://openalex.org/W7160824895","doi":"https://doi.org/10.48550/arxiv.2605.06999","title":"TubeCensus: A Transparent, Replicable, and Large-Scale Census of YouTube Channels and their Subscriber Counts Over Time","display_name":"TubeCensus: A Transparent, Replicable, and Large-Scale Census of YouTube Channels and their Subscriber Counts Over Time","publication_year":2026,"publication_date":"2026-05-07","ids":{"openalex":"https://openalex.org/W7160824895","doi":"https://doi.org/10.48550/arxiv.2605.06999"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.06999","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.06999","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.06999","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5086659454","display_name":"Chloe Eggleston","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Eggleston, Chloe","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135836988","display_name":"Abram Handler","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Handler, Abram","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5005560875","display_name":"Mar\u00eda Leonor Pacheco","orcid":"https://orcid.org/0000-0001-8399-3199"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pacheco, Maria Leonor","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5086659454"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10609","display_name":"Digital Marketing and Social Media","score":0.3555999994277954,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10609","display_name":"Digital Marketing and Social Media","score":0.3555999994277954,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":0.05640000104904175,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12214","display_name":"Media Influence and Health","score":0.04100000113248825,"subfield":{"id":"https://openalex.org/subfields/1208","display_name":"Literature and Literary Theory"},"field":{"id":"https://openalex.org/fields/12","display_name":"Arts and Humanities"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/metadata","display_name":"Metadata","score":0.6468999981880188},{"id":"https://openalex.org/keywords/the-internet","display_name":"The Internet","score":0.5932999849319458},{"id":"https://openalex.org/keywords/social-media","display_name":"Social media","score":0.5375999808311462},{"id":"https://openalex.org/keywords/identifier","display_name":"Identifier","score":0.5332000255584717},{"id":"https://openalex.org/keywords/visibility","display_name":"Visibility","score":0.4837000072002411},{"id":"https://openalex.org/keywords/channel","display_name":"Channel (broadcasting)","score":0.47450000047683716},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4108000099658966},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.4065000116825104}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6629999876022339},{"id":"https://openalex.org/C93518851","wikidata":"https://www.wikidata.org/wiki/Q180160","display_name":"Metadata","level":2,"score":0.6468999981880188},{"id":"https://openalex.org/C110875604","wikidata":"https://www.wikidata.org/wiki/Q75","display_name":"The Internet","level":2,"score":0.5932999849319458},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.573199987411499},{"id":"https://openalex.org/C518677369","wikidata":"https://www.wikidata.org/wiki/Q202833","display_name":"Social media","level":2,"score":0.5375999808311462},{"id":"https://openalex.org/C154504017","wikidata":"https://www.wikidata.org/wiki/Q853614","display_name":"Identifier","level":2,"score":0.5332000255584717},{"id":"https://openalex.org/C123403432","wikidata":"https://www.wikidata.org/wiki/Q654068","display_name":"Visibility","level":2,"score":0.4837000072002411},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.47450000047683716},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4108000099658966},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.4065000116825104},{"id":"https://openalex.org/C108827166","wikidata":"https://www.wikidata.org/wiki/Q175975","display_name":"Internet privacy","level":1,"score":0.37139999866485596},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.36329999566078186},{"id":"https://openalex.org/C29122968","wikidata":"https://www.wikidata.org/wiki/Q1414816","display_name":"Incentive","level":2,"score":0.35530000925064087},{"id":"https://openalex.org/C62230096","wikidata":"https://www.wikidata.org/wiki/Q275969","display_name":"Crowdsourcing","level":2,"score":0.3206000030040741},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3068999946117401},{"id":"https://openalex.org/C52130261","wikidata":"https://www.wikidata.org/wiki/Q39825","display_name":"Census","level":3,"score":0.30239999294281006},{"id":"https://openalex.org/C558299567","wikidata":"https://www.wikidata.org/wiki/Q11033","display_name":"Mass media","level":2,"score":0.29750001430511475},{"id":"https://openalex.org/C113954288","wikidata":"https://www.wikidata.org/wiki/Q186885","display_name":"Timestamp","level":2,"score":0.2973000109195709},{"id":"https://openalex.org/C2778355321","wikidata":"https://www.wikidata.org/wiki/Q17079427","display_name":"Identity (music)","level":2,"score":0.290800005197525},{"id":"https://openalex.org/C83849155","wikidata":"https://www.wikidata.org/wiki/Q1472399","display_name":"Internet access","level":3,"score":0.2815999984741211},{"id":"https://openalex.org/C85973986","wikidata":"https://www.wikidata.org/wiki/Q1091731","display_name":"Exploratory research","level":2,"score":0.26429998874664307},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.2635999917984009},{"id":"https://openalex.org/C17632256","wikidata":"https://www.wikidata.org/wiki/Q1076968","display_name":"Digital media","level":2,"score":0.25540000200271606},{"id":"https://openalex.org/C119839945","wikidata":"https://www.wikidata.org/wiki/Q6545185","display_name":"Unique identifier","level":3,"score":0.25360000133514404}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.06999","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.06999","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.06999","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.06999","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"YouTube":[0,10,35,58,80,106,121,141,175,199,227,235],"is":[1,130],"central":[2],"to":[3,16,53,69,78,221],"contemporary":[4],"mass":[5,90],"media.":[6],"However,":[7],"the":[8,17,26,34,40,79,89,93,125,140,151,194,198,231],"official":[9],"API":[11],"does":[12,135],"not":[13,136],"provide":[14],"access":[15],"full":[18],"set":[19],"of":[20,30,39,57,105,120,153,158,173,185,197,226],"creators":[21,59,107,167],"or":[22,50],"creator":[23,42,84],"metadata":[24],"on":[25,92],"platform.":[27,94],"This":[28,65,128],"lack":[29],"basic":[31,223],"visibility":[32],"into":[33],"ecosystem":[36],"hinders":[37],"understanding":[38],"platform's":[41],"economy.":[43],"Researchers":[44],"currently":[45],"have":[46],"no":[47],"easy,":[48],"transparent,":[49],"replicable":[51,133],"way":[52],"construct":[54],"large-scale":[55,102],"datasets":[56],"and":[60,86,108,115,132,134,161,202,230],"their":[61],"audiences":[62],"over":[63,147],"time.":[64,148],"makes":[66],"it":[67],"challenging":[68],"study":[70],"vital":[71],"social":[72],"questions,":[73],"such":[74],"as":[75],"how":[76],"changes":[77],"recommendation":[81],"algorithm":[82],"shape":[83],"incentives":[85],"by":[87,112,207],"extension":[88],"media":[91],"We":[95,149,177],"address":[96],"this":[97],"gap":[98],"with":[99,139,234],"TubeCensus,":[100],"a":[101],"longitudinal":[103],"dataset":[104,210],"subscriber":[109],"counts,":[110],"constructed":[111],"collecting,":[113],"linking,":[114],"organizing":[116],"nearly":[117],"two":[118],"decades":[119],"page":[122],"captures":[123],"from":[124],"Internet":[126,203],"Archive.":[127],"approach":[129],"transparent":[131],"require":[137],"interaction":[138],"API,":[142],"whose":[143],"output":[144],"can":[145],"change":[146],"validate":[150],"coverage":[152,184],"TubeCensus":[154,181],"against":[155],"prior":[156],"estimates":[157],"YouTube's":[159],"size":[160],"find":[162,179],"that":[163,180],"our":[164,209,219],"resource":[165,220],"includes":[166],"responsible":[168],"for":[169],"at":[170],"least":[171],"30-36%":[172],"all":[174],"content.":[176],"also":[178],"provides":[182],"good":[183],"prominent":[186],"creators.":[187],"To":[188],"support":[189],"future":[190],"research,":[191],"we":[192,217],"hide":[193],"substantial":[195],"complexities":[196],"identifier":[200],"system":[201,206],"Archive":[204],"capture":[205],"distributing":[208],"via":[211],"an":[212],"easy-to-use":[213],"pip":[214],"package.":[215],"Finally,":[216],"use":[218],"complete":[222],"exploratory":[224],"analysis":[225],"channel":[228,236],"content":[229],"mechanisms":[232],"associated":[233],"growth.":[237]},"counts_by_year":[],"updated_date":"2026-05-12T06:14:25.881160","created_date":"2026-05-12T00:00:00"}
