{"id":"https://openalex.org/W2064486843","doi":"https://doi.org/10.1007/s10579-013-9227-2","title":"Twitter n-gram corpus with demographic metadata","display_name":"Twitter n-gram corpus with demographic metadata","publication_year":2013,"publication_date":"2013-04-17","ids":{"openalex":"https://openalex.org/W2064486843","doi":"https://doi.org/10.1007/s10579-013-9227-2","mag":"2064486843"},"language":"en","primary_location":{"id":"doi:10.1007/s10579-013-9227-2","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10579-013-9227-2","pdf_url":null,"source":{"id":"https://openalex.org/S4306424877","display_name":"Language Resources and Evaluation","issn_l":"1574-020X","issn":["1574-020X","1574-0218"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Language Resources and Evaluation","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.1007/s10579-013-9227-2","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5002546244","display_name":"Ama\u00e7 Herda\u011fdelen","orcid":"https://orcid.org/0000-0001-6402-1407"},"institutions":[{"id":"https://openalex.org/I193223587","display_name":"University of Trento","ror":"https://ror.org/05trd4x28","country_code":"IT","type":"education","lineage":["https://openalex.org/I193223587"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Ama\u00e7 Herda\u011fdelen","raw_affiliation_strings":["CIMeC, University of Trento, Rovereto, Italy","Facebook Inc., Menlo Park, USA 94025 and CIMeC, University of Trento, Rovereto, Italy#TAB#"],"affiliations":[{"raw_affiliation_string":"CIMeC, University of Trento, Rovereto, Italy","institution_ids":["https://openalex.org/I193223587"]},{"raw_affiliation_string":"Facebook Inc., Menlo Park, USA 94025 and CIMeC, University of Trento, Rovereto, Italy#TAB#","institution_ids":["https://openalex.org/I193223587"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5002546244"],"corresponding_institution_ids":["https://openalex.org/I193223587"],"apc_list":null,"apc_paid":null,"fwci":6.8637,"has_fulltext":false,"cited_by_count":30,"citation_normalized_percentile":{"value":0.96316833,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":"47","issue":"4","first_page":"1127","last_page":"1147"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10557","display_name":"Social Media and Politics","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/3315","display_name":"Communication"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10557","display_name":"Social Media and Politics","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/3315","display_name":"Communication"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12380","display_name":"Authorship Attribution and Profiling","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":0.9836999773979187,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/metadata","display_name":"Metadata","score":0.8976829051971436},{"id":"https://openalex.org/keywords/social-media","display_name":"Social media","score":0.6558351516723633},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.595115065574646},{"id":"https://openalex.org/keywords/variety","display_name":"Variety (cybernetics)","score":0.5863005518913269},{"id":"https://openalex.org/keywords/n-gram","display_name":"n-gram","score":0.5497727990150452},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.5473669767379761},{"id":"https://openalex.org/keywords/gram","display_name":"Gram","score":0.4404154419898987},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.2555065155029297},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.18578267097473145},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.10741713643074036},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.07901903986930847}],"concepts":[{"id":"https://openalex.org/C93518851","wikidata":"https://www.wikidata.org/wiki/Q180160","display_name":"Metadata","level":2,"score":0.8976829051971436},{"id":"https://openalex.org/C518677369","wikidata":"https://www.wikidata.org/wiki/Q202833","display_name":"Social media","level":2,"score":0.6558351516723633},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.595115065574646},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.5863005518913269},{"id":"https://openalex.org/C117884012","wikidata":"https://www.wikidata.org/wiki/Q94489","display_name":"n-gram","level":3,"score":0.5497727990150452},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.5473669767379761},{"id":"https://openalex.org/C161369605","wikidata":"https://www.wikidata.org/wiki/Q41803","display_name":"Gram","level":3,"score":0.4404154419898987},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.2555065155029297},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.18578267097473145},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.10741713643074036},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.07901903986930847},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.0},{"id":"https://openalex.org/C523546767","wikidata":"https://www.wikidata.org/wiki/Q10876","display_name":"Bacteria","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s10579-013-9227-2","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10579-013-9227-2","pdf_url":null,"source":{"id":"https://openalex.org/S4306424877","display_name":"Language Resources and Evaluation","issn_l":"1574-020X","issn":["1574-020X","1574-0218"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Language Resources and Evaluation","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1007/s10579-013-9227-2","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10579-013-9227-2","pdf_url":null,"source":{"id":"https://openalex.org/S4306424877","display_name":"Language Resources and Evaluation","issn_l":"1574-020X","issn":["1574-020X","1574-0218"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Language Resources and Evaluation","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Gender equality","score":0.47999998927116394,"id":"https://metadata.un.org/sdg/5"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":58,"referenced_works":["https://openalex.org/W9223698","https://openalex.org/W91442942","https://openalex.org/W154079225","https://openalex.org/W195681115","https://openalex.org/W205260337","https://openalex.org/W1522263329","https://openalex.org/W1574454071","https://openalex.org/W1590495275","https://openalex.org/W1603920809","https://openalex.org/W1752870744","https://openalex.org/W1800296434","https://openalex.org/W1966703356","https://openalex.org/W1969568357","https://openalex.org/W1976323204","https://openalex.org/W1996802155","https://openalex.org/W2004214228","https://openalex.org/W2008803468","https://openalex.org/W2019096529","https://openalex.org/W2032420854","https://openalex.org/W2033444463","https://openalex.org/W2044688197","https://openalex.org/W2048064382","https://openalex.org/W2074835059","https://openalex.org/W2096438711","https://openalex.org/W2102764191","https://openalex.org/W2110302976","https://openalex.org/W2112056172","https://openalex.org/W2113641473","https://openalex.org/W2124499489","https://openalex.org/W2126176556","https://openalex.org/W2139575250","https://openalex.org/W2145139979","https://openalex.org/W2145639447","https://openalex.org/W2145833060","https://openalex.org/W2146341589","https://openalex.org/W2155870214","https://openalex.org/W2157765050","https://openalex.org/W2159397589","https://openalex.org/W2160164169","https://openalex.org/W2165044314","https://openalex.org/W2167102709","https://openalex.org/W2168332560","https://openalex.org/W2250489604","https://openalex.org/W2292907674","https://openalex.org/W2396764674","https://openalex.org/W2591619550","https://openalex.org/W2962860893","https://openalex.org/W3154772965","https://openalex.org/W4241452721","https://openalex.org/W4285719527","https://openalex.org/W6603689333","https://openalex.org/W6607985903","https://openalex.org/W6608350269","https://openalex.org/W6669121539","https://openalex.org/W6676670208","https://openalex.org/W6684102810","https://openalex.org/W6712568582","https://openalex.org/W6724331316"],"related_works":["https://openalex.org/W2906970013","https://openalex.org/W3126081632","https://openalex.org/W2088254117","https://openalex.org/W4254593385","https://openalex.org/W2790582133","https://openalex.org/W1901380241","https://openalex.org/W4247016990","https://openalex.org/W2789473152","https://openalex.org/W3132255358","https://openalex.org/W1575504723"],"abstract_inverted_index":{"Social":[0],"media":[1],"is":[2],"a":[3,31,47,70,84,107,114],"natural":[4],"laboratory":[5],"for":[6],"linguistic":[7],"and":[8,28,58,95,112],"sociological":[9],"purposes.":[10],"In":[11,75],"micro-blogging":[12,66],"platforms":[13],"such":[14],"as":[15],"Twitter,":[16],"people":[17],"share":[18],"hundreds":[19],"of":[20,22,50,63,89,121],"millions":[21],"short":[23],"messages":[24],"about":[25,39],"their":[26,40],"lives":[27],"experiences":[29],"on":[30],"daily":[32],"basis.":[33],"These":[34],"messages,":[35,91],"coupled":[36],"with":[37,99,126],"metadata":[38],"authors,":[41],"provide":[42],"an":[43,123],"opportunity":[44],"to":[45,56,72,106],"understand":[46],"wide":[48],"variety":[49],"phenomena":[51],"ranging":[52],"from":[53],"political":[54],"polarization":[55],"geographic":[57],"demographic":[59,127],"lexical":[60],"variation.":[61],"Lack":[62],"publicly":[64,85],"available":[65,86],"datasets":[67],"has":[68],"been":[69],"hindrance":[71],"replicable":[73],"research.":[74],"this":[76,104],"paper,":[77],"I":[78,102],"introduce":[79],"Rovereto":[80],"Twitter":[81,90],"n-gram":[82,87,124],"corpus,":[83],"dataset":[88,105],"which":[92,117],"contains":[93],"gender-of-the-author":[94],"time-of-posting":[96],"tags":[97],"associated":[98],"the":[100,119],"n-grams.":[101],"compare":[103],"more":[108],"traditional":[109],"web-based":[110],"corpus":[111,125],"present":[113],"case":[115],"study":[116],"shows":[118],"potential":[120],"combining":[122],"metadata.":[128]},"counts_by_year":[{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":4},{"year":2017,"cited_by_count":4},{"year":2016,"cited_by_count":4},{"year":2015,"cited_by_count":4},{"year":2014,"cited_by_count":2},{"year":2013,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
