{"id":"https://openalex.org/W2233301138","doi":"https://doi.org/10.1186/s40537-015-0037-9","title":"Mining Chinese social media UGC: a big-data framework for analyzing Douban movie reviews","display_name":"Mining Chinese social media UGC: a big-data framework for analyzing Douban movie reviews","publication_year":2016,"publication_date":"2016-01-13","ids":{"openalex":"https://openalex.org/W2233301138","doi":"https://doi.org/10.1186/s40537-015-0037-9","mag":"2233301138"},"language":"en","primary_location":{"id":"doi:10.1186/s40537-015-0037-9","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-015-0037-9","pdf_url":"https://journalofbigdata.springeropen.com/track/pdf/10.1186/s40537-015-0037-9","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://journalofbigdata.springeropen.com/track/pdf/10.1186/s40537-015-0037-9","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101445040","display_name":"Jie Yang","orcid":"https://orcid.org/0000-0003-1317-8142"},"institutions":[{"id":"https://openalex.org/I204824540","display_name":"University of Wollongong","ror":"https://ror.org/00jtmb277","country_code":"AU","type":"education","lineage":["https://openalex.org/I204824540"]}],"countries":["AU"],"is_corresponding":true,"raw_author_name":"Jie Yang","raw_affiliation_strings":["SMART Infrastructure Facility, Faculty of Engineering and Information Sciences, University of Wollongong, Northfields Avenue, Wollongong, NSW, 2522, Australia","SMART Infrastructure Facility, Faculty of Engineering and Information Sciences, University of Wollongong, Wollongong, Australia"],"affiliations":[{"raw_affiliation_string":"SMART Infrastructure Facility, Faculty of Engineering and Information Sciences, University of Wollongong, Northfields Avenue, Wollongong, NSW, 2522, Australia","institution_ids":["https://openalex.org/I204824540"]},{"raw_affiliation_string":"SMART Infrastructure Facility, Faculty of Engineering and Information Sciences, University of Wollongong, Wollongong, Australia","institution_ids":["https://openalex.org/I204824540"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5072791093","display_name":"Brian Yecies","orcid":"https://orcid.org/0000-0001-9296-6651"},"institutions":[{"id":"https://openalex.org/I204824540","display_name":"University of Wollongong","ror":"https://ror.org/00jtmb277","country_code":"AU","type":"education","lineage":["https://openalex.org/I204824540"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Brian Yecies","raw_affiliation_strings":["School of Humanities and Social Inquiry, Faculty of Law, Humanities and the Arts, University of Wollongong, Northfields Avenue, Wollongong, NSW, 2522, Australia","School of Humanities and Social Inquiry, Faculty of Law, Humanities and the Arts, University of Wollongong, Wollongong, Australia"],"affiliations":[{"raw_affiliation_string":"School of Humanities and Social Inquiry, Faculty of Law, Humanities and the Arts, University of Wollongong, Northfields Avenue, Wollongong, NSW, 2522, Australia","institution_ids":["https://openalex.org/I204824540"]},{"raw_affiliation_string":"School of Humanities and Social Inquiry, Faculty of Law, Humanities and the Arts, University of Wollongong, Wollongong, Australia","institution_ids":["https://openalex.org/I204824540"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5101445040"],"corresponding_institution_ids":["https://openalex.org/I204824540"],"apc_list":{"value":1060,"currency":"GBP","value_usd":1300},"apc_paid":{"value":1060,"currency":"GBP","value_usd":1300},"fwci":22.8972,"has_fulltext":true,"cited_by_count":56,"citation_normalized_percentile":{"value":0.99175941,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"3","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10609","display_name":"Digital Marketing and Social Media","score":0.9907000064849854,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10609","display_name":"Digital Marketing and Social Media","score":0.9907000064849854,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9882000088691711,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.986299991607666,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.856285572052002},{"id":"https://openalex.org/keywords/social-media","display_name":"Social media","score":0.6871089935302734},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.6132573485374451},{"id":"https://openalex.org/keywords/popularity","display_name":"Popularity","score":0.5562295913696289},{"id":"https://openalex.org/keywords/asynchronous-communication","display_name":"Asynchronous communication","score":0.5288169384002686},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.48947441577911377},{"id":"https://openalex.org/keywords/raw-data","display_name":"Raw data","score":0.44300875067710876},{"id":"https://openalex.org/keywords/web-crawler","display_name":"Web crawler","score":0.4410141706466675},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.42168253660202026},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.2625952363014221}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.856285572052002},{"id":"https://openalex.org/C518677369","wikidata":"https://www.wikidata.org/wiki/Q202833","display_name":"Social media","level":2,"score":0.6871089935302734},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.6132573485374451},{"id":"https://openalex.org/C2780586970","wikidata":"https://www.wikidata.org/wiki/Q1357284","display_name":"Popularity","level":2,"score":0.5562295913696289},{"id":"https://openalex.org/C151319957","wikidata":"https://www.wikidata.org/wiki/Q752739","display_name":"Asynchronous communication","level":2,"score":0.5288169384002686},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.48947441577911377},{"id":"https://openalex.org/C132964779","wikidata":"https://www.wikidata.org/wiki/Q2110223","display_name":"Raw data","level":2,"score":0.44300875067710876},{"id":"https://openalex.org/C13743948","wikidata":"https://www.wikidata.org/wiki/Q45842","display_name":"Web crawler","level":2,"score":0.4410141706466675},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.42168253660202026},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2625952363014221},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1186/s40537-015-0037-9","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-015-0037-9","pdf_url":"https://journalofbigdata.springeropen.com/track/pdf/10.1186/s40537-015-0037-9","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},{"id":"pmh:oai:ro.uow.edu.au:lhapapers-3749","is_oa":false,"landing_page_url":"https://ro.uow.edu.au/lhapapers/2738","pdf_url":null,"source":{"id":"https://openalex.org/S4306400510","display_name":"Research Online (University of Wollongong)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I204824540","host_organization_name":"University of Wollongong","host_organization_lineage":["https://openalex.org/I204824540"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Faculty of Law, Humanities and the Arts - Papers (Archive)","raw_type":"article"},{"id":"pmh:oai:figshare.com:article/27766839","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4377196282","display_name":"Figshare","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210132348","host_organization_name":"Figshare (United Kingdom)","host_organization_lineage":["https://openalex.org/I4210132348"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.1186/s40537-015-0037-9","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-015-0037-9","pdf_url":"https://journalofbigdata.springeropen.com/track/pdf/10.1186/s40537-015-0037-9","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2233301138.pdf","grobid_xml":"https://content.openalex.org/works/W2233301138.grobid-xml"},"referenced_works_count":48,"referenced_works":["https://openalex.org/W626233317","https://openalex.org/W1484413656","https://openalex.org/W1499121225","https://openalex.org/W1583082330","https://openalex.org/W1606710192","https://openalex.org/W1623534659","https://openalex.org/W1880280183","https://openalex.org/W1952928510","https://openalex.org/W1983111533","https://openalex.org/W1993335727","https://openalex.org/W1995797177","https://openalex.org/W1998199407","https://openalex.org/W2000497899","https://openalex.org/W2021843073","https://openalex.org/W2035064075","https://openalex.org/W2037965136","https://openalex.org/W2058292883","https://openalex.org/W2059503205","https://openalex.org/W2067505258","https://openalex.org/W2069539533","https://openalex.org/W2071222832","https://openalex.org/W2083680523","https://openalex.org/W2087103452","https://openalex.org/W2094547854","https://openalex.org/W2095535748","https://openalex.org/W2100406636","https://openalex.org/W2111620038","https://openalex.org/W2120890992","https://openalex.org/W2121043186","https://openalex.org/W2127757685","https://openalex.org/W2129714679","https://openalex.org/W2134802138","https://openalex.org/W2140864287","https://openalex.org/W2140910558","https://openalex.org/W2145955806","https://openalex.org/W2154325488","https://openalex.org/W2160687722","https://openalex.org/W2160932861","https://openalex.org/W2166445532","https://openalex.org/W2170482468","https://openalex.org/W2181482409","https://openalex.org/W2185520150","https://openalex.org/W2277115990","https://openalex.org/W2394642784","https://openalex.org/W2481003398","https://openalex.org/W2583051850","https://openalex.org/W4255173720","https://openalex.org/W6680750130"],"related_works":["https://openalex.org/W2368605798","https://openalex.org/W2518037665","https://openalex.org/W2348524959","https://openalex.org/W2477036161","https://openalex.org/W2368049389","https://openalex.org/W2384861574","https://openalex.org/W2170801710","https://openalex.org/W2952704802","https://openalex.org/W4294565801","https://openalex.org/W2142306706"],"abstract_inverted_index":{"Analysis":[0],"of":[1,29,56,93,110,141,148,179],"online":[2,66],"user-generated":[3,57],"content":[4,60],"is":[5,49,133],"receiving":[6],"attention":[7],"for":[8,135,152],"its":[9],"wide":[10],"applications":[11],"from":[12,87,156],"both":[13],"academic":[14],"researchers":[15],"and":[16,32,41,99,146,172,177,183],"industry":[17],"stakeholders.":[18],"In":[19,124],"this":[20,169],"pilot":[21],"study,":[22],"we":[23],"address":[24],"common":[25],"Big":[26,45],"Data":[27,46],"problems":[28],"time":[30],"constraints":[31],"memory":[33],"costs":[34],"involved":[35],"with":[36,104],"using":[37],"standard":[38],"single-machine":[39],"hardware":[40],"software.":[42],"A":[43],"novel":[44],"processing":[47],"framework":[48,151],"proposed":[50,134,150],"to":[51,83,90,107,174],"investigate":[52],"a":[53,63,108],"niche":[54,170],"subset":[55],"popular":[58],"culture":[59],"on":[61,102,131],"Douban,":[62],"well-known":[64],"Chinese-language":[65],"social":[67,158],"network.":[68],"Huge":[69],"data":[70],"samples":[71,89],"are":[72],"harvested":[73],"via":[74],"an":[75,126],"asynchronous":[76],"scraping":[77],"crawler.":[78],"We":[79],"also":[80],"discuss":[81],"how":[82],"manipulate":[84],"heterogeneous":[85],"features":[86],"raw":[88],"facilitate":[91],"analysis":[92],"various":[94],"film":[95,122],"details,":[96],"review":[97],"comments,":[98],"user":[100],"profiles":[101],"Douban":[103],"specific":[105],"regard":[106],"wave":[109],"South":[111],"Korean":[112],"films":[113],"(2003\u20132014),":[114],"which":[115,162],"have":[116],"increased":[117],"in":[118,164],"popularity":[119],"among":[120],"Chinese":[121],"fans.":[123],"addition,":[125],"improved":[127],"Apriori":[128],"algorithm":[129],"based":[130],"MapReduce":[132],"content-mining":[136],"functions.":[137],"An":[138],"exploratory":[139],"simulation":[140],"results":[142],"demonstrates":[143],"the":[144,149],"flexibility":[145],"applicability":[147],"extracting":[153],"relevant":[154],"information":[155],"complex":[157],"media":[159,186],"data,":[160],"knowledge":[161],"can":[163],"turn":[165],"be":[166],"extended":[167],"beyond":[168],"dataset":[171],"used":[173],"inform":[175],"producers":[176],"distributors":[178],"films,":[180],"television":[181],"shows,":[182],"other":[184],"digital":[185],"content.":[187]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":15},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":9},{"year":2018,"cited_by_count":5},{"year":2017,"cited_by_count":5},{"year":2016,"cited_by_count":3}],"updated_date":"2026-04-20T07:46:08.049788","created_date":"2025-10-10T00:00:00"}
