{"id":"https://openalex.org/W3007414605","doi":"https://doi.org/10.3233/web-200428","title":"Deep text classification of Instagram data using word embeddings and weak supervision","display_name":"Deep text classification of Instagram data using word embeddings and weak supervision","publication_year":2020,"publication_date":"2020-02-25","ids":{"openalex":"https://openalex.org/W3007414605","doi":"https://doi.org/10.3233/web-200428","mag":"3007414605"},"language":"en","primary_location":{"id":"doi:10.3233/web-200428","is_oa":false,"landing_page_url":"https://doi.org/10.3233/web-200428","pdf_url":null,"source":{"id":"https://openalex.org/S4210183871","display_name":"Web Intelligence","issn_l":"2405-6456","issn":["2405-6456","2405-6464"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310318577","host_organization_name":"IOS Press","host_organization_lineage":["https://openalex.org/P4310318577"],"host_organization_lineage_names":["IOS Press"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Web Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5074576259","display_name":"Kim Hammar","orcid":"https://orcid.org/0000-0003-1773-8354"},"institutions":[{"id":"https://openalex.org/I86987016","display_name":"KTH Royal Institute of Technology","ror":"https://ror.org/026vcq606","country_code":"SE","type":"education","lineage":["https://openalex.org/I86987016"]}],"countries":["SE"],"is_corresponding":true,"raw_author_name":"Kim Hammar","raw_affiliation_strings":["Department of Software and Computer Systems, KTH Royal Institute of Technology, Stockholm, Sweden. E-mails:\u00a0,\u00a0,\u00a0,\u00a0","Department of Software and Computer Systems, KTH Royal Institute of Technology, Stockholm, Sweden. E-mails:\u00a0kimham@kth.se,\u00a0shatha@kth.se,\u00a0nimad@kth.se,\u00a0misha@kth.se"],"affiliations":[{"raw_affiliation_string":"Department of Software and Computer Systems, KTH Royal Institute of Technology, Stockholm, Sweden. E-mails:\u00a0,\u00a0,\u00a0,\u00a0","institution_ids":["https://openalex.org/I86987016"]},{"raw_affiliation_string":"Department of Software and Computer Systems, KTH Royal Institute of Technology, Stockholm, Sweden. E-mails:\u00a0kimham@kth.se,\u00a0shatha@kth.se,\u00a0nimad@kth.se,\u00a0misha@kth.se","institution_ids":["https://openalex.org/I86987016"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006122675","display_name":"Shatha Jaradat","orcid":null},"institutions":[{"id":"https://openalex.org/I86987016","display_name":"KTH Royal Institute of Technology","ror":"https://ror.org/026vcq606","country_code":"SE","type":"education","lineage":["https://openalex.org/I86987016"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Shatha Jaradat","raw_affiliation_strings":["Department of Software and Computer Systems, KTH Royal Institute of Technology, Stockholm, Sweden. E-mails:\u00a0,\u00a0,\u00a0,\u00a0","Department of Software and Computer Systems, KTH Royal Institute of Technology, Stockholm, Sweden. E-mails:\u00a0kimham@kth.se,\u00a0shatha@kth.se,\u00a0nimad@kth.se,\u00a0misha@kth.se"],"affiliations":[{"raw_affiliation_string":"Department of Software and Computer Systems, KTH Royal Institute of Technology, Stockholm, Sweden. E-mails:\u00a0,\u00a0,\u00a0,\u00a0","institution_ids":["https://openalex.org/I86987016"]},{"raw_affiliation_string":"Department of Software and Computer Systems, KTH Royal Institute of Technology, Stockholm, Sweden. E-mails:\u00a0kimham@kth.se,\u00a0shatha@kth.se,\u00a0nimad@kth.se,\u00a0misha@kth.se","institution_ids":["https://openalex.org/I86987016"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085085036","display_name":"Nima Dokoohaki","orcid":"https://orcid.org/0000-0003-2339-2337"},"institutions":[{"id":"https://openalex.org/I86987016","display_name":"KTH Royal Institute of Technology","ror":"https://ror.org/026vcq606","country_code":"SE","type":"education","lineage":["https://openalex.org/I86987016"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Nima Dokoohaki","raw_affiliation_strings":["Department of Software and Computer Systems, KTH Royal Institute of Technology, Stockholm, Sweden. E-mails:\u00a0,\u00a0,\u00a0,\u00a0","Department of Software and Computer Systems, KTH Royal Institute of Technology, Stockholm, Sweden. E-mails:\u00a0kimham@kth.se,\u00a0shatha@kth.se,\u00a0nimad@kth.se,\u00a0misha@kth.se"],"affiliations":[{"raw_affiliation_string":"Department of Software and Computer Systems, KTH Royal Institute of Technology, Stockholm, Sweden. E-mails:\u00a0,\u00a0,\u00a0,\u00a0","institution_ids":["https://openalex.org/I86987016"]},{"raw_affiliation_string":"Department of Software and Computer Systems, KTH Royal Institute of Technology, Stockholm, Sweden. E-mails:\u00a0kimham@kth.se,\u00a0shatha@kth.se,\u00a0nimad@kth.se,\u00a0misha@kth.se","institution_ids":["https://openalex.org/I86987016"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5056152467","display_name":"Mihhail Matskin","orcid":null},"institutions":[{"id":"https://openalex.org/I86987016","display_name":"KTH Royal Institute of Technology","ror":"https://ror.org/026vcq606","country_code":"SE","type":"education","lineage":["https://openalex.org/I86987016"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Mihhail Matskin","raw_affiliation_strings":["Department of Software and Computer Systems, KTH Royal Institute of Technology, Stockholm, Sweden. E-mails:\u00a0,\u00a0,\u00a0,\u00a0","Department of Software and Computer Systems, KTH Royal Institute of Technology, Stockholm, Sweden. E-mails:\u00a0kimham@kth.se,\u00a0shatha@kth.se,\u00a0nimad@kth.se,\u00a0misha@kth.se"],"affiliations":[{"raw_affiliation_string":"Department of Software and Computer Systems, KTH Royal Institute of Technology, Stockholm, Sweden. E-mails:\u00a0,\u00a0,\u00a0,\u00a0","institution_ids":["https://openalex.org/I86987016"]},{"raw_affiliation_string":"Department of Software and Computer Systems, KTH Royal Institute of Technology, Stockholm, Sweden. E-mails:\u00a0kimham@kth.se,\u00a0shatha@kth.se,\u00a0nimad@kth.se,\u00a0misha@kth.se","institution_ids":["https://openalex.org/I86987016"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5074576259"],"corresponding_institution_ids":["https://openalex.org/I86987016"],"apc_list":null,"apc_paid":null,"fwci":0.5481,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.72371461,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"18","issue":"1","first_page":"53","last_page":"67"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11644","display_name":"Spam and Phishing Detection","score":0.996399998664856,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/social-media","display_name":"Social media","score":0.7025045156478882},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6947447061538696},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.610328733921051},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5322059988975525},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5178430676460266},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4631807804107666},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.4286845922470093},{"id":"https://openalex.org/keywords/sentiment-analysis","display_name":"Sentiment analysis","score":0.41982078552246094},{"id":"https://openalex.org/keywords/clothing","display_name":"Clothing","score":0.41195985674858093},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3928992748260498},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.3013058304786682},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.0943063497543335}],"concepts":[{"id":"https://openalex.org/C518677369","wikidata":"https://www.wikidata.org/wiki/Q202833","display_name":"Social media","level":2,"score":0.7025045156478882},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6947447061538696},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.610328733921051},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5322059988975525},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5178430676460266},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4631807804107666},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.4286845922470093},{"id":"https://openalex.org/C66402592","wikidata":"https://www.wikidata.org/wiki/Q2271421","display_name":"Sentiment analysis","level":2,"score":0.41982078552246094},{"id":"https://openalex.org/C530175646","wikidata":"https://www.wikidata.org/wiki/Q11460","display_name":"Clothing","level":2,"score":0.41195985674858093},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3928992748260498},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.3013058304786682},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0943063497543335},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0},{"id":"https://openalex.org/C95457728","wikidata":"https://www.wikidata.org/wiki/Q309","display_name":"History","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.3233/web-200428","is_oa":false,"landing_page_url":"https://doi.org/10.3233/web-200428","pdf_url":null,"source":{"id":"https://openalex.org/S4210183871","display_name":"Web Intelligence","issn_l":"2405-6456","issn":["2405-6456","2405-6464"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310318577","host_organization_name":"IOS Press","host_organization_lineage":["https://openalex.org/P4310318577"],"host_organization_lineage_names":["IOS Press"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Web Intelligence","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W560371024","https://openalex.org/W1647671624","https://openalex.org/W1832693441","https://openalex.org/W1854884267","https://openalex.org/W2053921957","https://openalex.org/W2123661878","https://openalex.org/W2124637492","https://openalex.org/W2137349054","https://openalex.org/W2143017621","https://openalex.org/W2153848201","https://openalex.org/W2153853937","https://openalex.org/W2157765050","https://openalex.org/W2158899491","https://openalex.org/W2169200297","https://openalex.org/W2250539671","https://openalex.org/W2404161646","https://openalex.org/W2493916176","https://openalex.org/W2515248967","https://openalex.org/W2746086086","https://openalex.org/W2769041395","https://openalex.org/W2899941041","https://openalex.org/W2910198407","https://openalex.org/W2952230511","https://openalex.org/W2963291843","https://openalex.org/W2963801581","https://openalex.org/W2964046515","https://openalex.org/W3104718125","https://openalex.org/W3216404684","https://openalex.org/W6677237759"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2738456166","https://openalex.org/W2352745894","https://openalex.org/W2057731951","https://openalex.org/W2358836583","https://openalex.org/W2387983088","https://openalex.org/W2135888309","https://openalex.org/W3080469217","https://openalex.org/W791876968","https://openalex.org/W2022897160"],"abstract_inverted_index":{"With":[0,127,149],"the":[1,21,34,106,124,174,195,199,208],"advent":[2],"of":[3,11,20,33,58,95,102,135,190,197,202],"social":[4,23,41],"media,":[5],"our":[6,128],"online":[7],"feeds":[8],"increasingly":[9],"consist":[10],"short,":[12],"informal,":[13],"and":[14,29,49,80,109],"unstructured":[15],"text.":[16,97,126],"Instagram":[17,59,96,103,120,203],"is":[18,43,77,145,192,212],"one":[19],"largest":[22],"media":[24,42],"platforms,":[25],"containing":[26],"both":[27,78],"text":[28,38,56,63,93],"images.":[30],"However,":[31],"most":[32],"prior":[35],"research":[36],"on":[37,45,67,123,194,207,213],"processing":[39],"in":[40,75,133,160,180],"focused":[44],"analyzing":[46],"Twitter":[47],"data,":[48,138],"little":[50],"attention":[51],"has":[52],"been":[53],"paid":[54],"to":[55,82,118,142,155,168],"mining":[57,64],"data.":[60],"Moreover,":[61],"many":[62],"methods":[65,89],"rely":[66],"training":[68,137],"data":[69],"annotated":[70,136],"manually":[71],"by":[72],"humans,":[73],"which":[74,211],"practice":[76],"difficult":[79],"expensive":[81],"obtain.":[83],"In":[84],"this":[85],"paper,":[86],"we":[87,130,152],"present":[88],"for":[90],"weakly":[91],"supervised":[92],"classification":[94],"We":[98],"analyze":[99],"a":[100,111,146,157],"corpora":[101],"posts":[104,121,204],"from":[105],"fashion":[107],"domain":[108],"train":[110,143],"deep":[112],"clothing":[113],"classifier":[114],"with":[115,170,177,182,215],"weak":[116,140,150,178],"supervision":[117,141,151,179],"classify":[119],"based":[122,205],"associated":[125,209],"experiments,":[129],"demonstrate":[131],"that":[132,163],"absence":[134],"using":[139],"models":[144],"viable":[147],"approach.":[148],"were":[153],"able":[154],"label":[156],"large":[158],"dataset":[159,175],"hours,":[161],"something":[162],"would":[164],"have":[165],"taken":[166],"months":[167],"do":[169],"human":[171,216],"annotators.":[172],"Using":[173],"labeled":[176],"combination":[181],"generative":[183],"modeling,":[184],"an":[185],"[Formula:":[186],"see":[187],"text]":[188],"score":[189],"0.61":[191],"achieved":[193],"task":[196],"classifying":[198],"image":[200],"contents":[201],"solely":[206],"text,":[210],"level":[214],"performance.":[217]},"counts_by_year":[{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2012,"cited_by_count":1}],"updated_date":"2026-03-03T06:13:14.889584","created_date":"2025-10-10T00:00:00"}
