{"id":"https://openalex.org/W2758388002","doi":"https://doi.org/10.15439/2017f531","title":"A Web Corpus for eCare: Collection, Lay Annotation and Learning -First Results-","display_name":"A Web Corpus for eCare: Collection, Lay Annotation and Learning -First Results-","publication_year":2017,"publication_date":"2017-09-24","ids":{"openalex":"https://openalex.org/W2758388002","doi":"https://doi.org/10.15439/2017f531","mag":"2758388002"},"language":"en","primary_location":{"id":"doi:10.15439/2017f531","is_oa":true,"landing_page_url":"https://doi.org/10.15439/2017f531","pdf_url":"https://annals-csis.org/proceedings/2017/drp/pdf/531.pdf","source":{"id":"https://openalex.org/S4220651875","display_name":"Annals of Computer Science and Information Systems","issn_l":"2300-5963","issn":["2300-5963"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":"https://openalex.org/P4310317484","host_organization_name":"Polskie Towarzystwo Informatyczne","host_organization_lineage":["https://openalex.org/P4310317484"],"host_organization_lineage_names":["Polskie Towarzystwo Informatyczne"],"type":"conference"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Annals of Computer Science and Information Systems","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://annals-csis.org/proceedings/2017/drp/pdf/531.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5069654949","display_name":"Marina Santini","orcid":"https://orcid.org/0000-0002-5737-8149"},"institutions":[{"id":"https://openalex.org/I102134673","display_name":"Link\u00f6ping University","ror":"https://ror.org/05ynxx418","country_code":"SE","type":"education","lineage":["https://openalex.org/I102134673"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Marina Santini","raw_affiliation_strings":["RISE SICS East, Linkping University Linkping, Sweden","RISE SICS East, \u2020Link\u00f6ping University Link\u00f6ping, Sweden"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"RISE SICS East, Linkping University Linkping, Sweden","institution_ids":["https://openalex.org/I102134673"]},{"raw_affiliation_string":"RISE SICS East, \u2020Link\u00f6ping University Link\u00f6ping, Sweden","institution_ids":["https://openalex.org/I102134673"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053932004","display_name":"Arne J\u00f6nsson","orcid":"https://orcid.org/0000-0001-9852-5531"},"institutions":[{"id":"https://openalex.org/I102134673","display_name":"Link\u00f6ping University","ror":"https://ror.org/05ynxx418","country_code":"SE","type":"education","lineage":["https://openalex.org/I102134673"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Arne J\u00f6nsson","raw_affiliation_strings":["RISE SICS East, \u2020Link\u00f6ping University Link\u00f6ping, Sweden"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"RISE SICS East, \u2020Link\u00f6ping University Link\u00f6ping, Sweden","institution_ids":["https://openalex.org/I102134673"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103555666","display_name":"Mikael Nystr\u00f6m","orcid":null},"institutions":[{"id":"https://openalex.org/I102134673","display_name":"Link\u00f6ping University","ror":"https://ror.org/05ynxx418","country_code":"SE","type":"education","lineage":["https://openalex.org/I102134673"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Mikael Nystr\u00f6m","raw_affiliation_strings":["RISE SICS East, \u2020Link\u00f6ping University Link\u00f6ping, Sweden"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"RISE SICS East, \u2020Link\u00f6ping University Link\u00f6ping, Sweden","institution_ids":["https://openalex.org/I102134673"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5054915833","display_name":"Marjan Alirezai","orcid":null},"institutions":[{"id":"https://openalex.org/I26437253","display_name":"\u00d6rebro University","ror":"https://ror.org/05kytsw45","country_code":"SE","type":"education","lineage":["https://openalex.org/I26437253"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Marjan Alirezai","raw_affiliation_strings":["\u00d6rebro University \u00d6rebro, Sweden"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"\u00d6rebro University \u00d6rebro, Sweden","institution_ids":["https://openalex.org/I26437253"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.2321,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.59739319,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"12","issue":null,"first_page":"71","last_page":"78"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.9950000047683716,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8669719696044922},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6466401815414429},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6054052114486694},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.5952586531639099},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5733327269554138},{"id":"https://openalex.org/keywords/sublanguage","display_name":"Sublanguage","score":0.5307193994522095},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.49387603998184204},{"id":"https://openalex.org/keywords/text-corpus","display_name":"Text corpus","score":0.44687986373901367},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.40223273634910583},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.13454875349998474}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8669719696044922},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6466401815414429},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6054052114486694},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.5952586531639099},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5733327269554138},{"id":"https://openalex.org/C2776411971","wikidata":"https://www.wikidata.org/wiki/Q17141398","display_name":"Sublanguage","level":2,"score":0.5307193994522095},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.49387603998184204},{"id":"https://openalex.org/C2474386","wikidata":"https://www.wikidata.org/wiki/Q461183","display_name":"Text corpus","level":2,"score":0.44687986373901367},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.40223273634910583},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.13454875349998474}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.15439/2017f531","is_oa":true,"landing_page_url":"https://doi.org/10.15439/2017f531","pdf_url":"https://annals-csis.org/proceedings/2017/drp/pdf/531.pdf","source":{"id":"https://openalex.org/S4220651875","display_name":"Annals of Computer Science and Information Systems","issn_l":"2300-5963","issn":["2300-5963"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":"https://openalex.org/P4310317484","host_organization_name":"Polskie Towarzystwo Informatyczne","host_organization_lineage":["https://openalex.org/P4310317484"],"host_organization_lineage_names":["Polskie Towarzystwo Informatyczne"],"type":"conference"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Annals of Computer Science and Information Systems","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.15439/2017f531","is_oa":true,"landing_page_url":"https://doi.org/10.15439/2017f531","pdf_url":"https://annals-csis.org/proceedings/2017/drp/pdf/531.pdf","source":{"id":"https://openalex.org/S4220651875","display_name":"Annals of Computer Science and Information Systems","issn_l":"2300-5963","issn":["2300-5963"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":"https://openalex.org/P4310317484","host_organization_name":"Polskie Towarzystwo Informatyczne","host_organization_lineage":["https://openalex.org/P4310317484"],"host_organization_lineage_names":["Polskie Towarzystwo Informatyczne"],"type":"conference"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Annals of Computer Science and Information Systems","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2758388002.pdf","grobid_xml":"https://content.openalex.org/works/W2758388002.grobid-xml"},"referenced_works_count":24,"referenced_works":["https://openalex.org/W84079877","https://openalex.org/W115481586","https://openalex.org/W136732505","https://openalex.org/W610032745","https://openalex.org/W1550291595","https://openalex.org/W1570448133","https://openalex.org/W1577927940","https://openalex.org/W2006832571","https://openalex.org/W2020777959","https://openalex.org/W2053154970","https://openalex.org/W2073449354","https://openalex.org/W2087926223","https://openalex.org/W2106695714","https://openalex.org/W2122314939","https://openalex.org/W2130585834","https://openalex.org/W2141766660","https://openalex.org/W2170021941","https://openalex.org/W2174606549","https://openalex.org/W2211265567","https://openalex.org/W2336669601","https://openalex.org/W2406081996","https://openalex.org/W6652244895","https://openalex.org/W6663855623","https://openalex.org/W7066577604"],"related_works":["https://openalex.org/W74549753","https://openalex.org/W1513056508","https://openalex.org/W2081289543","https://openalex.org/W4233809365","https://openalex.org/W2578505095","https://openalex.org/W2348452562","https://openalex.org/W2050072000","https://openalex.org/W3163680058","https://openalex.org/W2251724625","https://openalex.org/W3183077996"],"abstract_inverted_index":{"In":[0],"this":[1],"position":[2],"paper,":[3],"we":[4,46,63],"put":[5],"forward":[6],"two":[7,65],"claims:":[8],"1)":[9],"it":[10,30],"is":[11,31,72,108,148],"possible":[12,32],"to":[13,33,159,165],"design":[14],"a":[15,54,73,103,111],"dynamic":[16],"and":[17,51,62],"extensible":[18],"corpus":[19,75,83,107],"without":[20,39],"running":[21],"the":[22,48,127,132,154,157,179,197],"risk":[23],"of":[24,53,76,156,178,182],"getting":[25],"into":[26],"scalability":[27,147],"problems;":[28],"2)":[29],"devise":[34],"noise-resistant":[35],"Language":[36],"Technology":[37],"applications":[38],"affecting":[40],"performance.":[41],"To":[42],"support":[43],"our":[44],"claims,":[45],"describe":[47],"design,":[49],"construction":[50],"limitations":[52],"very":[55],"specialized":[56],"medical":[57,117],"web":[58,77],"corpus,":[59],"called":[60],"eCare_Sv_01,":[61],"present":[64],"experiments":[66],"on":[67],"lay-specialized":[68,172],"text":[69,113],"classification.":[70],"eCare_Sv_01":[71],"small":[74],"documents":[78,85,118,189],"written":[79],"in":[80,92,196],"Swedish.":[81],"The":[82,89,106],"contains":[84],"about":[86],"chronic":[87],"diseases.":[88],"sublanguage":[90],"used":[91],"each":[93],"document":[94],"has":[95],"been":[96],"labelled":[97],"as":[98,110,186],"\"lay\"":[99],"or":[100,190],"\"specialized\"":[101],"by":[102,131,138],"lay":[104,133],"annotator.":[105],"designed":[109],"flexible":[112],"resource,":[114],"where":[115],"additional":[116],"will":[119],"be":[120,160,175],"appended":[121],"over":[122],"time.":[123],"Experiments":[124],"show":[125],"that":[126,146,171],"layspecialized":[128],"labels":[129,173],"assigned":[130],"annotator":[134],"are":[135,194],"reliably":[136],"learned":[137,161,176],"standard":[139],"classifiers.":[140],"More":[141],"specifically,":[142],"Experiment":[143,168],"1":[144],"shows":[145,170],"not":[149],"an":[150],"issue":[151],"when":[152],"increasing":[153],"size":[155],"datasets":[158],"from":[162],"156":[163],"up":[164],"801":[166],"documents.":[167],"2":[169],"can":[174],"regardless":[177],"large":[180],"amount":[181],"disturbing":[183],"factors,":[184],"such":[185],"machine":[187],"translated":[188],"low-quality":[191],"texts,":[192],"which":[193],"numerous":[195],"corpus.":[198]},"counts_by_year":[{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
