{"id":"https://openalex.org/W2962605866","doi":"https://doi.org/10.1108/el-08-2018-0165","title":"Selecting a text similarity measure for a content-based recommender system","display_name":"Selecting a text similarity measure for a content-based recommender system","publication_year":2019,"publication_date":"2019-07-08","ids":{"openalex":"https://openalex.org/W2962605866","doi":"https://doi.org/10.1108/el-08-2018-0165","mag":"2962605866"},"language":"en","primary_location":{"id":"doi:10.1108/el-08-2018-0165","is_oa":false,"landing_page_url":"https://doi.org/10.1108/el-08-2018-0165","pdf_url":null,"source":{"id":"https://openalex.org/S902750600","display_name":"The Electronic Library","issn_l":"0264-0473","issn":["0264-0473","1758-616X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319811","host_organization_name":"Emerald Publishing Limited","host_organization_lineage":["https://openalex.org/P4310319811"],"host_organization_lineage_names":["Emerald Publishing Limited"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The Electronic Library","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5037523672","display_name":"Manjula Wijewickrema","orcid":"https://orcid.org/0000-0003-4922-098X"},"institutions":[{"id":"https://openalex.org/I39343248","display_name":"Humboldt-Universit\u00e4t zu Berlin","ror":"https://ror.org/01hcx6992","country_code":"DE","type":"education","lineage":["https://openalex.org/I39343248"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Manjula Wijewickrema","raw_affiliation_strings":["Berlin School of Library and Information Science, Humboldt University of Berlin, Germany"],"affiliations":[{"raw_affiliation_string":"Berlin School of Library and Information Science, Humboldt University of Berlin, Germany","institution_ids":["https://openalex.org/I39343248"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051093555","display_name":"Vivien Petras","orcid":"https://orcid.org/0000-0002-8113-1509"},"institutions":[{"id":"https://openalex.org/I39343248","display_name":"Humboldt-Universit\u00e4t zu Berlin","ror":"https://ror.org/01hcx6992","country_code":"DE","type":"education","lineage":["https://openalex.org/I39343248"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Vivien Petras","raw_affiliation_strings":["Berlin School of Library and Information Science, Humboldt University of Berlin, Germany"],"affiliations":[{"raw_affiliation_string":"Berlin School of Library and Information Science, Humboldt University of Berlin, Germany","institution_ids":["https://openalex.org/I39343248"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5110702200","display_name":"N.G.J. Dias","orcid":null},"institutions":[{"id":"https://openalex.org/I142651801","display_name":"University of Kelaniya","ror":"https://ror.org/02r91my29","country_code":"LK","type":"education","lineage":["https://openalex.org/I142651801"]}],"countries":["LK"],"is_corresponding":false,"raw_author_name":"Naomal Dias","raw_affiliation_strings":["Department of Computer Systems Engineering, University of Kelaniya, Kelaniya, Sri Lanka"],"affiliations":[{"raw_affiliation_string":"Department of Computer Systems Engineering, University of Kelaniya, Kelaniya, Sri Lanka","institution_ids":["https://openalex.org/I142651801"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5037523672"],"corresponding_institution_ids":["https://openalex.org/I39343248"],"apc_list":null,"apc_paid":null,"fwci":1.0111,"has_fulltext":false,"cited_by_count":11,"citation_normalized_percentile":{"value":0.82665872,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":"ahead-of-print","issue":"ahead-of-print","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cosine-similarity","display_name":"Cosine similarity","score":0.8690536022186279},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7846524715423584},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.7194740772247314},{"id":"https://openalex.org/keywords/recommender-system","display_name":"Recommender system","score":0.642778754234314},{"id":"https://openalex.org/keywords/vocabulary","display_name":"Vocabulary","score":0.5786311626434326},{"id":"https://openalex.org/keywords/similarity-measure","display_name":"Similarity measure","score":0.572446882724762},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5700031518936157},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5538783669471741},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5505169630050659},{"id":"https://openalex.org/keywords/semantic-similarity","display_name":"Semantic similarity","score":0.5396144390106201},{"id":"https://openalex.org/keywords/measure","display_name":"Measure (data warehouse)","score":0.5025410652160645},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.41146695613861084},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.18599900603294373},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.1660541594028473},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.15696263313293457},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.10705411434173584}],"concepts":[{"id":"https://openalex.org/C2780762811","wikidata":"https://www.wikidata.org/wiki/Q1784941","display_name":"Cosine similarity","level":3,"score":0.8690536022186279},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7846524715423584},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.7194740772247314},{"id":"https://openalex.org/C557471498","wikidata":"https://www.wikidata.org/wiki/Q554950","display_name":"Recommender system","level":2,"score":0.642778754234314},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.5786311626434326},{"id":"https://openalex.org/C2776517306","wikidata":"https://www.wikidata.org/wiki/Q29017317","display_name":"Similarity measure","level":2,"score":0.572446882724762},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5700031518936157},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5538783669471741},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5505169630050659},{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.5396144390106201},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.5025410652160645},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.41146695613861084},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.18599900603294373},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.1660541594028473},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.15696263313293457},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.10705411434173584},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1108/el-08-2018-0165","is_oa":false,"landing_page_url":"https://doi.org/10.1108/el-08-2018-0165","pdf_url":null,"source":{"id":"https://openalex.org/S902750600","display_name":"The Electronic Library","issn_l":"0264-0473","issn":["0264-0473","1758-616X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319811","host_organization_name":"Emerald Publishing Limited","host_organization_lineage":["https://openalex.org/P4310319811"],"host_organization_lineage_names":["Emerald Publishing Limited"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The Electronic Library","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","score":0.8500000238418579,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":57,"referenced_works":["https://openalex.org/W8870360","https://openalex.org/W1601266066","https://openalex.org/W1826790618","https://openalex.org/W1846261984","https://openalex.org/W1965367439","https://openalex.org/W1969232170","https://openalex.org/W1972594981","https://openalex.org/W1982643343","https://openalex.org/W1982889956","https://openalex.org/W1992577265","https://openalex.org/W1993318811","https://openalex.org/W2007280555","https://openalex.org/W2014415866","https://openalex.org/W2015690580","https://openalex.org/W2039447541","https://openalex.org/W2045929671","https://openalex.org/W2061261643","https://openalex.org/W2068395167","https://openalex.org/W2069870183","https://openalex.org/W2076506714","https://openalex.org/W2082179583","https://openalex.org/W2082815071","https://openalex.org/W2085030399","https://openalex.org/W2093390569","https://openalex.org/W2098608698","https://openalex.org/W2099781321","https://openalex.org/W2105276905","https://openalex.org/W2108024108","https://openalex.org/W2108934940","https://openalex.org/W2114597819","https://openalex.org/W2129971563","https://openalex.org/W2140880926","https://openalex.org/W2145940953","https://openalex.org/W2151629867","https://openalex.org/W2156695938","https://openalex.org/W2157807817","https://openalex.org/W2168812139","https://openalex.org/W2171313960","https://openalex.org/W2172263659","https://openalex.org/W2174052796","https://openalex.org/W2295077356","https://openalex.org/W2332951940","https://openalex.org/W2335622251","https://openalex.org/W2407920565","https://openalex.org/W2463824207","https://openalex.org/W2497122656","https://openalex.org/W2498452554","https://openalex.org/W2571930895","https://openalex.org/W2578757680","https://openalex.org/W2613302129","https://openalex.org/W2742389902","https://openalex.org/W2745813871","https://openalex.org/W2783915166","https://openalex.org/W2790231300","https://openalex.org/W2809716804","https://openalex.org/W4252060112","https://openalex.org/W6624664881"],"related_works":["https://openalex.org/W2951075339","https://openalex.org/W1966742602","https://openalex.org/W4226161247","https://openalex.org/W3134944010","https://openalex.org/W2135511601","https://openalex.org/W2394168050","https://openalex.org/W2284045667","https://openalex.org/W57923944","https://openalex.org/W2056226831","https://openalex.org/W1598081081"],"abstract_inverted_index":{"Purpose":[0],"The":[1,36,95,109,117,139],"purpose":[2],"of":[3,41,49,52,80,126,150,161,167,189,192],"this":[4],"paper":[5],"is":[6,180],"to":[7,185],"develop":[8],"a":[9,19,65,68,190],"journal":[10,24,69,75,200],"recommender":[11,70,201],"system,":[12],"which":[13],"compares":[14],"the":[15,22,31,39,47,89,101,114,130,159,165,181,187],"content":[16],"similarities":[17],"between":[18,123],"manuscript":[20],"and":[21,34,46,85,103,132,153,176],"existing":[23],"articles":[25],"in":[26,164],"two":[27,73],"subject":[28],"corpora":[29,198],"(covering":[30],"social":[32,168],"sciences":[33,169],"medicine).":[35],"study":[37],"examines":[38],"appropriateness":[40],"three":[42,60],"text":[43],"similarity":[44,61,97,106,127,134,141,175,194],"measures":[45,62,107,135,195],"impact":[48],"numerous":[50],"aspects":[51],"corpus":[53,155,162],"documents":[54],"on":[55,67,88],"system":[56,71],"performance.":[57,116],"Design/methodology/approach":[58],"Implemented":[59],"one":[63],"at":[64],"time":[66],"with":[72,147,196],"separate":[74],"corpora.":[76],"Two":[77],"distinct":[78,197],"samples":[79],"test":[81],"abstracts":[82],"were":[83],"classified":[84],"evaluated":[86],"based":[87],"normalized":[90],"discounted":[91],"cumulative":[92],"gain.":[93],"Findings":[94],"BM25":[96,131],"measure":[98,112],"outperforms":[99],"both":[100],"cosine":[102,133,140,174],"unigram":[104,110],"language":[105,111],"overall.":[108],"shows":[113],"lowest":[115],"performance":[118,144,172],"results":[119],"are":[120,136],"significantly":[121],"different":[122],"each":[124],"pair":[125],"measures,":[128],"while":[129],"moderately":[137],"correlated.":[138],"achieves":[142],"better":[143,171],"for":[145,173,199],"subjects":[146],"higher":[148],"density":[149],"technical":[151],"vocabulary":[152],"shorter":[154],"documents.":[156],"Moreover,":[157],"increasing":[158],"number":[160,191],"journals":[163],"domain":[166],"achieved":[170],"BM25.":[177],"Originality/value":[178],"This":[179],"first":[182],"work":[183],"related":[184],"comparing":[186],"suitability":[188],"string-based":[193],"systems.":[202]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":5},{"year":2020,"cited_by_count":1}],"updated_date":"2026-03-04T09:10:02.777135","created_date":"2025-10-10T00:00:00"}
