{"id":"https://openalex.org/W7154147553","doi":"https://doi.org/10.1109/access.2026.3683598","title":"A Comprehensive Analysis of Text Similarity Metrics and Vectorization Techniques for Content-Based Product Recommendation","display_name":"A Comprehensive Analysis of Text Similarity Metrics and Vectorization Techniques for Content-Based Product Recommendation","publication_year":2026,"publication_date":"2026-01-01","ids":{"openalex":"https://openalex.org/W7154147553","doi":"https://doi.org/10.1109/access.2026.3683598"},"language":"en","primary_location":{"id":"doi:10.1109/access.2026.3683598","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2026.3683598","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1109/access.2026.3683598","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5121145332","display_name":"Simona-Vasilica Oprea","orcid":null},"institutions":[{"id":"https://openalex.org/I88491126","display_name":"Bucharest University of Economic Studies","ror":"https://ror.org/04yvncj21","country_code":"RO","type":"education","lineage":["https://openalex.org/I88491126"]}],"countries":["RO"],"is_corresponding":false,"raw_author_name":"Simona Vasilica Oprea","raw_affiliation_strings":["Economic Informatics and Cybernetics Department, Bucharest University of Economic Studies, Bucharest, Romania"],"raw_orcid":"https://orcid.org/0000-0002-9005-5181","affiliations":[{"raw_affiliation_string":"Economic Informatics and Cybernetics Department, Bucharest University of Economic Studies, Bucharest, Romania","institution_ids":["https://openalex.org/I88491126"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083962910","display_name":"Adela B\u00c2RA","orcid":null},"institutions":[{"id":"https://openalex.org/I88491126","display_name":"Bucharest University of Economic Studies","ror":"https://ror.org/04yvncj21","country_code":"RO","type":"education","lineage":["https://openalex.org/I88491126"]}],"countries":["RO"],"is_corresponding":false,"raw_author_name":"Adela B\u00e2ra","raw_affiliation_strings":["Economic Informatics and Cybernetics Department, Bucharest University of Economic Studies, Bucharest, Romania"],"raw_orcid":"https://orcid.org/0000-0002-0961-352X","affiliations":[{"raw_affiliation_string":"Economic Informatics and Cybernetics Department, Bucharest University of Economic Studies, Bucharest, Romania","institution_ids":["https://openalex.org/I88491126"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5067396962","display_name":"Marian Pompiliu Cristescu","orcid":"https://orcid.org/0000-0003-3638-4379"},"institutions":[{"id":"https://openalex.org/I124121301","display_name":"Lucian Blaga University of Sibiu","ror":"https://ror.org/026gdz537","country_code":"RO","type":"education","lineage":["https://openalex.org/I124121301"]}],"countries":["RO"],"is_corresponding":false,"raw_author_name":"Marian Pompiliu Cristescu","raw_affiliation_strings":["Faculty of Economic Sciences, Lucian Blaga University of Sibiu, Sibiu, Romania"],"raw_orcid":"https://orcid.org/0000-0003-3638-4379","affiliations":[{"raw_affiliation_string":"Faculty of Economic Sciences, Lucian Blaga University of Sibiu, Sibiu, Romania","institution_ids":["https://openalex.org/I124121301"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.54411598,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"14","issue":null,"first_page":"58670","last_page":"58689"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.2556999921798706,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.2556999921798706,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.13420000672340393,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.08299999684095383,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.6115000247955322},{"id":"https://openalex.org/keywords/vectorization","display_name":"Vectorization (mathematics)","score":0.5985999703407288},{"id":"https://openalex.org/keywords/product","display_name":"Product (mathematics)","score":0.5882999897003174},{"id":"https://openalex.org/keywords/similitude","display_name":"Similitude","score":0.3255999982357025},{"id":"https://openalex.org/keywords/data-modeling","display_name":"Data modeling","score":0.28200000524520874}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8406000137329102},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.6115000247955322},{"id":"https://openalex.org/C41681595","wikidata":"https://www.wikidata.org/wiki/Q7917855","display_name":"Vectorization (mathematics)","level":2,"score":0.5985999703407288},{"id":"https://openalex.org/C90673727","wikidata":"https://www.wikidata.org/wiki/Q901718","display_name":"Product (mathematics)","level":2,"score":0.5882999897003174},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.48190000653266907},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4235000014305115},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.39660000801086426},{"id":"https://openalex.org/C143271835","wikidata":"https://www.wikidata.org/wiki/Q254515","display_name":"Similitude","level":2,"score":0.3255999982357025},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.28200000524520874},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.27720001339912415},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.26440000534057617}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2026.3683598","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2026.3683598","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:2afc4fef29644779a21234b328987789","is_oa":true,"landing_page_url":"https://doaj.org/article/2afc4fef29644779a21234b328987789","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 14, Pp 58670-58689 (2026)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2026.3683598","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2026.3683598","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"This":[0,225],"paper":[1],"proposes":[2],"a":[3,48,228],"benchmark":[4,67,229],"analysis":[5,167],"of":[6,26,50,73],"various":[7],"similarity":[8,39,98,106,149],"metrics":[9,154],"and":[10,44,59,70,87,109,136,173,194],"text":[11,28],"vectorization":[12,29],"methods":[13],"applied":[14],"to":[15,156],"content-based":[16,74],"product":[17,53,75],"recommendation":[18,178],"systems":[19],"in":[20,124,140,190],"e-commerce.":[21],"It":[22],"presents":[23],"an":[24],"evaluation":[25,199],"four":[27],"techniques:":[30],"Count":[31],"Vectorizer,":[32],"TF-IDF,":[33],"Word2Vec,":[34],"GloVe,":[35,144],"combined":[36],"with":[37,96,118,129,152],"three":[38,79],"metrics:":[40],"cosine":[41,97,148],"similarity,":[42],"Manhattan":[43,162],"Euclidean":[45,119],"distances.":[46],"Using":[47],"dataset":[49,63],"10,002":[51],"Amazon":[52],"descriptions":[54],"spanning":[55],"over":[56],"20":[57],"categories":[58,84],"other":[60,101],"additional":[61],"product-related":[62],"for":[64,114,175],"validation,":[65],"we":[66,220],"the":[68,104,141,198,209],"accuracy":[69,113],"contextual":[71],"relevance":[72,171],"recommendations.":[76,143,215],"We":[77],"selected":[78,205],"representative":[80],"products":[81,207],"from":[82,208],"distinct":[83],"(puzzles,":[85],"longboards":[86],"costumes)":[88],"as":[89,132,134],"test":[90,180],"cases.":[91],"Results":[92],"show":[93],"that":[94,183],"Word2Vec":[95,188],"consistently":[99],"outperforms":[100],"methods,":[102],"achieving":[103],"highest":[105],"score":[107],"(0.906)":[108],"producing":[110,213],"top-1":[111],"match":[112],"franchise-specific":[115],"items.":[116],"TF-IDF":[117],"distance":[120,153],"demonstrated":[121],"strong":[122],"performance":[123],"structured,":[125],"lexically":[126],"consistent":[127],"categories,":[128],"average":[130,161],"distances":[131,163],"low":[133],"1.11":[135],"90%":[137],"category":[138],"alignment":[139],"top-5":[142],"while":[145],"competitive":[146],"under":[147],"(~0.813),":[150],"underperformed":[151],"due":[155],"higher":[157],"vector":[158],"magnitudes,":[159],"recording":[160],"above":[164],"150.":[165],"Our":[166],"also":[168],"includes":[169],"qualitative":[170],"annotations":[172],"justifications":[174],"each":[176,212,217],"top-10":[177,214],"per":[179],"case,":[181],"confirming":[182],"dense":[184],"embedding":[185],"models":[186],"like":[187],"excel":[189],"capturing":[191],"semantic":[192],"nuance":[193],"brand-level":[195],"similarity.":[196],"Further,":[197],"is":[200],"conducted":[201],"on":[202],"500":[203],"randomly":[204],"seed":[206],"two":[210],"datasets,":[211],"For":[216],"vectorizer-similarity":[218,232],"combination,":[219],"computed:":[221],"Precision@10,":[222],"Recall@10,":[223],"NDCG@10.":[224],"research":[226],"contributes":[227],"across":[230],"12":[231],"metric":[233],"combinations.":[234]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-14T00:00:00"}
