{"id":"https://openalex.org/W2789577389","doi":"https://doi.org/10.1145/3018896.3056785","title":"Combined WSD algorithms with LSA to identify semantic similarity in unstructured textual data","display_name":"Combined WSD algorithms with LSA to identify semantic similarity in unstructured textual data","publication_year":2017,"publication_date":"2017-03-22","ids":{"openalex":"https://openalex.org/W2789577389","doi":"https://doi.org/10.1145/3018896.3056785","mag":"2789577389"},"language":"en","primary_location":{"id":"doi:10.1145/3018896.3056785","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3018896.3056785","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Second International Conference on Internet of things, Data and Cloud Computing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5029760187","display_name":"Mohammed Ahmed Taiye","orcid":"https://orcid.org/0000-0002-0025-118X"},"institutions":[{"id":"https://openalex.org/I94625822","display_name":"Northern University of Malaysia","ror":"https://ror.org/01ss10648","country_code":"MY","type":"education","lineage":["https://openalex.org/I94625822"]}],"countries":["MY"],"is_corresponding":true,"raw_author_name":"Mohammed Ahmed Taiye","raw_affiliation_strings":["Universiti Utara Malaysia"],"affiliations":[{"raw_affiliation_string":"Universiti Utara Malaysia","institution_ids":["https://openalex.org/I94625822"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088005888","display_name":"Siti Sakira Kamaruddin","orcid":"https://orcid.org/0000-0002-5937-7801"},"institutions":[{"id":"https://openalex.org/I94625822","display_name":"Northern University of Malaysia","ror":"https://ror.org/01ss10648","country_code":"MY","type":"education","lineage":["https://openalex.org/I94625822"]}],"countries":["MY"],"is_corresponding":false,"raw_author_name":"Siti Sakira Kamaruddin","raw_affiliation_strings":["Universiti Utara Malaysia"],"affiliations":[{"raw_affiliation_string":"Universiti Utara Malaysia","institution_ids":["https://openalex.org/I94625822"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5067483180","display_name":"Farzana Kabir Ahmad","orcid":"https://orcid.org/0000-0002-0374-6559"},"institutions":[{"id":"https://openalex.org/I94625822","display_name":"Northern University of Malaysia","ror":"https://ror.org/01ss10648","country_code":"MY","type":"education","lineage":["https://openalex.org/I94625822"]}],"countries":["MY"],"is_corresponding":false,"raw_author_name":"Farzana Kabir Ahmad","raw_affiliation_strings":["Universiti Utara Malaysia"],"affiliations":[{"raw_affiliation_string":"Universiti Utara Malaysia","institution_ids":["https://openalex.org/I94625822"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5029760187"],"corresponding_institution_ids":["https://openalex.org/I94625822"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.21006784,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9919999837875366,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8336688280105591},{"id":"https://openalex.org/keywords/semantic-similarity","display_name":"Semantic similarity","score":0.7780158519744873},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.7180836200714111},{"id":"https://openalex.org/keywords/polysemy","display_name":"Polysemy","score":0.6631448268890381},{"id":"https://openalex.org/keywords/latent-semantic-analysis","display_name":"Latent semantic analysis","score":0.6221194863319397},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.5909772515296936},{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.5831613540649414},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5721756219863892},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.5599786639213562},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.5377452969551086},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5101890563964844},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.4816371500492096},{"id":"https://openalex.org/keywords/explicit-semantic-analysis","display_name":"Explicit semantic analysis","score":0.4802972972393036},{"id":"https://openalex.org/keywords/semantic-computing","display_name":"Semantic computing","score":0.43640953302383423},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.4363025724887848},{"id":"https://openalex.org/keywords/wordnet","display_name":"WordNet","score":0.4255073070526123},{"id":"https://openalex.org/keywords/semantic-technology","display_name":"Semantic technology","score":0.18041402101516724},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.14870285987854004},{"id":"https://openalex.org/keywords/semantic-web","display_name":"Semantic Web","score":0.14652925729751587}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8336688280105591},{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.7780158519744873},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.7180836200714111},{"id":"https://openalex.org/C2780276568","wikidata":"https://www.wikidata.org/wiki/Q191928","display_name":"Polysemy","level":2,"score":0.6631448268890381},{"id":"https://openalex.org/C170133592","wikidata":"https://www.wikidata.org/wiki/Q1806883","display_name":"Latent semantic analysis","level":2,"score":0.6221194863319397},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.5909772515296936},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.5831613540649414},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5721756219863892},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.5599786639213562},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.5377452969551086},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5101890563964844},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.4816371500492096},{"id":"https://openalex.org/C173862523","wikidata":"https://www.wikidata.org/wiki/Q5421270","display_name":"Explicit semantic analysis","level":5,"score":0.4802972972393036},{"id":"https://openalex.org/C511149849","wikidata":"https://www.wikidata.org/wiki/Q7449051","display_name":"Semantic computing","level":3,"score":0.43640953302383423},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.4363025724887848},{"id":"https://openalex.org/C157659113","wikidata":"https://www.wikidata.org/wiki/Q533822","display_name":"WordNet","level":2,"score":0.4255073070526123},{"id":"https://openalex.org/C6881194","wikidata":"https://www.wikidata.org/wiki/Q7449091","display_name":"Semantic technology","level":4,"score":0.18041402101516724},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.14870285987854004},{"id":"https://openalex.org/C2129575","wikidata":"https://www.wikidata.org/wiki/Q54837","display_name":"Semantic Web","level":2,"score":0.14652925729751587},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C59822182","wikidata":"https://www.wikidata.org/wiki/Q441","display_name":"Botany","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3018896.3056785","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3018896.3056785","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Second International Conference on Internet of things, Data and Cloud Computing","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","score":0.699999988079071,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W1788602","https://openalex.org/W125550881","https://openalex.org/W218889330","https://openalex.org/W751890724","https://openalex.org/W1546714804","https://openalex.org/W1880262756","https://openalex.org/W2030129670","https://openalex.org/W2091879664","https://openalex.org/W2118293227","https://openalex.org/W2134632846","https://openalex.org/W2150159277","https://openalex.org/W2159917432","https://openalex.org/W2160732112","https://openalex.org/W2160923007","https://openalex.org/W2165403938","https://openalex.org/W2171313960","https://openalex.org/W2250409846","https://openalex.org/W2251322122","https://openalex.org/W2305815027","https://openalex.org/W2324052717","https://openalex.org/W2344464929","https://openalex.org/W2436001372","https://openalex.org/W2964274239","https://openalex.org/W6639619044","https://openalex.org/W6681948635"],"related_works":["https://openalex.org/W2113144812","https://openalex.org/W2103835134","https://openalex.org/W2113661533","https://openalex.org/W1976495436","https://openalex.org/W2890241594","https://openalex.org/W3016822073","https://openalex.org/W2047143235","https://openalex.org/W3152143533","https://openalex.org/W2786154338","https://openalex.org/W4246972993"],"abstract_inverted_index":{"Semantically":[0],"related":[1],"sentence":[2,18,133],"may":[3],"not":[4,63,94],"have":[5,81],"any":[6],"word":[7,60],"in":[8,44,73,116,120],"common.":[9],"However,":[10],"identifying":[11,71,117],"the":[12,52,67,97,106,110,142,154],"semantic":[13,78,118,134,155],"similarity":[14,79,135,156],"between":[15],"words":[16,43],"at":[17,127],"level":[19],"possess":[20],"difficult":[21],"challenges":[22,69],"such":[23],"as":[24],"polysemy,":[25],"synonyms,":[26],"heterogeneity":[27],"and":[28,101,109,159],"sparsity":[29],"of":[30,70,99,112,157],"unstructured":[31,74],"textual":[32],"datasets.":[33],"It":[34,49],"is":[35],"assumed":[36],"that":[37,51,137],"sentences":[38,158],"with":[39,148,163],"similar":[40],"text":[41,75],"or":[42],"common":[45],"are":[46,62],"semantically":[47],"related.":[48],"means":[50],"standard":[53],"Information":[54],"Retrieval":[55],"(IR)":[56],"measure":[57],"based":[58],"on":[59],"co-occurrence":[61],"appropriate":[64],"to":[65,84,104,152,160],"tackle":[66],"aforementioned":[68],"semantics":[72],"documents.":[76],"Many":[77],"measures":[80],"been":[82],"proposed":[83],"resolve":[85],"this":[86,123],"non-trivial":[87],"issues,":[88],"but":[89],"many":[90],"existing":[91],"studies":[92],"did":[93],"properly":[95],"utilize":[96],"combination":[98],"Corpus":[100],"Knowledge-based":[102],"approach":[103],"solve":[105],"syntactic":[107],"construct":[108],"roles":[111],"Part":[113],"Of":[114],"Speech":[115],"similarities":[119],"sentences.":[121],"In":[122],"research,":[124],"we":[125],"aim":[126],"proposing":[128],"a":[129],"method":[130],"for":[131],"measuring":[132],"identification":[136],"combines":[138],"two":[139],"algorithms":[140,147],"from":[141],"knowledge-based":[143],"Word":[144],"Sense":[145],"Disambiguation":[146],"Latent":[149],"Semantic":[150],"Analysis":[151],"identify":[153],"compare":[161],"results":[162],"human":[164],"evaluation.":[165]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
