{"id":"https://openalex.org/W4360585195","doi":"https://doi.org/10.1109/ic3i56241.2022.10072927","title":"A Comparative Analysis of word embedding techniques and text similarity Measures","display_name":"A Comparative Analysis of word embedding techniques and text similarity Measures","publication_year":2022,"publication_date":"2022-12-14","ids":{"openalex":"https://openalex.org/W4360585195","doi":"https://doi.org/10.1109/ic3i56241.2022.10072927"},"language":"en","primary_location":{"id":"doi:10.1109/ic3i56241.2022.10072927","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/ic3i56241.2022.10072927","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 5th International Conference on Contemporary Computing and Informatics (IC3I)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5016944963","display_name":"Nagothi Vaibhav Anjani Kumar","orcid":null},"institutions":[{"id":"https://openalex.org/I875944469","display_name":"Koneru Lakshmaiah Education Foundation","ror":"https://ror.org/02k949197","country_code":"IN","type":"education","lineage":["https://openalex.org/I875944469"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Nagothi Vaibhav Anjani Kumar","raw_affiliation_strings":["Koneru Lakshmaiah Education Foundation,Department of Computer Science and Engineering,Vaddeswaram,AP,India","Department of Computer Science and Engineering, Koneru Lakshmaiah Education Foundation, Vaddeswaram, AP, India"],"affiliations":[{"raw_affiliation_string":"Koneru Lakshmaiah Education Foundation,Department of Computer Science and Engineering,Vaddeswaram,AP,India","institution_ids":["https://openalex.org/I875944469"]},{"raw_affiliation_string":"Department of Computer Science and Engineering, Koneru Lakshmaiah Education Foundation, Vaddeswaram, AP, India","institution_ids":["https://openalex.org/I875944469"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5034408629","display_name":"Shashi Mehrotra","orcid":"https://orcid.org/0000-0003-3907-5790"},"institutions":[{"id":"https://openalex.org/I134705546","display_name":"Teerthanker Mahaveer University","ror":"https://ror.org/04vkd2013","country_code":"IN","type":"education","lineage":["https://openalex.org/I134705546"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Shashi Mehrotra","raw_affiliation_strings":["Teerthanker Mahaveer University,Dept of Computer Science and Engineering,Moradabad,India","Dept of Computer Science and Engineering, Teerthanker Mahaveer University, Moradabad, India"],"affiliations":[{"raw_affiliation_string":"Teerthanker Mahaveer University,Dept of Computer Science and Engineering,Moradabad,India","institution_ids":["https://openalex.org/I134705546"]},{"raw_affiliation_string":"Dept of Computer Science and Engineering, Teerthanker Mahaveer University, Moradabad, India","institution_ids":["https://openalex.org/I134705546"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5016944963"],"corresponding_institution_ids":["https://openalex.org/I875944469"],"apc_list":null,"apc_paid":null,"fwci":0.3979,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.68447705,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":97},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/word2vec","display_name":"Word2vec","score":0.8282963037490845},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7779915928840637},{"id":"https://openalex.org/keywords/word-embedding","display_name":"Word embedding","score":0.6857004165649414},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.6242720484733582},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.5998207926750183},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5887694954872131},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5883468985557556},{"id":"https://openalex.org/keywords/closeness","display_name":"Closeness","score":0.5661070942878723},{"id":"https://openalex.org/keywords/semantic-similarity","display_name":"Semantic similarity","score":0.5619027614593506},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5391393899917603},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.4232941269874573},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.10730701684951782},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.10636362433433533}],"concepts":[{"id":"https://openalex.org/C2776461190","wikidata":"https://www.wikidata.org/wiki/Q22673982","display_name":"Word2vec","level":3,"score":0.8282963037490845},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7779915928840637},{"id":"https://openalex.org/C2777462759","wikidata":"https://www.wikidata.org/wiki/Q18395344","display_name":"Word embedding","level":3,"score":0.6857004165649414},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.6242720484733582},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.5998207926750183},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5887694954872131},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5883468985557556},{"id":"https://openalex.org/C2779545769","wikidata":"https://www.wikidata.org/wiki/Q5135364","display_name":"Closeness","level":2,"score":0.5661070942878723},{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.5619027614593506},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5391393899917603},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.4232941269874573},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.10730701684951782},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.10636362433433533},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ic3i56241.2022.10072927","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/ic3i56241.2022.10072927","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 5th International Conference on Contemporary Computing and Informatics (IC3I)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.7799999713897705}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W2786842250","https://openalex.org/W2894747149","https://openalex.org/W2896016608","https://openalex.org/W2897148785","https://openalex.org/W2904891763","https://openalex.org/W2944400536","https://openalex.org/W3019027838","https://openalex.org/W3020931369","https://openalex.org/W3024922541","https://openalex.org/W3083306642","https://openalex.org/W3104059174","https://openalex.org/W3128209463","https://openalex.org/W3129548754","https://openalex.org/W3138979178","https://openalex.org/W3156699288","https://openalex.org/W3163920200","https://openalex.org/W4237467126","https://openalex.org/W6758745265"],"related_works":["https://openalex.org/W2946409105","https://openalex.org/W3152932816","https://openalex.org/W2985392712","https://openalex.org/W4388996947","https://openalex.org/W2798009317","https://openalex.org/W4382201653","https://openalex.org/W3203949288","https://openalex.org/W3107848922","https://openalex.org/W3133567596","https://openalex.org/W4312127319"],"abstract_inverted_index":{"Digital":[0],"text":[1,50,60],"data":[2,23,87],"is":[3,34,75],"increasing":[4],"daily":[5],"in":[6,62],"various":[7],"uses,":[8],"such":[9,93],"as":[10,94],"clinical":[11],"notes,":[12],"lab":[13],"test":[14],"reports,":[15],"research":[16],"articles,":[17],"etc.":[18],"Most":[19],"of":[20,31,45,59,72,80,84],"the":[21,37,85],"mentioned":[22],"are":[24,61],"unstructured.":[25],"While":[26],"searching":[27],"for":[28],"information":[29,33],"lot":[30],"unrelated":[32],"returned":[35],"against":[36],"query.":[38],"The":[39,69],"paper":[40,74],"presents":[41],"a":[42],"comparative":[43],"analysis":[44],"word":[46,90],"embedding":[47,91],"techniques":[48,92],"and":[49,67,97],"similarity":[51],"measures":[52],"to":[53,76],"determine":[54],"how":[55],"similar":[56],"two":[57],"bits":[58],"respective":[63],"lexical,":[64],"semantic":[65],"characteristics,":[66],"closeness.":[68],"principal":[70],"aim":[71],"this":[73],"perform":[77],"pre-processing":[78],"process":[79],"medical":[81],"history":[82],"notes":[83],"patient's":[86],"followed":[88],"by":[89],"Word2Vec,":[95],"FastText,":[96],"Doc2Vec.":[98]},"counts_by_year":[{"year":2024,"cited_by_count":3}],"updated_date":"2025-12-24T23:09:58.560324","created_date":"2025-10-10T00:00:00"}
