{"id":"https://openalex.org/W4362591143","doi":"https://doi.org/10.1142/s0219649223500168","title":"GepH: Entity Predictor for Hindi News","display_name":"GepH: Entity Predictor for Hindi News","publication_year":2023,"publication_date":"2023-03-31","ids":{"openalex":"https://openalex.org/W4362591143","doi":"https://doi.org/10.1142/s0219649223500168"},"language":"en","primary_location":{"id":"doi:10.1142/s0219649223500168","is_oa":false,"landing_page_url":"https://doi.org/10.1142/s0219649223500168","pdf_url":null,"source":{"id":"https://openalex.org/S30163770","display_name":"Journal of Information & Knowledge Management","issn_l":"0219-6492","issn":["0219-6492","1793-6926"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319815","host_organization_name":"World Scientific","host_organization_lineage":["https://openalex.org/P4310319815"],"host_organization_lineage_names":["World Scientific"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Information &amp; Knowledge Management","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5055303991","display_name":"Prafulla Bafna","orcid":"https://orcid.org/0000-0001-9990-5990"},"institutions":[{"id":"https://openalex.org/I244572783","display_name":"Symbiosis International University","ror":"https://ror.org/005r2ww51","country_code":"IN","type":"education","lineage":["https://openalex.org/I244572783"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Prafulla B. Bafna","raw_affiliation_strings":["Symbiosis Institute of Computer Studies and Research, Symbiosis International (Deemed) University, Pune, India"],"affiliations":[{"raw_affiliation_string":"Symbiosis Institute of Computer Studies and Research, Symbiosis International (Deemed) University, Pune, India","institution_ids":["https://openalex.org/I244572783"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5055303991"],"corresponding_institution_ids":["https://openalex.org/I244572783"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.02906747,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"22","issue":"04","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/hindi","display_name":"Hindi","score":0.8864938616752625},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7391119599342346},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6996738314628601},{"id":"https://openalex.org/keywords/naive-bayes-classifier","display_name":"Naive Bayes classifier","score":0.6491794586181641},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.525118887424469},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.5195336937904358},{"id":"https://openalex.org/keywords/hierarchical-clustering","display_name":"Hierarchical clustering","score":0.5179058909416199},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.46601608395576477},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.44181081652641296},{"id":"https://openalex.org/keywords/random-forest","display_name":"Random forest","score":0.42484351992607117}],"concepts":[{"id":"https://openalex.org/C519982507","wikidata":"https://www.wikidata.org/wiki/Q1568","display_name":"Hindi","level":2,"score":0.8864938616752625},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7391119599342346},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6996738314628601},{"id":"https://openalex.org/C52001869","wikidata":"https://www.wikidata.org/wiki/Q812530","display_name":"Naive Bayes classifier","level":3,"score":0.6491794586181641},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.525118887424469},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.5195336937904358},{"id":"https://openalex.org/C92835128","wikidata":"https://www.wikidata.org/wiki/Q1277447","display_name":"Hierarchical clustering","level":3,"score":0.5179058909416199},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.46601608395576477},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.44181081652641296},{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.42484351992607117}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1142/s0219649223500168","is_oa":false,"landing_page_url":"https://doi.org/10.1142/s0219649223500168","pdf_url":null,"source":{"id":"https://openalex.org/S30163770","display_name":"Journal of Information & Knowledge Management","issn_l":"0219-6492","issn":["0219-6492","1793-6926"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319815","host_organization_name":"World Scientific","host_organization_lineage":["https://openalex.org/P4310319815"],"host_organization_lineage_names":["World Scientific"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Information &amp; Knowledge Management","raw_type":"journal-article"},{"id":"pmh:oai:RePEc:wsi:jikmxx:v:22:y:2023:i:04:n:s0219649223500168","is_oa":false,"landing_page_url":"http://www.worldscientific.com/doi/abs/10.1142/S0219649223500168","pdf_url":null,"source":{"id":"https://openalex.org/S4306401271","display_name":"RePEc: Research Papers in Economics","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I77793887","host_organization_name":"Federal Reserve Bank of St. Louis","host_organization_lineage":["https://openalex.org/I77793887"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":17,"referenced_works":["https://openalex.org/W1975568433","https://openalex.org/W2317540622","https://openalex.org/W2413241054","https://openalex.org/W2558405088","https://openalex.org/W2886890203","https://openalex.org/W2972332940","https://openalex.org/W3004824196","https://openalex.org/W3005832002","https://openalex.org/W3007892413","https://openalex.org/W3010336755","https://openalex.org/W3023262615","https://openalex.org/W3023882301","https://openalex.org/W3041481294","https://openalex.org/W3210781772","https://openalex.org/W4236122429","https://openalex.org/W4247545505","https://openalex.org/W4255325693"],"related_works":["https://openalex.org/W4367336074","https://openalex.org/W4379620016","https://openalex.org/W3154045278","https://openalex.org/W3210764983","https://openalex.org/W4367335949","https://openalex.org/W3089416646","https://openalex.org/W4380048833","https://openalex.org/W4285162676","https://openalex.org/W4382052559","https://openalex.org/W3036529732"],"abstract_inverted_index":{"In":[0],"this":[1],"era,":[2],"news":[3,25,36,81],"is":[4,47,56,62,151],"not":[5,71],"only":[6],"generated":[7],"continuously":[8],"with":[9],"high":[10],"speed":[11],"but":[12],"also":[13],"growing":[14],"in":[15],"its":[16,39,68],"amount":[17],"by":[18,76],"different":[19],"web":[20],"sources":[21],"like":[22],"talent":[23],"hunt,":[24],"agencies,":[26],"and":[27,52,89,106,157,164,185],"so":[28,74],"on.":[29],"To":[30],"predict":[31],"the":[32,92,131,173,177],"exact":[33],"class":[34],"of":[35,125,134],"depending":[37],"on":[38],"topic,":[40],"GepH":[41,179],"(Grouped":[42],"entity":[43,50,86,108],"predictor":[44],"for":[45,58,96,103,111,136,190],"Hindi)":[46],"proposed":[48,174],"using":[49,91,127,161,172],"extraction":[51,55],"grouping.":[53],"Entity":[54],"popular":[57],"English":[59],"corpus.":[60],"Hindi":[61,97,104,112,192],"a":[63,154],"national":[64],"language":[65],"due":[66],"to":[67,84,120,149],"resource":[69],"scarceness":[70],"being":[72],"explored":[73],"much":[75],"researchers.":[77],"More":[78],"than":[79],"1,270":[80],"are":[82,118,159],"processed":[83],"apply":[85],"extraction,":[87],"clustering,":[88],"classification":[90],"vector":[93,100],"space":[94,101],"model":[95,102],"(VSMH),":[98],"Synset":[99],"(SVSMH),":[105],"grouped":[107],"document":[109],"matrix":[110],"(GEDMH).":[113],"Synset-based":[114],"dimension":[115],"reduction":[116],"techniques":[117],"used":[119,152],"get":[121],"improved":[122],"accuracy.":[123],"Evaluation":[124],"HAC":[126,145],"three":[128],"matrices":[129],"shows":[130,180],"best":[132],"performance":[133],"GEDMH":[135,150,175],"varied":[137],"datasets.":[138],"Thus":[139],"labelled":[140],"corpus":[141],"obtained":[142],"after":[143],"applying":[144],"(Hierarchical":[146],"agglomerative":[147],"clustering)":[148],"as":[153,187],"training":[155],"dataset":[156],"predictions":[158],"done":[160],"random":[162],"forest":[163],"Na\u00efve":[165,168],"Bayes.":[166],"The":[167],"Bayes":[169],"classifier":[170],"implemented":[171],"performs":[176],"best.":[178],"0.8":[181],"purity,":[182],"0.4":[183],"entropy,":[184],"0.3":[186],"error":[188],"rate":[189],"1,273":[191],"news.":[193]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
