{"id":"https://openalex.org/W4406633411","doi":"https://doi.org/10.3390/computers14010030","title":"Set-Word Embeddings and Semantic Indices: A New Contextual Model for Empirical Language Analysis","display_name":"Set-Word Embeddings and Semantic Indices: A New Contextual Model for Empirical Language Analysis","publication_year":2025,"publication_date":"2025-01-20","ids":{"openalex":"https://openalex.org/W4406633411","doi":"https://doi.org/10.3390/computers14010030"},"language":"en","primary_location":{"id":"doi:10.3390/computers14010030","is_oa":true,"landing_page_url":"https://doi.org/10.3390/computers14010030","pdf_url":"https://www.mdpi.com/2073-431X/14/1/30/pdf?version=1737452825","source":{"id":"https://openalex.org/S4210228075","display_name":"Computers","issn_l":"2073-431X","issn":["2073-431X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computers","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/2073-431X/14/1/30/pdf?version=1737452825","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5062053931","display_name":"Pedro Fern\u00e1ndez de C\u00f3rdoba","orcid":"https://orcid.org/0000-0002-0347-7280"},"institutions":[{"id":"https://openalex.org/I60053951","display_name":"Universitat Polit\u00e8cnica de Val\u00e8ncia","ror":"https://ror.org/01460j859","country_code":"ES","type":"education","lineage":["https://openalex.org/I60053951"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Pedro Fern\u00e1ndez de C\u00f3rdoba","raw_affiliation_strings":["Instituto Universitario de Matem\u00e1tica Pura y Aplicada, Universitat Polit\u00e8cnica de Val\u00e8ncia, 46022 Val\u00e8ncia, Spain"],"raw_orcid":"https://orcid.org/0000-0002-0347-7280","affiliations":[{"raw_affiliation_string":"Instituto Universitario de Matem\u00e1tica Pura y Aplicada, Universitat Polit\u00e8cnica de Val\u00e8ncia, 46022 Val\u00e8ncia, Spain","institution_ids":["https://openalex.org/I60053951"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5104073080","display_name":"Carlos A. Perez","orcid":"https://orcid.org/0009-0002-6829-1150"},"institutions":[{"id":"https://openalex.org/I60053951","display_name":"Universitat Polit\u00e8cnica de Val\u00e8ncia","ror":"https://ror.org/01460j859","country_code":"ES","type":"education","lineage":["https://openalex.org/I60053951"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Carlos A. Reyes P\u00e9rez","raw_affiliation_strings":["Instituto Universitario de Matem\u00e1tica Pura y Aplicada, Universitat Polit\u00e8cnica de Val\u00e8ncia, 46022 Val\u00e8ncia, Spain"],"raw_orcid":"https://orcid.org/0009-0002-6829-1150","affiliations":[{"raw_affiliation_string":"Instituto Universitario de Matem\u00e1tica Pura y Aplicada, Universitat Polit\u00e8cnica de Val\u00e8ncia, 46022 Val\u00e8ncia, Spain","institution_ids":["https://openalex.org/I60053951"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115955657","display_name":"Claudia S\u00e1nchez Arnau","orcid":null},"institutions":[{"id":"https://openalex.org/I16097986","display_name":"Universitat de Val\u00e8ncia","ror":"https://ror.org/043nxc105","country_code":"ES","type":"education","lineage":["https://openalex.org/I16097986"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Claudia S\u00e1nchez Arnau","raw_affiliation_strings":["E.T.S. Ingenier\u00eda, Universitat de Val\u00e8ncia, 46100 Val\u00e9ncia, Spain"],"raw_orcid":"https://orcid.org/0009-0004-1245-9289","affiliations":[{"raw_affiliation_string":"E.T.S. Ingenier\u00eda, Universitat de Val\u00e8ncia, 46100 Val\u00e9ncia, Spain","institution_ids":["https://openalex.org/I16097986"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5059955897","display_name":"Enrique A. S\u00e1nchez\u2010P\u00e9rez","orcid":"https://orcid.org/0000-0001-8854-3154"},"institutions":[{"id":"https://openalex.org/I60053951","display_name":"Universitat Polit\u00e8cnica de Val\u00e8ncia","ror":"https://ror.org/01460j859","country_code":"ES","type":"education","lineage":["https://openalex.org/I60053951"]}],"countries":["ES"],"is_corresponding":true,"raw_author_name":"Enrique A. S\u00e1nchez P\u00e9rez","raw_affiliation_strings":["Instituto Universitario de Matem\u00e1tica Pura y Aplicada, Universitat Polit\u00e8cnica de Val\u00e8ncia, 46022 Val\u00e8ncia, Spain"],"raw_orcid":"https://orcid.org/0000-0001-8854-3154","affiliations":[{"raw_affiliation_string":"Instituto Universitario de Matem\u00e1tica Pura y Aplicada, Universitat Polit\u00e8cnica de Val\u00e8ncia, 46022 Val\u00e8ncia, Spain","institution_ids":["https://openalex.org/I60053951"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5059955897"],"corresponding_institution_ids":["https://openalex.org/I60053951"],"apc_list":{"value":1600,"currency":"CHF","value_usd":1732},"apc_paid":{"value":1600,"currency":"CHF","value_usd":1732},"fwci":1.0502,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.73790296,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"14","issue":"1","first_page":"30","last_page":"30"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12592","display_name":"Opinion Dynamics and Social Influence","score":0.6183000206947327,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12592","display_name":"Opinion Dynamics and Social Influence","score":0.6183000206947327,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6966333389282227},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6828278303146362},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.5785611867904663},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5253947377204895},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5030614733695984},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.4775018095970154},{"id":"https://openalex.org/keywords/semantic-analysis","display_name":"Semantic analysis (machine learning)","score":0.41210705041885376},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.11992543935775757}],"concepts":[{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6966333389282227},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6828278303146362},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.5785611867904663},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5253947377204895},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5030614733695984},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.4775018095970154},{"id":"https://openalex.org/C2777946921","wikidata":"https://www.wikidata.org/wiki/Q7449044","display_name":"Semantic analysis (machine learning)","level":2,"score":0.41210705041885376},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.11992543935775757},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.3390/computers14010030","is_oa":true,"landing_page_url":"https://doi.org/10.3390/computers14010030","pdf_url":"https://www.mdpi.com/2073-431X/14/1/30/pdf?version=1737452825","source":{"id":"https://openalex.org/S4210228075","display_name":"Computers","issn_l":"2073-431X","issn":["2073-431X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computers","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:70ac52e1455144bab2a35368df9f3fef","is_oa":true,"landing_page_url":"https://doaj.org/article/70ac52e1455144bab2a35368df9f3fef","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Computers, Vol 14, Iss 1, p 30 (2025)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.3390/computers14010030","is_oa":true,"landing_page_url":"https://doi.org/10.3390/computers14010030","pdf_url":"https://www.mdpi.com/2073-431X/14/1/30/pdf?version=1737452825","source":{"id":"https://openalex.org/S4210228075","display_name":"Computers","issn_l":"2073-431X","issn":["2073-431X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computers","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4295176169","display_name":null,"funder_award_id":"PROMETEO CIPROM/2023/32","funder_id":"https://openalex.org/F4320321864","funder_display_name":"Generalitat Valenciana"},{"id":"https://openalex.org/G6219168559","display_name":null,"funder_award_id":"CIPROM/2023/32","funder_id":"https://openalex.org/F4320321864","funder_display_name":"Generalitat Valenciana"}],"funders":[{"id":"https://openalex.org/F4320321864","display_name":"Generalitat Valenciana","ror":"https://ror.org/0097mvx21"},{"id":"https://openalex.org/F4320334905","display_name":"Universitat Polit\u00e8cnica de Val\u00e8ncia","ror":"https://ror.org/01460j859"}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4406633411.pdf"},"referenced_works_count":35,"referenced_works":["https://openalex.org/W821951396","https://openalex.org/W1533842436","https://openalex.org/W1597195725","https://openalex.org/W1608322251","https://openalex.org/W1991358523","https://openalex.org/W2017462139","https://openalex.org/W2031457979","https://openalex.org/W2058582101","https://openalex.org/W2141599568","https://openalex.org/W2153579005","https://openalex.org/W2250539671","https://openalex.org/W2500063528","https://openalex.org/W2585439946","https://openalex.org/W2768113420","https://openalex.org/W2794783369","https://openalex.org/W2891503716","https://openalex.org/W2892410331","https://openalex.org/W2896457183","https://openalex.org/W3008374555","https://openalex.org/W3130450512","https://openalex.org/W3133839445","https://openalex.org/W4223947928","https://openalex.org/W4229451295","https://openalex.org/W4253680019","https://openalex.org/W4293581639","https://openalex.org/W4300958603","https://openalex.org/W4319163914","https://openalex.org/W4385570071","https://openalex.org/W4385572845","https://openalex.org/W4391099575","https://openalex.org/W4396722682","https://openalex.org/W4401043136","https://openalex.org/W4401943272","https://openalex.org/W4402715022","https://openalex.org/W4403678472"],"related_works":["https://openalex.org/W1569283511","https://openalex.org/W4236193183","https://openalex.org/W2053866214","https://openalex.org/W2607505004","https://openalex.org/W2296205523","https://openalex.org/W4235488275","https://openalex.org/W2903379275","https://openalex.org/W4366961134","https://openalex.org/W2579156435","https://openalex.org/W4392201942"],"abstract_inverted_index":{"We":[0,93,228],"present":[1],"a":[2,8,20,42,54,61,108,173,235],"new":[3,55],"word":[4,90,163],"embedding":[5,91,164,175],"technique":[6],"in":[7,19,78,120,130,224,260],"(non-linear)":[9],"metric":[10,27,50,132,143],"space":[11,51,146,168],"based":[12,165],"on":[13,46,166,254],"the":[14,26,32,39,49,68,85,89,101,105,113,121,131,135,138,142,145,153,187,193,196,199,206,210,216,243,247,252,264,272,282,285,291,295],"shared":[15],"membership":[16],"of":[17,22,35,38,74,115,144,155,184,198,209,218,246,284],"terms":[18,119,257,262,289],"corpus":[21,40],"textual":[23],"documents,":[24],"where":[25],"is":[28,52,268,278],"naturally":[29],"defined":[30,45,81],"by":[31,72],"Boolean":[33],"algebra":[34],"all":[36,96],"subsets":[37],"and":[41,70,88,99,141],"measure":[43,86],"\u03bc":[44,87],"it.":[47],"Once":[48],"constructed,":[53],"term":[56],"(a":[57],"noun,":[58],"an":[59,181],"adjective,":[60],"classification":[62],"term)":[63],"can":[64,169],"be":[65,170,275],"introduced":[66],"into":[67,212],"model":[69,122,211,249],"analyzed":[71],"means":[73],"semantic":[75,139,188,261,265],"projections,":[76],"which":[77],"turn":[79],"are":[80,124,250,258],"as":[82,126,172,221,223],"indexes":[83],"using":[84,201,239],"tools.":[92],"formally":[94],"define":[95],"necessary":[97],"elements":[98],"prove":[100],"main":[102,150,244],"results":[103,200,253],"about":[104],"model,":[106],"including":[107,234],"compatibility":[109],"theorem":[110],"for":[111,186,195,215],"estimating":[112],"representability":[114],"semantically":[116],"meaningful":[117],"external":[118],"(which":[123],"written":[125,171],"real":[127],"Lipschitz":[128],"functions":[129],"space),":[133],"proving":[134,159],"relation":[136],"between":[137,256,287],"index":[140,266],"(Theorem":[147,176],"1).":[148],"Our":[149],"result":[151],"proves":[152],"universality":[154],"our":[156],"word-set":[157,174],"embedding,":[158],"mathematically":[160],"that":[161,251],"every":[162],"linear":[167],"2).":[177],"Since":[178],"we":[179,190],"adopt":[180],"empirical":[182],"point":[183],"view":[185],"issues,":[189],"also":[191,229],"provide":[192],"keys":[194],"interpretation":[197],"probabilistic":[202],"arguments":[203],"(to":[204],"facilitate":[205],"subsequent":[207],"integration":[208],"Bayesian":[213],"frameworks":[214],"construction":[217],"inductive":[219],"tools),":[220],"well":[222],"fuzzy":[225],"set-theoretic":[226],"terms.":[227],"show":[230],"some":[231],"illustrative":[232],"examples,":[233],"complete":[236],"computational":[237],"case":[238],"big-data-based":[240],"computations.":[241],"Thus,":[242],"advantages":[245],"proposed":[248],"distances":[255],"interpretable":[259],"once":[263],"used":[267],"fixed":[269],"and,":[270],"although":[271],"calculations":[273],"could":[274],"costly,":[276],"it":[277],"possible":[279],"to":[280,293],"calculate":[281,294],"value":[283],"distance":[286,297],"two":[288],"without":[290],"need":[292],"whole":[296],"matrix.":[298],"\u201cWovon":[299],"man":[300,306],"nicht":[301],"sprechen":[302],"kann,":[303],"dar\u00fcber":[304],"muss":[305],"schweigen\u201d.":[307],"Tractatus":[308],"Logico-Philosophicus.":[309],"L.":[310],"Wittgenstein.":[311]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2025-10-10T00:00:00"}
