{"id":"https://openalex.org/W1546862095","doi":"https://doi.org/10.1109/dictap.2015.7113185","title":"Semantic vector space model for reducing Arabic text dimensionality","display_name":"Semantic vector space model for reducing Arabic text dimensionality","publication_year":2015,"publication_date":"2015-04-01","ids":{"openalex":"https://openalex.org/W1546862095","doi":"https://doi.org/10.1109/dictap.2015.7113185","mag":"1546862095"},"language":"en","primary_location":{"id":"doi:10.1109/dictap.2015.7113185","is_oa":true,"landing_page_url":"https://doi.org/10.1109/dictap.2015.7113185","pdf_url":"https://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7113185","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2015 Fifth International Conference on Digital Information and Communication Technology and its Applications (DICTAP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7113185","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5062695565","display_name":"Arafat Awajan","orcid":"https://orcid.org/0000-0002-7067-5658"},"institutions":[{"id":"https://openalex.org/I158749337","display_name":"Princess Sumaya University for Technology","ror":"https://ror.org/01jy46q10","country_code":"JO","type":"education","lineage":["https://openalex.org/I158749337"]}],"countries":["JO"],"is_corresponding":true,"raw_author_name":"Arafat Awajan","raw_affiliation_strings":["Computer Science Department, Princess Sumaya University for Technology, Amman, JORDAN","Computer Science Department, Princess Sumaya University for Technology, Amman - Jordan"],"affiliations":[{"raw_affiliation_string":"Computer Science Department, Princess Sumaya University for Technology, Amman, JORDAN","institution_ids":["https://openalex.org/I158749337"]},{"raw_affiliation_string":"Computer Science Department, Princess Sumaya University for Technology, Amman - Jordan","institution_ids":["https://openalex.org/I158749337"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5062695565"],"corresponding_institution_ids":["https://openalex.org/I158749337"],"apc_list":null,"apc_paid":null,"fwci":1.2943,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.8503356,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":"25","issue":null,"first_page":"129","last_page":"135"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/wordnet","display_name":"WordNet","score":0.8945456743240356},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7228915095329285},{"id":"https://openalex.org/keywords/vector-space-model","display_name":"Vector space model","score":0.7118042707443237},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6943601369857788},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.683438241481781},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.5958765745162964},{"id":"https://openalex.org/keywords/semantic-similarity","display_name":"Semantic similarity","score":0.567037045955658},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5616313815116882},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.4882681369781494},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.46837979555130005},{"id":"https://openalex.org/keywords/dimension","display_name":"Dimension (graph theory)","score":0.45261791348457336},{"id":"https://openalex.org/keywords/arabic","display_name":"Arabic","score":0.44449248909950256},{"id":"https://openalex.org/keywords/vector-space","display_name":"Vector space","score":0.43648457527160645},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.42968830466270447},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.22951382398605347},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.18807992339134216}],"concepts":[{"id":"https://openalex.org/C157659113","wikidata":"https://www.wikidata.org/wiki/Q533822","display_name":"WordNet","level":2,"score":0.8945456743240356},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7228915095329285},{"id":"https://openalex.org/C89686163","wikidata":"https://www.wikidata.org/wiki/Q1187982","display_name":"Vector space model","level":2,"score":0.7118042707443237},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6943601369857788},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.683438241481781},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.5958765745162964},{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.567037045955658},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5616313815116882},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.4882681369781494},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.46837979555130005},{"id":"https://openalex.org/C33676613","wikidata":"https://www.wikidata.org/wiki/Q13415176","display_name":"Dimension (graph theory)","level":2,"score":0.45261791348457336},{"id":"https://openalex.org/C96455323","wikidata":"https://www.wikidata.org/wiki/Q13955","display_name":"Arabic","level":2,"score":0.44449248909950256},{"id":"https://openalex.org/C13336665","wikidata":"https://www.wikidata.org/wiki/Q125977","display_name":"Vector space","level":2,"score":0.43648457527160645},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.42968830466270447},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.22951382398605347},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.18807992339134216},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/dictap.2015.7113185","is_oa":true,"landing_page_url":"https://doi.org/10.1109/dictap.2015.7113185","pdf_url":"https://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7113185","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2015 Fifth International Conference on Digital Information and Communication Technology and its Applications (DICTAP)","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1109/dictap.2015.7113185","is_oa":true,"landing_page_url":"https://doi.org/10.1109/dictap.2015.7113185","pdf_url":"https://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=7113185","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2015 Fifth International Conference on Digital Information and Communication Technology and its Applications (DICTAP)","raw_type":"proceedings-article"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.7200000286102295}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W1546862095.pdf","grobid_xml":"https://content.openalex.org/works/W1546862095.grobid-xml"},"referenced_works_count":25,"referenced_works":["https://openalex.org/W1485311222","https://openalex.org/W1662133657","https://openalex.org/W1987302197","https://openalex.org/W2009466421","https://openalex.org/W2059503205","https://openalex.org/W2109791464","https://openalex.org/W2114523070","https://openalex.org/W2139161410","https://openalex.org/W2147272182","https://openalex.org/W2149709850","https://openalex.org/W2165612380","https://openalex.org/W2526234476","https://openalex.org/W2757950651","https://openalex.org/W2882319491","https://openalex.org/W2963486821","https://openalex.org/W4251146235","https://openalex.org/W4252520227","https://openalex.org/W4256133489","https://openalex.org/W4285719527","https://openalex.org/W4293874803","https://openalex.org/W6676276270","https://openalex.org/W6680707895","https://openalex.org/W6682004857","https://openalex.org/W6727699327","https://openalex.org/W7045898636"],"related_works":["https://openalex.org/W2043952800","https://openalex.org/W2047143235","https://openalex.org/W2957377172","https://openalex.org/W2165693052","https://openalex.org/W2164877079","https://openalex.org/W2113471940","https://openalex.org/W2569513598","https://openalex.org/W2907883452","https://openalex.org/W101928771","https://openalex.org/W2251695880"],"abstract_inverted_index":{"In":[0],"this":[1],"paper,":[2],"we":[3],"introduce":[4],"an":[5],"efficient":[6],"method":[7,22,116],"to":[8,41,50,67,99],"represent":[9],"Arabic":[10,29],"texts":[11],"in":[12,39,97],"comparatively":[13],"smaller":[14],"sizes":[15],"without":[16],"losing":[17],"significant":[18],"information.":[19],"The":[20,108],"proposed":[21,115],"uses":[23],"the":[24,28,43,46,75,90,95,114,119,129,140],"linguistic":[25],"features":[26],"of":[27,45,70,121,143],"language,":[30],"mainly":[31],"its":[32,37,52],"very":[33],"productive":[34],"morphology":[35],"and":[36,49,78,134],"richness":[38],"synonyms,":[40],"reduce":[42],"dimension":[44],"document":[47,96],"vector":[48,53,131],"improve":[51],"space":[54,132],"model":[55,133],"representation.":[56],"We":[57],"have":[58,111],"incorporated":[59],"semantic":[60],"information":[61],"from":[62,74],"word":[63],"thesauri":[64],"like":[65],"WordNet":[66],"create":[68],"clusters":[69],"similar":[71,101],"words":[72,102,144],"extracted":[73],"same":[76],"root":[77],"regrouped":[79],"along":[80],"with":[81,94,128,139],"their":[82],"synonyms.":[83],"Distributional":[84],"similarity":[85],"measures":[86],"are":[87],"applied":[88],"on":[89,104],"word-context":[91],"matrix":[92],"associated":[93],"order":[98],"identify":[100],"based":[103],"a":[105],"text's":[106],"context.":[107],"experimental":[109],"results":[110],"confirmed":[112],"that":[113],"significantly":[117],"reduces":[118],"size":[120],"text":[122],"representation":[123],"by":[124,135],"about":[125,136],"20%":[126],"compared":[127,138],"stem-based":[130],"40%":[137],"traditional":[141],"bag":[142],"model.":[145]},"counts_by_year":[{"year":2017,"cited_by_count":2},{"year":2015,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
