{"id":"https://openalex.org/W2766809237","doi":"https://doi.org/10.1109/ccoms.2017.8075264","title":"A procedure to build multiword expression data set","display_name":"A procedure to build multiword expression data set","publication_year":2017,"publication_date":"2017-07-01","ids":{"openalex":"https://openalex.org/W2766809237","doi":"https://doi.org/10.1109/ccoms.2017.8075264","mag":"2766809237"},"language":"en","primary_location":{"id":"doi:10.1109/ccoms.2017.8075264","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ccoms.2017.8075264","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 2nd International Conference on Computer and Communication Systems (ICCCS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5032502490","display_name":"Senem Kumova Met\u0131n","orcid":"https://orcid.org/0000-0002-9606-3625"},"institutions":[{"id":"https://openalex.org/I15059493","display_name":"\u0130zmir University of Economics","ror":"https://ror.org/04hjr4202","country_code":"TR","type":"education","lineage":["https://openalex.org/I15059493"]}],"countries":["TR"],"is_corresponding":true,"raw_author_name":"Senem Kumova Metin","raw_affiliation_strings":["Department of Software Engineering, Izmir University of Economics, Izmir, Turkey","Department of Software Engineering Faculty of Engineering, Izmir University of Economics, \u0130zmir, Turkey"],"affiliations":[{"raw_affiliation_string":"Department of Software Engineering, Izmir University of Economics, Izmir, Turkey","institution_ids":["https://openalex.org/I15059493"]},{"raw_affiliation_string":"Department of Software Engineering Faculty of Engineering, Izmir University of Economics, \u0130zmir, Turkey","institution_ids":["https://openalex.org/I15059493"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5038657021","display_name":"Mehmet Taze","orcid":"https://orcid.org/0000-0001-6835-302X"},"institutions":[{"id":"https://openalex.org/I15059493","display_name":"\u0130zmir University of Economics","ror":"https://ror.org/04hjr4202","country_code":"TR","type":"education","lineage":["https://openalex.org/I15059493"]}],"countries":["TR"],"is_corresponding":false,"raw_author_name":"Mehmet Taze","raw_affiliation_strings":["Department of Software Engineering, Izmir University of Economics, Izmir, Turkey","Department of Computer Engineering Faculty of Engineering, Izmir University of Economics, \u0130zmir, Turkey"],"affiliations":[{"raw_affiliation_string":"Department of Software Engineering, Izmir University of Economics, Izmir, Turkey","institution_ids":["https://openalex.org/I15059493"]},{"raw_affiliation_string":"Department of Computer Engineering Faculty of Engineering, Izmir University of Economics, \u0130zmir, Turkey","institution_ids":["https://openalex.org/I15059493"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5032502490"],"corresponding_institution_ids":["https://openalex.org/I15059493"],"apc_list":null,"apc_paid":null,"fwci":0.195,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.63197493,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"1","issue":null,"first_page":"46","last_page":"49"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11587","display_name":"Second Language Acquisition and Learning","score":0.9779000282287598,"subfield":{"id":"https://openalex.org/subfields/3204","display_name":"Developmental and Educational Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9681000113487244,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8297733068466187},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.7606549859046936},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.6879727840423584},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6050978302955627},{"id":"https://openalex.org/keywords/term","display_name":"Term (time)","score":0.5532761812210083},{"id":"https://openalex.org/keywords/expression","display_name":"Expression (computer science)","score":0.5456167459487915},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5296273827552795},{"id":"https://openalex.org/keywords/data-set","display_name":"Data set","score":0.5209744572639465},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.41360437870025635},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.09544366598129272},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.06461858749389648}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8297733068466187},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.7606549859046936},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.6879727840423584},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6050978302955627},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.5532761812210083},{"id":"https://openalex.org/C90559484","wikidata":"https://www.wikidata.org/wiki/Q778379","display_name":"Expression (computer science)","level":2,"score":0.5456167459487915},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5296273827552795},{"id":"https://openalex.org/C58489278","wikidata":"https://www.wikidata.org/wiki/Q1172284","display_name":"Data set","level":2,"score":0.5209744572639465},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.41360437870025635},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.09544366598129272},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.06461858749389648},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ccoms.2017.8075264","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ccoms.2017.8075264","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 2nd International Conference on Computer and Communication Systems (ICCCS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.8100000023841858,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":17,"referenced_works":["https://openalex.org/W1498763386","https://openalex.org/W1509179932","https://openalex.org/W1971624066","https://openalex.org/W1975879668","https://openalex.org/W1994129711","https://openalex.org/W1994560811","https://openalex.org/W2003131523","https://openalex.org/W2042380438","https://openalex.org/W2103464847","https://openalex.org/W2147777361","https://openalex.org/W2250486177","https://openalex.org/W2759478409","https://openalex.org/W3102214172","https://openalex.org/W4235118305","https://openalex.org/W6630342943","https://openalex.org/W6744764900","https://openalex.org/W7056080538"],"related_works":["https://openalex.org/W2980611886","https://openalex.org/W42295635","https://openalex.org/W1973996291","https://openalex.org/W2330575325","https://openalex.org/W2163803519","https://openalex.org/W2497592525","https://openalex.org/W3096145648","https://openalex.org/W3197510923","https://openalex.org/W2370579019","https://openalex.org/W2392243736"],"abstract_inverted_index":{"In":[0,173],"this":[1,174],"paper,":[2],"we":[3,96],"propose":[4],"a":[5,14,54,164],"procedure":[6,44],"employing":[7],"natural":[8],"language":[9],"processing":[10],"methods":[11,105],"to":[12,62,108,129,162],"build":[13,163],"golden":[15,165],"standard":[16,166],"multiword":[17],"expression":[18],"data":[19,26,58,83,168],"set":[20,27,84,169],"and":[21,31,75],"present":[22],"our":[23],"Turkish":[24],"MWE":[25,57,64,82,90,110,131,167,182],"of":[28,56,70,89,100,124,140],"3946":[29],"positive":[30],"4230":[32],"negative":[33],"candidates":[34,91,111,135,151,177],"that":[35,112,136],"is":[36,52,85,170],"built":[37],"following":[38],"the":[39,68,93,98,118,134,138,150,171,176],"proposed":[40,43],"procedure.":[41],"The":[42,49,159],"covers":[45],"three":[46],"main":[47],"tasks.":[48],"first":[50],"task":[51,79,161],"collecting":[53],"variety":[55],"resources":[59],"in":[60,80],"order":[61],"extract":[63,109],"candidates.":[65,132],"We":[66],"suggest":[67,97],"use":[69],"corpora":[71],"together":[72],"with":[73,152],"idiom":[74],"term":[76],"dictionaries.":[77],"Second":[78],"building":[81],"extracting":[86],"different":[87],"types":[88],"from":[92],"resources.":[94],"Here,":[95],"aggregation":[99],"four":[101],"methods.":[102],"Firstly,":[103],"statistical":[104],"are":[106,127,143,147,157,178],"applied":[107],"have":[113],"high":[114],"occurrence":[115],"frequencies.":[116],"Secondly,":[117],"linguistic":[119],"properties":[120,139],"such":[121],"as":[122,181],"part":[123],"speech":[125],"patterns":[126],"considered":[128],"select":[130],"Thirdly,":[133],"mimic":[137],"idioms":[141,146],"or":[142,183],"already":[144],"true":[145],"chosen.":[148],"Lastly,":[149],"domain":[153],"specific":[154],"properties,":[155],"term-similar,":[156],"extracted.":[158],"final":[160],"labeling.":[172],"task,":[175],"labeled":[179],"either":[180],"non-MWE":[184],"by":[185],"multiple":[186],"judges.":[187]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2018,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
