{"id":"https://openalex.org/W2285225925","doi":"https://doi.org/10.1109/dsdis.2015.30","title":"Discovering Aspectual Classes of Russian Verbs in Untagged Large Corpora","display_name":"Discovering Aspectual Classes of Russian Verbs in Untagged Large Corpora","publication_year":2015,"publication_date":"2015-12-01","ids":{"openalex":"https://openalex.org/W2285225925","doi":"https://doi.org/10.1109/dsdis.2015.30","mag":"2285225925"},"language":"en","primary_location":{"id":"doi:10.1109/dsdis.2015.30","is_oa":false,"landing_page_url":"https://doi.org/10.1109/dsdis.2015.30","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2015 IEEE International Conference on Data Science and Data Intensive Systems","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5058277099","display_name":"Aleksandr Drozd","orcid":"https://orcid.org/0000-0002-4575-7213"},"institutions":[{"id":"https://openalex.org/I114531698","display_name":"Tokyo Institute of Technology","ror":"https://ror.org/0112mx960","country_code":"JP","type":"education","lineage":["https://openalex.org/I114531698"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Aleksandr Drozd","raw_affiliation_strings":["Tokyo Institute of Technology, Global Scientific Information and Computing Center, Meguro-ku, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"Tokyo Institute of Technology, Global Scientific Information and Computing Center, Meguro-ku, Tokyo, Japan","institution_ids":["https://openalex.org/I114531698"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112209348","display_name":"Anna Gladkova","orcid":null},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]},{"id":"https://openalex.org/I14396692","display_name":"Tokyo University of Information Sciences","ror":"https://ror.org/044bdx604","country_code":"JP","type":"education","lineage":["https://openalex.org/I14396692"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Anna Gladkova","raw_affiliation_strings":["Department of Language and Information Sciences, The University of Tokyo, Meguro-ku, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"Department of Language and Information Sciences, The University of Tokyo, Meguro-ku, Tokyo, Japan","institution_ids":["https://openalex.org/I14396692","https://openalex.org/I74801974"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5103252086","display_name":"Satoshi Matsuoka","orcid":"https://orcid.org/0000-0003-2126-2926"},"institutions":[{"id":"https://openalex.org/I114531698","display_name":"Tokyo Institute of Technology","ror":"https://ror.org/0112mx960","country_code":"JP","type":"education","lineage":["https://openalex.org/I114531698"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Satoshi Matsuoka","raw_affiliation_strings":["Tokyo Institute of Technology, Global Scientific Information and Computing Center, Meguro-ku, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"Tokyo Institute of Technology, Global Scientific Information and Computing Center, Meguro-ku, Tokyo, Japan","institution_ids":["https://openalex.org/I114531698"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5058277099"],"corresponding_institution_ids":["https://openalex.org/I114531698"],"apc_list":null,"apc_paid":null,"fwci":1.2943,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.86586481,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"61","last_page":"68"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9901000261306763,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8184690475463867},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.7009633779525757},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6643131971359253},{"id":"https://openalex.org/keywords/cryptographic-nonce","display_name":"Cryptographic nonce","score":0.5910576581954956},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.5025973320007324},{"id":"https://openalex.org/keywords/vocabulary","display_name":"Vocabulary","score":0.4390407204627991},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.20827767252922058}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8184690475463867},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.7009633779525757},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6643131971359253},{"id":"https://openalex.org/C9996903","wikidata":"https://www.wikidata.org/wiki/Q1749235","display_name":"Cryptographic nonce","level":3,"score":0.5910576581954956},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.5025973320007324},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.4390407204627991},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.20827767252922058},{"id":"https://openalex.org/C148730421","wikidata":"https://www.wikidata.org/wiki/Q141090","display_name":"Encryption","level":2,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/dsdis.2015.30","is_oa":false,"landing_page_url":"https://doi.org/10.1109/dsdis.2015.30","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2015 IEEE International Conference on Data Science and Data Intensive Systems","raw_type":"proceedings-article"},{"id":"pmh:oai:pure.atira.dk:publications/f4dfe0ba-fcc6-41d1-a292-389e18faddef","is_oa":false,"landing_page_url":"http://www.ieeexplore.ieee.org/document/7396482/","pdf_url":null,"source":{"id":"https://openalex.org/S4377196680","display_name":"IT University Of Copenhagen (IT University of Copenhagen)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I83467386","host_organization_name":"IT University of Copenhagen","host_organization_lineage":["https://openalex.org/I83467386"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Drozd, A, Gladkova, A & Matsuoka, S 2015, Discovering Aspectual Classes of Russian Verbs in Untagged Large Corpora. in Proceedings of 2015 IEEE International Conference on Data Science and Data Intensive Systems (DSDIS). pp. 61-68. https://doi.org/10.1109/DSDIS.2015.30","raw_type":"info:eu-repo/semantics/publishedVersion"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.8700000047683716,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":42,"referenced_works":["https://openalex.org/W3753517","https://openalex.org/W73629738","https://openalex.org/W1499253590","https://openalex.org/W1524834623","https://openalex.org/W1579035156","https://openalex.org/W1593045043","https://openalex.org/W1967838552","https://openalex.org/W1981617416","https://openalex.org/W1981745143","https://openalex.org/W1983578042","https://openalex.org/W1985258161","https://openalex.org/W1992009922","https://openalex.org/W2040985480","https://openalex.org/W2052474702","https://openalex.org/W2086486316","https://openalex.org/W2119610041","https://openalex.org/W2124966964","https://openalex.org/W2125031621","https://openalex.org/W2136159041","https://openalex.org/W2141289451","https://openalex.org/W2153579005","https://openalex.org/W2159637323","https://openalex.org/W2170036644","https://openalex.org/W2250189634","https://openalex.org/W2250539671","https://openalex.org/W2326587081","https://openalex.org/W2752885492","https://openalex.org/W2882319491","https://openalex.org/W2979401726","https://openalex.org/W3197748241","https://openalex.org/W3198160809","https://openalex.org/W4238530616","https://openalex.org/W4294170691","https://openalex.org/W4372046852","https://openalex.org/W6600177566","https://openalex.org/W6631615774","https://openalex.org/W6634589335","https://openalex.org/W6635456232","https://openalex.org/W6678885109","https://openalex.org/W6682691769","https://openalex.org/W6801561724","https://openalex.org/W7029321148"],"related_works":["https://openalex.org/W4392666870","https://openalex.org/W4386794377","https://openalex.org/W2954455763","https://openalex.org/W2967369616","https://openalex.org/W3047523978","https://openalex.org/W2353810166","https://openalex.org/W1877660496","https://openalex.org/W2371127504","https://openalex.org/W3112251563","https://openalex.org/W3204019825"],"abstract_inverted_index":{"This":[0],"paper":[1],"presents":[2],"a":[3,50,62,92],"case":[4],"study":[5],"of":[6,24,30,36,45,75,97],"discovering":[7],"and":[8,26,81,87,100,118],"classifying":[9],"verbs":[10,90,117],"in":[11,16,40,78,91],"large":[12],"web-corpora.":[13],"Many":[14],"tasks":[15],"natural":[17],"language":[18],"processing":[19,82],"require":[20],"corpora":[21],"containing":[22],"billions":[23],"words,":[25],"with":[27],"such":[28],"volumes":[29],"data":[31],"co-occurrence":[32,51],"extraction":[33,52],"becomes":[34],"one":[35],"the":[37,41],"performance":[38],"bottlenecks":[39],"Vector":[42],"Space":[43],"Models":[44],"computational":[46],"linguistics.":[47],"We":[48],"propose":[49],"kernel":[53,71],"based":[54,68],"on":[55],"ternary":[56],"trees":[57],"as":[58],"an":[59,73],"alternative":[60],"(or":[61],"complimentary":[63],"stage)":[64],"to":[65],"conventional":[66],"map-reduce":[67],"approach,":[69],"this":[70],"achieves":[72],"order":[74],"magnitude":[76],"improvement":[77],"memory":[79],"footprint":[80],"speed.":[83],"Our":[84],"classifier":[85],"successfully":[86],"efficiently":[88],"identified":[89],"1.2-billion":[93],"words":[94],"untagged":[95],"corpus":[96],"Russian":[98],"fiction":[99],"distinguished":[101],"between":[102],"their":[103],"two":[104],"aspectual":[105],"classes.":[106],"The":[107],"model":[108],"proved":[109],"efficient":[110],"even":[111],"for":[112],"low-frequency":[113],"vocabulary,":[114],"including":[115],"nonce":[116],"neologisms.":[119]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":2},{"year":2018,"cited_by_count":2},{"year":2015,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
