{"id":"https://openalex.org/W2124926790","doi":"https://doi.org/10.3115/v1/d14-1143","title":"Formalizing Word Sampling for Vocabulary Prediction as Graph-based Active Learning","display_name":"Formalizing Word Sampling for Vocabulary Prediction as Graph-based Active Learning","publication_year":2014,"publication_date":"2014-01-01","ids":{"openalex":"https://openalex.org/W2124926790","doi":"https://doi.org/10.3115/v1/d14-1143","mag":"2124926790"},"language":"en","primary_location":{"id":"doi:10.3115/v1/d14-1143","is_oa":true,"landing_page_url":"https://doi.org/10.3115/v1/d14-1143","pdf_url":"https://aclanthology.org/D14-1143.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2014 Conference on Empirical Methods in Natural Language Processing (EMNLP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://aclanthology.org/D14-1143.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5007171156","display_name":"Yo Ehara","orcid":"https://orcid.org/0000-0001-9314-4617"},"institutions":[{"id":"https://openalex.org/I90023481","display_name":"National Institute of Information and Communications Technology","ror":"https://ror.org/016bgq349","country_code":"JP","type":"facility","lineage":["https://openalex.org/I90023481"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Yo Ehara","raw_affiliation_strings":["National Institute of Information and Communications Technology"],"affiliations":[{"raw_affiliation_string":"National Institute of Information and Communications Technology","institution_ids":["https://openalex.org/I90023481"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004444958","display_name":"Yusuke Miyao","orcid":"https://orcid.org/0000-0002-0678-3400"},"institutions":[{"id":"https://openalex.org/I184597095","display_name":"National Institute of Informatics","ror":"https://ror.org/04ksd4g47","country_code":"JP","type":"facility","lineage":["https://openalex.org/I1319490839","https://openalex.org/I184597095","https://openalex.org/I4210158934"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Yusuke Miyao","raw_affiliation_strings":["National Institute of Informatics,"],"affiliations":[{"raw_affiliation_string":"National Institute of Informatics,","institution_ids":["https://openalex.org/I184597095"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042638926","display_name":"Hidekazu Oiwa","orcid":null},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Hidekazu Oiwa","raw_affiliation_strings":["university of Tokyo;"],"affiliations":[{"raw_affiliation_string":"university of Tokyo;","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060421432","display_name":"Issei Sato","orcid":"https://orcid.org/0000-0002-5066-1435"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Issei Sato","raw_affiliation_strings":["university of Tokyo;"],"affiliations":[{"raw_affiliation_string":"university of Tokyo;","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5020912760","display_name":"Hiroshi Nakagawa","orcid":"https://orcid.org/0000-0002-3024-9136"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Hiroshi Nakagawa","raw_affiliation_strings":["university of Tokyo;"],"affiliations":[{"raw_affiliation_string":"university of Tokyo;","institution_ids":["https://openalex.org/I74801974"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5007171156"],"corresponding_institution_ids":["https://openalex.org/I90023481"],"apc_list":null,"apc_paid":null,"fwci":0.8457,"has_fulltext":true,"cited_by_count":24,"citation_normalized_percentile":{"value":0.82179971,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1374","last_page":"1384"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8544257879257202},{"id":"https://openalex.org/keywords/vocabulary","display_name":"Vocabulary","score":0.8461387157440186},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.6296320557594299},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6055949926376343},{"id":"https://openalex.org/keywords/heuristic","display_name":"Heuristic","score":0.5985067486763},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.5939138531684875},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5904799103736877},{"id":"https://openalex.org/keywords/sampling","display_name":"Sampling (signal processing)","score":0.557429850101471},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.4367435574531555},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3457632064819336},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.2137279212474823},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.06556618213653564}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8544257879257202},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.8461387157440186},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.6296320557594299},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6055949926376343},{"id":"https://openalex.org/C173801870","wikidata":"https://www.wikidata.org/wiki/Q201413","display_name":"Heuristic","level":2,"score":0.5985067486763},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.5939138531684875},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5904799103736877},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.557429850101471},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.4367435574531555},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3457632064819336},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2137279212474823},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.06556618213653564},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.0},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.3115/v1/d14-1143","is_oa":true,"landing_page_url":"https://doi.org/10.3115/v1/d14-1143","pdf_url":"https://aclanthology.org/D14-1143.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2014 Conference on Empirical Methods in Natural Language Processing (EMNLP)","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.671.5794","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.671.5794","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://emnlp2014.org/papers/pdf/EMNLP2014143.pdf","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.697.5754","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.697.5754","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://aclweb.org/anthology/D/D14/D14-1143.pdf","raw_type":"text"}],"best_oa_location":{"id":"doi:10.3115/v1/d14-1143","is_oa":true,"landing_page_url":"https://doi.org/10.3115/v1/d14-1143","pdf_url":"https://aclanthology.org/D14-1143.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2014 Conference on Empirical Methods in Natural Language Processing (EMNLP)","raw_type":"proceedings-article"},"sustainable_development_goals":[{"score":0.8600000143051147,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[{"id":"https://openalex.org/G1069223013","display_name":null,"funder_award_id":"JSPS KAKENHI","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G195965828","display_name":"\u5fc3\u5185\u8f9e\u66f8\u3068\u8a9e\u5f59\u30cd\u30c3\u30c8\u30ef\u30fc\u30af\u306e\u6570\u7406\u30e2\u30c7\u30eb\u5316\u306b\u3088\u308b\u7b2c\u4e8c\u8a00\u8a9e\u904b\u7528\u652f\u63f4\u30b7\u30b9\u30c6\u30e0\u306e\u7814\u7a76","funder_award_id":"12J09575","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G3236194794","display_name":null,"funder_award_id":"Grant-in-Aid","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G3459562248","display_name":null,"funder_award_id":"Grant","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G4227499671","display_name":null,"funder_award_id":"KAKENHI Grant","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G4636223006","display_name":null,"funder_award_id":"JSPS KAK","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G4874944895","display_name":null,"funder_award_id":"-in-Aid","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G5396239172","display_name":null,"funder_award_id":"Grant-in-Aid for JSPS Fellows","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G5786340949","display_name":null,"funder_award_id":"KAKENHI Grant Number","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G8430481527","display_name":null,"funder_award_id":"Number","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"}],"funders":[{"id":"https://openalex.org/F4320334764","display_name":"Japan Society for the Promotion of Science","ror":"https://ror.org/00hhkn466"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2124926790.pdf","grobid_xml":"https://content.openalex.org/works/W2124926790.grobid-xml"},"referenced_works_count":13,"referenced_works":["https://openalex.org/W1980018014","https://openalex.org/W1985672254","https://openalex.org/W2017803598","https://openalex.org/W2047328202","https://openalex.org/W2099993990","https://openalex.org/W2127816222","https://openalex.org/W2135069250","https://openalex.org/W2154455818","https://openalex.org/W2164318591","https://openalex.org/W2250340570","https://openalex.org/W2793582435","https://openalex.org/W3158183629","https://openalex.org/W4239280779"],"related_works":["https://openalex.org/W2349784553","https://openalex.org/W3022596247","https://openalex.org/W2601444686","https://openalex.org/W4307058054","https://openalex.org/W4292238148","https://openalex.org/W4323660495","https://openalex.org/W2385319785","https://openalex.org/W2900827440","https://openalex.org/W1997182898","https://openalex.org/W2944691285"],"abstract_inverted_index":{"Predicting":[0],"vocabulary":[1,45],"of":[2,15,19,40,50],"second":[3],"language":[4,11,20],"learners":[5],"is":[6],"essential":[7],"to":[8,35,93],"support":[9,106],"their":[10],"learning;":[12],"however,":[13],"because":[14],"the":[16,27,43,48,51,102],"large":[17],"size":[18],"vocabularies,":[21],"we":[22,33,56,104],"cannot":[23],"collect":[24],"information":[25],"on":[26,68],"entire":[28,44],"vocabulary.":[29],"For":[30],"practical":[31],"measurements,":[32],"need":[34],"sample":[36],"a":[37,58,85,94],"small":[38],"portion":[39],"words":[41],"from":[42,116],"and":[46,114],"predict":[47],"rest":[49],"words.":[52],"In":[53],"this":[54,62],"study,":[55],"propose":[57],"novel":[59],"framework":[60],"for":[61],"sampling":[63,115],"method.":[64],"Current":[65],"methods":[66],"rely":[67],"simple":[69],"heuristic":[70,82],"techniques":[71,83],"involving":[72],"inflexible":[73],"manual":[74],"tuning":[75],"by":[76,100],"educational":[77],"experts.":[78],"We":[79,97],"formalize":[80],"these":[81],"as":[84,91,110],"graph-based":[86],"non-interactive":[87],"active":[88],"learning":[89],"method":[90],"applied":[92],"special":[95],"graph.":[96],"show":[98],"that":[99],"extending":[101],"graph,":[103],"can":[105],"additional":[107],"functionality":[108],"such":[109],"incorporating":[111],"domain":[112],"specificity":[113],"multiple":[117],"corpora.":[118]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":4},{"year":2019,"cited_by_count":6},{"year":2018,"cited_by_count":4},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":1}],"updated_date":"2026-04-15T08:11:43.952461","created_date":"2025-10-10T00:00:00"}
