{"id":"https://openalex.org/W7131123447","doi":"https://doi.org/10.48550/arxiv.2602.18326","title":"Predicting Contextual Informativeness for Vocabulary Learning using Deep Learning","display_name":"Predicting Contextual Informativeness for Vocabulary Learning using Deep Learning","publication_year":2026,"publication_date":"2026-02-20","ids":{"openalex":"https://openalex.org/W7131123447","doi":"https://doi.org/10.48550/arxiv.2602.18326"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.18326","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5126600336","display_name":"Tao Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Tao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5068936812","display_name":"Adam Kapelner","orcid":"https://orcid.org/0000-0001-5985-6792"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kapelner, Adam","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.26350000500679016,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.26350000500679016,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11902","display_name":"Intelligent Tutoring Systems and Adaptive Learning","score":0.1298999935388565,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.11089999973773956,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/vocabulary","display_name":"Vocabulary","score":0.7057999968528748},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5641000270843506},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5493000149726868},{"id":"https://openalex.org/keywords/variety","display_name":"Variety (cybernetics)","score":0.5008000135421753},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.4593000113964081},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.44830000400543213},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4408000111579895},{"id":"https://openalex.org/keywords/supervised-learning","display_name":"Supervised learning","score":0.34880000352859497}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7757999897003174},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7143999934196472},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.7057999968528748},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5641000270843506},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5493000149726868},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5116000175476074},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.5008000135421753},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4763000011444092},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.4593000113964081},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.44830000400543213},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4408000111579895},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.34880000352859497},{"id":"https://openalex.org/C183322885","wikidata":"https://www.wikidata.org/wiki/Q17007702","display_name":"Context model","level":3,"score":0.31679999828338623},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.3091000020503998},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.30799999833106995},{"id":"https://openalex.org/C62737587","wikidata":"https://www.wikidata.org/wiki/Q7939179","display_name":"Vocabulary development","level":3,"score":0.30309998989105225},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.29100000858306885},{"id":"https://openalex.org/C147168706","wikidata":"https://www.wikidata.org/wiki/Q1457734","display_name":"Recurrent neural network","level":3,"score":0.2761000096797943},{"id":"https://openalex.org/C2777462759","wikidata":"https://www.wikidata.org/wiki/Q18395344","display_name":"Word embedding","level":3,"score":0.26980000734329224},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.2578999996185303}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.18326","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.18326","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.18326","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.18326","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.8000668287277222}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"We":[0,62],"describe":[1],"a":[2,40,50,64,88,105,125,140,151],"modern":[3,126],"deep":[4],"learning":[5],"system":[6],"that":[7,124],"automatically":[8],"identifies":[9],"informative":[10],"contextual":[11],"examples":[12],"(\\qu{contexts})":[13],"for":[14,19,147,150],"first":[15],"language":[16],"vocabulary":[17,149],"instruction":[18],"high":[20],"school":[21],"student.":[22],"Our":[23],"paper":[24],"compares":[25],"three":[26],"modeling":[27],"approaches:":[28],"(i)":[29],"an":[30],"unsupervised":[31],"similarity-based":[32],"strategy":[33],"using":[34],"MPNet's":[35],"uniformly":[36],"contextualized":[37],"embeddings,":[38],"(ii)":[39,57],"supervised":[41],"framework":[42],"built":[43],"on":[44,92,129],"instruction-aware,":[45],"fine-tuned":[46],"Qwen3":[47],"embeddings":[48],"with":[49,102],"nonlinear":[51],"regression":[52],"head":[53],"and":[54,82],"(iii)":[55,96],"model":[56,93,128],"plus":[58],"handcrafted":[59],"context":[60],"features.":[61],"introduce":[63],"novel":[65],"metric":[66],"called":[67],"the":[68,76,83,98,117],"Retention":[69],"Competency":[70],"Curve":[71],"to":[72],"visualize":[73],"trade-offs":[74],"between":[75],"discarded":[77],"proportion":[78],"of":[79,104,108,116,144,153],"good":[80,118],"contexts":[81,85,146],"\\qu{good-to-bad}":[84],"ratio":[86,107],"providing":[87],"compact,":[89],"unified":[90],"lens":[91],"performance.":[94],"Model":[95],"delivers":[97],"most":[99],"dramatic":[100],"gains":[101],"performance":[103],"good-to-bad":[106],"440":[109],"all":[110],"while":[111],"only":[112],"throwing":[113],"out":[114],"70\\%":[115],"contexts.":[119],"In":[120],"summary,":[121],"we":[122],"demonstrate":[123],"embedding":[127],"neural":[130],"network":[131],"architecture,":[132],"when":[133],"guided":[134],"by":[135],"human":[136],"supervision,":[137],"results":[138],"in":[139],"low-cost":[141],"large":[142],"supply":[143],"near-perfect":[145],"teaching":[148],"variety":[152],"target":[154],"words.":[155]},"counts_by_year":[],"updated_date":"2026-07-01T08:55:40.977307","created_date":"2026-02-24T00:00:00"}
