{"id":"https://openalex.org/W4403579130","doi":"https://doi.org/10.48550/arxiv.2410.13086","title":"Reverse-Engineering the Reader","display_name":"Reverse-Engineering the Reader","publication_year":2024,"publication_date":"2024-10-16","ids":{"openalex":"https://openalex.org/W4403579130","doi":"https://doi.org/10.48550/arxiv.2410.13086"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2410.13086","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2410.13086","pdf_url":"https://arxiv.org/pdf/2410.13086","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2410.13086","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5114337809","display_name":"Samuel Kiegeland","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Kiegeland, Samuel","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011708753","display_name":"Ethan Wilcox","orcid":"https://orcid.org/0000-0002-5128-9890"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wilcox, Ethan Gotlieb","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039644501","display_name":"Afra Amini","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Amini, Afra","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114337810","display_name":"David Robert Reich","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Reich, David Robert","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5061951606","display_name":"Ryan Cotterell","orcid":"https://orcid.org/0000-0003-4080-1833"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cotterell, Ryan","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5114337809"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13071","display_name":"Digital Storytelling and Education","score":0.295199990272522,"subfield":{"id":"https://openalex.org/subfields/3616","display_name":"Speech and Hearing"},"field":{"id":"https://openalex.org/fields/36","display_name":"Health Professions"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T13071","display_name":"Digital Storytelling and Education","score":0.295199990272522,"subfield":{"id":"https://openalex.org/subfields/3616","display_name":"Speech and Hearing"},"field":{"id":"https://openalex.org/fields/36","display_name":"Health Professions"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reverse-engineering","display_name":"Reverse engineering","score":0.545966386795044},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4625987112522125},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.2020411193370819}],"concepts":[{"id":"https://openalex.org/C207850805","wikidata":"https://www.wikidata.org/wiki/Q269608","display_name":"Reverse engineering","level":2,"score":0.545966386795044},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4625987112522125},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.2020411193370819}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2410.13086","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2410.13086","pdf_url":"https://arxiv.org/pdf/2410.13086","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2410.13086","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2410.13086","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2410.13086","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2410.13086","pdf_url":"https://arxiv.org/pdf/2410.13086","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4403579130.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2363831530","https://openalex.org/W2363845219","https://openalex.org/W2381057835","https://openalex.org/W1789649838","https://openalex.org/W1780668307","https://openalex.org/W1984362519","https://openalex.org/W2051831113"],"abstract_inverted_index":{"Numerous":[0],"previous":[1],"studies":[2],"have":[3],"sought":[4],"to":[5,7,43,52,72,176,184],"determine":[6],"what":[8],"extent":[9],"language":[10,15,41,70,102,125],"models,":[11],"pretrained":[12],"on":[13,143,152],"natural":[14],"text,":[16],"can":[17,37],"serve":[18],"as":[19,106,147,149],"useful":[20,46],"models":[21],"of":[22,77,87],"human":[23,53],"cognition.":[24],"In":[25],"this":[26,157],"paper,":[27],"we":[28,36,59,67,110,131,172],"are":[29,173],"interested":[30],"in":[31,65],"the":[32,75,101,174],"opposite":[33],"question:":[34],"whether":[35],"directly":[38,82],"optimize":[39,74],"a":[40,45,61,69,78,107,140,181],"model":[42,48,71,116],"be":[44],"cognitive":[47],"by":[49,179],"aligning":[50],"it":[51,123,178],"psychometric":[54,127,137,185],"data.":[55,155,186],"To":[56],"achieve":[57],"this,":[58],"introduce":[60],"novel":[62],"alignment":[63,183],"technique":[64,113],"which":[66],"fine-tune":[68],"implicitly":[73],"parameters":[76],"linear":[79],"regressor":[80],"that":[81,122],"predicts":[83],"humans'":[84],"reading":[85],"times":[86],"in-context":[88],"linguistic":[89],"units,":[90],"e.g.,":[91],"phonemes,":[92],"morphemes,":[93],"or":[94],"words,":[95],"using":[96],"surprisal":[97],"estimates":[98],"derived":[99],"from":[100],"model.":[103],"Using":[104],"words":[105],"test":[108,154],"case,":[109],"evaluate":[111],"our":[112],"across":[114],"multiple":[115],"sizes":[117],"and":[118,120,139],"datasets":[119],"find":[121,132],"improves":[124],"models'":[126],"predictive":[128],"power.":[129],"However,":[130],"an":[133],"inverse":[134],"relationship":[135],"between":[136],"power":[138],"model's":[141,182],"performance":[142],"downstream":[144],"NLP":[145],"tasks":[146],"well":[148],"its":[150],"perplexity":[151],"held-out":[153],"While":[156],"latter":[158],"trend":[159],"has":[160],"been":[161],"observed":[162],"before":[163],"(Oh":[164],"et":[165,169],"al.,":[166,170],"2022;":[167],"Shain":[168],"2024),":[171],"first":[175],"induce":[177],"manipulating":[180]},"counts_by_year":[],"updated_date":"2026-02-09T09:26:11.010843","created_date":"2025-10-10T00:00:00"}
