{"id":"https://openalex.org/W4377130927","doi":"https://doi.org/10.48550/arxiv.2305.10782","title":"Human Behavioral Benchmarking: Numeric Magnitude Comparison Effects in Large Language Models","display_name":"Human Behavioral Benchmarking: Numeric Magnitude Comparison Effects in Large Language Models","publication_year":2023,"publication_date":"2023-05-18","ids":{"openalex":"https://openalex.org/W4377130927","doi":"https://doi.org/10.48550/arxiv.2305.10782"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2305.10782","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2305.10782","pdf_url":"https://arxiv.org/pdf/2305.10782","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2305.10782","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5030471602","display_name":"Raj Sanjay Shah","orcid":"https://orcid.org/0000-0002-0847-8426"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Shah, Raj Sanjay","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035761603","display_name":"Vijay Marupudi","orcid":"https://orcid.org/0000-0001-5128-1197"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Marupudi, Vijay","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091983129","display_name":"Reba Koenen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Koenen, Reba","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074106082","display_name":"Khushi Bhardwaj","orcid":"https://orcid.org/0000-0003-2129-3060"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bhardwaj, Khushi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5036602199","display_name":"Sashank Varma","orcid":"https://orcid.org/0000-0002-1107-0982"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Varma, Sashank","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5030471602"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.9872000217437744,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.9872000217437744,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9419000148773193,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9337999820709229,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.6082971096038818},{"id":"https://openalex.org/keywords/cognition","display_name":"Cognition","score":0.5572569370269775},{"id":"https://openalex.org/keywords/cognitive-psychology","display_name":"Cognitive psychology","score":0.5249084234237671},{"id":"https://openalex.org/keywords/comprehension","display_name":"Comprehension","score":0.4440540671348572},{"id":"https://openalex.org/keywords/ask-price","display_name":"Ask price","score":0.41948631405830383},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4007910490036011},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.3958679139614105},{"id":"https://openalex.org/keywords/neuroscience","display_name":"Neuroscience","score":0.17912057042121887}],"concepts":[{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.6082971096038818},{"id":"https://openalex.org/C169900460","wikidata":"https://www.wikidata.org/wiki/Q2200417","display_name":"Cognition","level":2,"score":0.5572569370269775},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.5249084234237671},{"id":"https://openalex.org/C511192102","wikidata":"https://www.wikidata.org/wiki/Q5156948","display_name":"Comprehension","level":2,"score":0.4440540671348572},{"id":"https://openalex.org/C90329073","wikidata":"https://www.wikidata.org/wiki/Q914232","display_name":"Ask price","level":2,"score":0.41948631405830383},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4007910490036011},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.3958679139614105},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.17912057042121887},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.0},{"id":"https://openalex.org/C136264566","wikidata":"https://www.wikidata.org/wiki/Q159810","display_name":"Economy","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C162853370","wikidata":"https://www.wikidata.org/wiki/Q39809","display_name":"Marketing","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2305.10782","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2305.10782","pdf_url":"https://arxiv.org/pdf/2305.10782","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2305.10782","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2305.10782","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2305.10782","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2305.10782","pdf_url":"https://arxiv.org/pdf/2305.10782","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[{"score":0.8399999737739563,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4377130927.pdf","grobid_xml":"https://content.openalex.org/works/W4377130927.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4238897586","https://openalex.org/W435179959","https://openalex.org/W2619091065","https://openalex.org/W2059640416","https://openalex.org/W1490753184","https://openalex.org/W2284465472","https://openalex.org/W2291782699","https://openalex.org/W1993948687","https://openalex.org/W2000169967","https://openalex.org/W2112883198"],"abstract_inverted_index":{"Large":[0],"Language":[1],"Models":[2],"(LLMs)":[3],"do":[4,85],"not":[5],"differentially":[6],"represent":[7],"numbers,":[8],"which":[9],"are":[10],"pervasive":[11],"in":[12,153],"text.":[13],"In":[14,27],"contrast,":[15],"neuroscience":[16],"research":[17,51,158],"has":[18],"identified":[19],"distinct":[20],"neural":[21,146],"representations":[22,88,134,152,178],"for":[23,64],"numbers":[24,40],"and":[25,103,123,168,181],"words.":[26],"this":[28],"work,":[29],"we":[30,73],"investigate":[31],"how":[32],"well":[33],"popular":[34],"LLMs":[35,57,164,180],"capture":[36],"the":[37,53,86,100,114,117,142,145,154,160,170,176],"magnitudes":[38],"of":[39,56,89,93,120,138,144,162,179],"(e.g.,":[41],"that":[42,148],"$4":[43],"&lt;":[44],"5$)":[45],"from":[46],"a":[47,75,109],"behavioral":[48,166],"lens.":[49],"Prior":[50],"on":[52,69,108,175],"representational":[54],"capabilities":[55],"evaluates":[58],"whether":[59],"they":[60],"show":[61],"human-level":[62],"performance,":[63],"instance,":[65],"high":[66],"overall":[67],"accuracy":[68],"standard":[70],"benchmarks.":[71],"Here,":[72],"ask":[74],"different":[76,139],"question,":[77],"one":[78],"inspired":[79],"by":[80],"cognitive":[81,183],"science:":[82],"How":[83],"closely":[84],"number":[87,121,177],"LLMscorrespond":[90],"to":[91,112,125,172],"those":[92],"human":[94,126,155],"language":[95,136],"users,":[96],"who":[97],"typically":[98],"demonstrate":[99],"distance,":[101],"size,":[102],"ratio":[104],"effects?":[105],"We":[106],"depend":[107],"linking":[110],"hypothesis":[111],"map":[113],"similarities":[115],"among":[116],"model":[118],"embeddings":[119],"words":[122],"digits":[124],"response":[127],"times.":[128],"The":[129],"results":[130],"reveal":[131],"surprisingly":[132],"human-like":[133],"across":[135],"models":[137],"architectures,":[140],"despite":[141],"absence":[143],"circuitry":[147],"directly":[149],"supports":[150],"these":[151],"brain.":[156],"This":[157],"shows":[159],"utility":[161],"understanding":[163],"using":[165],"benchmarks":[167],"points":[169],"way":[171],"future":[173],"work":[174],"their":[182],"plausibility.":[184]},"counts_by_year":[],"updated_date":"2026-03-13T16:22:10.518609","created_date":"2023-05-21T00:00:00"}
