{"id":"https://openalex.org/W4406459044","doi":"https://doi.org/10.1109/bigdata62323.2024.10825481","title":"Can a Large Language Model Learn Matrix Functions In Context?","display_name":"Can a Large Language Model Learn Matrix Functions In Context?","publication_year":2024,"publication_date":"2024-12-15","ids":{"openalex":"https://openalex.org/W4406459044","doi":"https://doi.org/10.1109/bigdata62323.2024.10825481"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata62323.2024.10825481","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata62323.2024.10825481","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Big Data (BigData)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5001694225","display_name":"Paul J. Goulart","orcid":"https://orcid.org/0000-0002-0456-4124"},"institutions":[{"id":"https://openalex.org/I103635307","display_name":"University of California, Riverside","ror":"https://ror.org/03nawhv43","country_code":"US","type":"education","lineage":["https://openalex.org/I103635307"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Paimon Goulart","raw_affiliation_strings":["University of California Riverside,Computer Science and Engineering,Riverside,CA,USA"],"affiliations":[{"raw_affiliation_string":"University of California Riverside,Computer Science and Engineering,Riverside,CA,USA","institution_ids":["https://openalex.org/I103635307"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5054849323","display_name":"Evangelos E. Papalexakis","orcid":"https://orcid.org/0000-0002-3411-8483"},"institutions":[{"id":"https://openalex.org/I103635307","display_name":"University of California, Riverside","ror":"https://ror.org/03nawhv43","country_code":"US","type":"education","lineage":["https://openalex.org/I103635307"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Evangelos E. Papalexakis","raw_affiliation_strings":["University of California Riverside,Computer Science and Engineering,Riverside,CA,USA"],"affiliations":[{"raw_affiliation_string":"University of California Riverside,Computer Science and Engineering,Riverside,CA,USA","institution_ids":["https://openalex.org/I103635307"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5001694225"],"corresponding_institution_ids":["https://openalex.org/I103635307"],"apc_list":null,"apc_paid":null,"fwci":0.3626,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.70787371,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"5335","last_page":"5341"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9941999912261963,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9941999912261963,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.991599977016449,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9847999811172485,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7204623818397522},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5367407202720642},{"id":"https://openalex.org/keywords/context-model","display_name":"Context model","score":0.44476377964019775},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4065156579017639},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3554064631462097},{"id":"https://openalex.org/keywords/history","display_name":"History","score":0.09674990177154541}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7204623818397522},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5367407202720642},{"id":"https://openalex.org/C183322885","wikidata":"https://www.wikidata.org/wiki/Q17007702","display_name":"Context model","level":3,"score":0.44476377964019775},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4065156579017639},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3554064631462097},{"id":"https://openalex.org/C95457728","wikidata":"https://www.wikidata.org/wiki/Q309","display_name":"History","level":0,"score":0.09674990177154541},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.0},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bigdata62323.2024.10825481","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata62323.2024.10825481","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Big Data (BigData)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.49000000953674316,"display_name":"Quality Education"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320338281","display_name":"Army Research Office","ror":"https://ror.org/05epdh915"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W391578156","https://openalex.org/W2097998348","https://openalex.org/W2118550318","https://openalex.org/W2990138404","https://openalex.org/W3035965352","https://openalex.org/W3099878876","https://openalex.org/W4312258136","https://openalex.org/W4319586039","https://openalex.org/W4385567149","https://openalex.org/W4387559176","https://openalex.org/W4389519294","https://openalex.org/W4390041933","https://openalex.org/W4405621262","https://openalex.org/W6674385629","https://openalex.org/W6809646742","https://openalex.org/W6853344003","https://openalex.org/W6856830087","https://openalex.org/W6871553294","https://openalex.org/W6875004255"],"related_works":["https://openalex.org/W3204019825","https://openalex.org/W2349222429","https://openalex.org/W2116230991","https://openalex.org/W3117430770","https://openalex.org/W2046058552","https://openalex.org/W2590751808","https://openalex.org/W1972377868","https://openalex.org/W2132709506","https://openalex.org/W2098730537","https://openalex.org/W2186895195"],"abstract_inverted_index":{"Large":[0],"Language":[1],"Models":[2],"(LLMs)":[3],"have":[4],"demonstrated":[5],"the":[6,33,48,89,105,126,167],"ability":[7],"to":[8,37,60,142,157],"solve":[9,38],"complex":[10,85,162],"tasks":[11],"through":[12],"In-Context":[13],"Learning":[14],"(ICL),":[15],"where":[16],"models":[17,62,82],"learn":[18],"from":[19],"a":[20],"few":[21],"input-output":[22],"pairs":[23],"without":[24],"explicit":[25],"fine-tuning":[26],"[1].":[27],"In":[28],"this":[29],"paper,":[30],"we":[31,110],"explore":[32],"capacity":[34],"of":[35,47,91,169],"LLMs":[36,57,96,113,136],"non-linear":[39],"numerical":[40,172],"computations,":[41],"with":[42,118],"specific":[43],"emphasis":[44],"on":[45,83,153],"functions":[46],"Singular":[49,93],"Value":[50],"Decomposition.":[51],"Our":[52],"experiments":[53],"show":[54],"that":[55,112,135],"while":[56,165],"perform":[58],"comparably":[59],"traditional":[61],"such":[63],"as":[64,104],"Stochastic":[65],"Gradient":[66],"Descent":[67],"(SGD)":[68],"based":[69],"Linear":[70],"Regression":[71],"and":[72,124,160],"Neural":[73],"Networks":[74],"(NN)":[75],"for":[76,145],"simpler":[77],"tasks,":[78,86],"they":[79],"outperform":[80],"these":[81,155],"more":[84,161],"particularly":[87],"in":[88,129,174],"case":[90],"top-k":[92],"Values.":[94],"Furthermore,":[95],"demonstrate":[97],"strong":[98],"scalability,":[99],"maintaining":[100],"high":[101,116],"accuracy":[102,117],"even":[103],"matrix":[106,163],"size":[107],"increases.":[108],"Additionally,":[109],"found":[111],"can":[114],"achieve":[115],"minimal":[119],"prior":[120],"examples,":[121],"converging":[122],"quickly":[123],"avoiding":[125],"overfitting":[127],"seen":[128],"classical":[130,143],"models.":[131],"These":[132],"results":[133],"suggest":[134],"could":[137],"provide":[138],"an":[139],"efficient":[140],"alternative":[141],"methods":[144],"solving":[146],"high-dimensional":[147],"problems.":[148],"Future":[149],"work":[150],"will":[151],"focus":[152],"extending":[154],"findings":[156],"larger":[158],"matrices":[159],"operations":[164],"exploring":[166],"effect":[168],"using":[170],"different":[171],"representations":[173],"ICL.":[175]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
