{"id":"https://openalex.org/W4394866680","doi":"https://doi.org/10.48550/arxiv.2404.09562","title":"\u03c3-GPTs: A New Approach to Autoregressive Models","display_name":"\u03c3-GPTs: A New Approach to Autoregressive Models","publication_year":2024,"publication_date":"2024-04-15","ids":{"openalex":"https://openalex.org/W4394866680","doi":"https://doi.org/10.48550/arxiv.2404.09562"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2404.09562","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2404.09562","pdf_url":"https://arxiv.org/pdf/2404.09562","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2404.09562","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5059678146","display_name":"Arnaud Pannatier","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Pannatier, Arnaud","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005306316","display_name":"Evann Courdier","orcid":"https://orcid.org/0000-0003-2135-1910"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Courdier, Evann","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5076094010","display_name":"Fran\u00e7ois Fleuret","orcid":"https://orcid.org/0000-0001-9457-7393"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fleuret, Fran\u00e7ois","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5059678146"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9843000173568726,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9782999753952026,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/autoregressive-model","display_name":"Autoregressive model","score":0.9190854430198669},{"id":"https://openalex.org/keywords/path","display_name":"Path (computing)","score":0.6783296465873718},{"id":"https://openalex.org/keywords/sampling","display_name":"Sampling (signal processing)","score":0.6140656471252441},{"id":"https://openalex.org/keywords/star-model","display_name":"STAR model","score":0.6002405285835266},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5814985036849976},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.5335476994514465},{"id":"https://openalex.org/keywords/on-the-fly","display_name":"On the fly","score":0.5138900279998779},{"id":"https://openalex.org/keywords/order","display_name":"Order (exchange)","score":0.5137354135513306},{"id":"https://openalex.org/keywords/sigma","display_name":"Sigma","score":0.5045996904373169},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.5009217262268066},{"id":"https://openalex.org/keywords/sample","display_name":"Sample (material)","score":0.47010985016822815},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.43222954869270325},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.26703882217407227},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.24598199129104614},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.2036629617214203},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.13781893253326416},{"id":"https://openalex.org/keywords/detector","display_name":"Detector","score":0.1058923602104187},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.07866466045379639},{"id":"https://openalex.org/keywords/time-series","display_name":"Time series","score":0.0777047872543335},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.06201407313346863}],"concepts":[{"id":"https://openalex.org/C159877910","wikidata":"https://www.wikidata.org/wiki/Q2202883","display_name":"Autoregressive model","level":2,"score":0.9190854430198669},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.6783296465873718},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.6140656471252441},{"id":"https://openalex.org/C194657046","wikidata":"https://www.wikidata.org/wiki/Q7394685","display_name":"STAR model","level":4,"score":0.6002405285835266},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5814985036849976},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.5335476994514465},{"id":"https://openalex.org/C2781020372","wikidata":"https://www.wikidata.org/wiki/Q533093","display_name":"On the fly","level":2,"score":0.5138900279998779},{"id":"https://openalex.org/C182306322","wikidata":"https://www.wikidata.org/wiki/Q1779371","display_name":"Order (exchange)","level":2,"score":0.5137354135513306},{"id":"https://openalex.org/C2778049214","wikidata":"https://www.wikidata.org/wiki/Q7512234","display_name":"Sigma","level":2,"score":0.5045996904373169},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.5009217262268066},{"id":"https://openalex.org/C198531522","wikidata":"https://www.wikidata.org/wiki/Q485146","display_name":"Sample (material)","level":2,"score":0.47010985016822815},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.43222954869270325},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.26703882217407227},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.24598199129104614},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.2036629617214203},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.13781893253326416},{"id":"https://openalex.org/C94915269","wikidata":"https://www.wikidata.org/wiki/Q1834857","display_name":"Detector","level":2,"score":0.1058923602104187},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.07866466045379639},{"id":"https://openalex.org/C151406439","wikidata":"https://www.wikidata.org/wiki/Q186588","display_name":"Time series","level":2,"score":0.0777047872543335},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.06201407313346863},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C24338571","wikidata":"https://www.wikidata.org/wiki/Q2566298","display_name":"Autoregressive integrated moving average","level":3,"score":0.0},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.0},{"id":"https://openalex.org/C10138342","wikidata":"https://www.wikidata.org/wiki/Q43015","display_name":"Finance","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2404.09562","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2404.09562","pdf_url":"https://arxiv.org/pdf/2404.09562","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2404.09562","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2404.09562","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2404.09562","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2404.09562","pdf_url":"https://arxiv.org/pdf/2404.09562","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320327931","display_name":"Innosuisse - Schweizerische Agentur f\u00fcr Innovationsf\u00f6rderung","ror":"https://ror.org/05a2bhn71"}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4394866680.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2439807930","https://openalex.org/W2009692134","https://openalex.org/W2019155478","https://openalex.org/W1972271943","https://openalex.org/W2024529895","https://openalex.org/W2168175994","https://openalex.org/W1902630399","https://openalex.org/W2120434453","https://openalex.org/W3120578569","https://openalex.org/W1487412319"],"abstract_inverted_index":{"Autoregressive":[0],"models,":[1],"such":[2],"as":[3],"the":[4,39,56,107],"GPT":[5],"family,":[6],"use":[7],"a":[8,20,35,79,84],"fixed":[9],"order,":[10],"usually":[11],"left-to-right,":[12],"to":[13,78,83],"generate":[14],"sequences.":[15],"However,":[16],"this":[17,23,27,41],"is":[18],"not":[19],"necessity.":[21],"In":[22],"paper,":[24],"we":[25],"challenge":[26],"assumption":[28],"and":[29,59,66,101],"show":[30],"that":[31],"by":[32,114],"simply":[33],"adding":[34],"positional":[36],"encoding":[37],"for":[38,55,112],"output,":[40],"order":[42,116],"can":[43],"be":[44],"modulated":[45],"on-the-fly":[46],"per-sample":[47],"which":[48],"offers":[49],"key":[50],"advantageous":[51],"properties.":[52],"It":[53],"allows":[54,69],"sampling":[57,70],"of":[58,64,87,109,117],"conditioning":[60],"on":[61],"arbitrary":[62],"subsets":[63],"tokens,":[65],"it":[67],"also":[68],"in":[71],"one":[72],"shot":[73],"multiple":[74],"tokens":[75],"dynamically":[76],"according":[77],"rejection":[80],"strategy,":[81],"leading":[82],"sub-linear":[85],"number":[86,108],"model":[88],"evaluations.":[89],"We":[90],"evaluate":[91],"our":[92],"method":[93],"across":[94],"various":[95],"domains,":[96],"including":[97],"language":[98],"modeling,":[99],"path-solving,":[100],"aircraft":[102],"vertical":[103],"rate":[104],"prediction,":[105],"decreasing":[106],"steps":[110],"required":[111],"generation":[113],"an":[115],"magnitude.":[118]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
