{"id":"https://openalex.org/W4387561528","doi":"https://doi.org/10.48550/arxiv.2310.06825","title":"Mistral 7B","display_name":"Mistral 7B","publication_year":2023,"publication_date":"2023-10-10","ids":{"openalex":"https://openalex.org/W4387561528","doi":"https://doi.org/10.48550/arxiv.2310.06825"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2310.06825","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2310.06825","pdf_url":"https://arxiv.org/pdf/2310.06825","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2310.06825","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5083358660","display_name":"Albert Q. Jiang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Jiang, Albert Q.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067991583","display_name":"Alexandre Sablayrolles","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sablayrolles, Alexandre","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110691380","display_name":"Arthur Mensch","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mensch, Arthur","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012897368","display_name":"Chris Bamford","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bamford, Chris","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016223957","display_name":"Devendra Singh Chaplot","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chaplot, Devendra Singh","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075173651","display_name":"Diego de Las Casas","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Casas, Diego de las","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061952014","display_name":"Florian Bressand","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bressand, Florian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5093047940","display_name":"Gianna Lengyel","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lengyel, Gianna","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054371148","display_name":"Guillaume Lample","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lample, Guillaume","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001689321","display_name":"Lucile Saulnier","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Saulnier, Lucile","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5093047938","display_name":"L\u00e9lio Renard Lavaud","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lavaud, L\u00e9lio Renard","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050998809","display_name":"Marie-Anne Lachaux","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lachaux, Marie-Anne","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066603292","display_name":"Pierre Stock","orcid":"https://orcid.org/0000-0002-3623-3899"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Stock, Pierre","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084957527","display_name":"Teven Le Scao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Scao, Teven Le","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090457109","display_name":"Thibaut Lavril","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lavril, Thibaut","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085451281","display_name":"Thomas J. Wang","orcid":"https://orcid.org/0000-0003-4063-6508"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Thomas","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084553837","display_name":"Timoth\u00e9e Lacroix","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lacroix, Timoth\u00e9e","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5093047939","display_name":"William El Sayed","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sayed, William El","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":18,"corresponding_author_ids":["https://openalex.org/A5083358660"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":285,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9799000024795532,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7308691740036011},{"id":"https://openalex.org/keywords/license","display_name":"License","score":0.7234842777252197},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6908263564109802},{"id":"https://openalex.org/keywords/window","display_name":"Window (computing)","score":0.6399619579315186},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.6289259195327759},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.5423991680145264},{"id":"https://openalex.org/keywords/mit-license","display_name":"MIT License","score":0.4917955696582794},{"id":"https://openalex.org/keywords/sliding-window-protocol","display_name":"Sliding window protocol","score":0.48217934370040894},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3349781334400177},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3191966414451599},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.23578083515167236}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7308691740036011},{"id":"https://openalex.org/C2780560020","wikidata":"https://www.wikidata.org/wiki/Q79719","display_name":"License","level":2,"score":0.7234842777252197},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6908263564109802},{"id":"https://openalex.org/C2778751112","wikidata":"https://www.wikidata.org/wiki/Q835016","display_name":"Window (computing)","level":2,"score":0.6399619579315186},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.6289259195327759},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.5423991680145264},{"id":"https://openalex.org/C174183944","wikidata":"https://www.wikidata.org/wiki/Q334661","display_name":"MIT License","level":3,"score":0.4917955696582794},{"id":"https://openalex.org/C102392041","wikidata":"https://www.wikidata.org/wiki/Q592860","display_name":"Sliding window protocol","level":3,"score":0.48217934370040894},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3349781334400177},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3191966414451599},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.23578083515167236},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2310.06825","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2310.06825","pdf_url":"https://arxiv.org/pdf/2310.06825","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2310.06825","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2310.06825","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2310.06825","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2310.06825","pdf_url":"https://arxiv.org/pdf/2310.06825","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4387561528.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2036021480","https://openalex.org/W2546377002","https://openalex.org/W380079223","https://openalex.org/W3014558862","https://openalex.org/W4285209474","https://openalex.org/W22571951","https://openalex.org/W2046541848","https://openalex.org/W4384009753","https://openalex.org/W2791776396","https://openalex.org/W4286531993"],"abstract_inverted_index":{"We":[0,62],"introduce":[1],"Mistral":[2,15,71],"7B":[3,16,72],"v0.1,":[4],"a":[5,58,65],"7-billion-parameter":[6],"language":[7],"model":[8,36,66,83],"engineered":[9],"for":[10,41],"superior":[11],"performance":[12],"and":[13,25,32,87],"efficiency.":[14],"outperforms":[17],"Llama":[18,26,78],"2":[19,79],"13B":[20,80],"across":[21],"all":[22],"evaluated":[23],"benchmarks,":[24],"1":[27],"34B":[28],"in":[29],"reasoning,":[30],"mathematics,":[31],"code":[33],"generation.":[34],"Our":[35,90],"leverages":[37],"grouped-query":[38],"attention":[39,48],"(GQA)":[40],"faster":[42],"inference,":[43],"coupled":[44],"with":[45,57],"sliding":[46],"window":[47],"(SWA)":[49],"to":[50,68],"effectively":[51],"handle":[52],"sequences":[53],"of":[54],"arbitrary":[55],"length":[56],"reduced":[59],"inference":[60],"cost.":[61],"also":[63],"provide":[64],"fine-tuned":[67],"follow":[69],"instructions,":[70],"--":[73,81],"Instruct,":[74],"that":[75],"surpasses":[76],"the":[77,95],"Chat":[82],"both":[84],"on":[85],"human":[86],"automated":[88],"benchmarks.":[89],"models":[91],"are":[92],"released":[93],"under":[94],"Apache":[96],"2.0":[97],"license.":[98]},"counts_by_year":[{"year":2026,"cited_by_count":52},{"year":2025,"cited_by_count":126},{"year":2024,"cited_by_count":95},{"year":2023,"cited_by_count":11},{"year":2019,"cited_by_count":1}],"updated_date":"2026-06-06T09:05:17.133730","created_date":"2023-10-12T00:00:00"}
