Skip to content

Commit

Permalink
Quantized version of mistral.
Browse files Browse the repository at this point in the history
  • Loading branch information
LaurentMazare committed Sep 30, 2023
1 parent 0620733 commit 3bcaa94
Show file tree
Hide file tree
Showing 3 changed files with 375 additions and 12 deletions.
24 changes: 12 additions & 12 deletions candle-transformers/src/models/mistral.rs
Original file line number Diff line number Diff line change
Expand Up @@ -6,18 +6,18 @@ use std::sync::Arc;

/// Configuration struct declared in `candle-transformers/src/models/mistral.rs`.
///
/// NOTE(review): this listing is a rendered diff hunk, not compilable source. Every field
/// appears twice: the first twelve field lines (no visibility modifier) are the lines the
/// commit removed, and the twelve `pub(crate)` lines after them are their replacements.
/// Only one set of fields exists in the real file at any revision.
#[derive(Debug, Clone, PartialEq)]
pub struct Config {
// Removed side of the hunk: fields without a visibility modifier (private to the module).
vocab_size: usize,
hidden_size: usize,
intermediate_size: usize,
num_hidden_layers: usize,
num_attention_heads: usize,
num_key_value_heads: usize,
hidden_act: Activation,
max_position_embeddings: usize,
rms_norm_eps: f64,
rope_theta: f64,
sliding_window: usize,
use_flash_attn: bool,
// Added side of the hunk: same names and types, now readable from anywhere in the crate.
// Presumably widened so the `quantized_mistral` module added by this commit can reuse
// the struct — TODO confirm against that module.
pub(crate) vocab_size: usize,
pub(crate) hidden_size: usize,
pub(crate) intermediate_size: usize,
pub(crate) num_hidden_layers: usize,
pub(crate) num_attention_heads: usize,
pub(crate) num_key_value_heads: usize,
pub(crate) hidden_act: Activation,
pub(crate) max_position_embeddings: usize,
pub(crate) rms_norm_eps: f64,
pub(crate) rope_theta: f64,
pub(crate) sliding_window: usize,
pub(crate) use_flash_attn: bool,
}

impl Config {
Expand Down
1 change: 1 addition & 0 deletions candle-transformers/src/models/mod.rs
Original file line number Diff line number Diff line change
Expand Up @@ -7,6 +7,7 @@ pub mod llama;
pub mod mistral;
pub mod mixformer;
pub mod quantized_llama;
pub mod quantized_mistral;
pub mod quantized_mixformer;
pub mod quantized_t5;
pub mod segment_anything;
Expand Down
Loading

0 comments on commit 3bcaa94

Please sign in to comment.