mirror of
https://github.com/huggingface/candle.git
synced 2025-06-17 02:58:50 +00:00
Add support for the phi-hermes finetuned model. (#1192)
This commit is contained in:
@ -73,6 +73,23 @@ impl Config {
|
||||
pad_vocab_size_multiple: 64,
|
||||
}
|
||||
}
|
||||
|
||||
// https://huggingface.co/teknium/Phi-Hermes-1.3B/blob/main/config.json
|
||||
pub fn phi_hermes_1_3b() -> Self {
|
||||
Self {
|
||||
vocab_size: 50304,
|
||||
n_positions: 2048,
|
||||
n_embd: 2048,
|
||||
n_layer: 24,
|
||||
n_inner: None,
|
||||
n_head: 32,
|
||||
rotary_dim: usize::min(32, 2048 / 32),
|
||||
activation_function: Activation::NewGelu,
|
||||
layer_norm_epsilon: 1e-5,
|
||||
tie_word_embeddings: false,
|
||||
pad_vocab_size_multiple: 64,
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
#[derive(Debug, Clone)]
|
||||
|
Reference in New Issue
Block a user