Fix the revision used in starcoder to use the safetensors PR. (#269)

This commit is contained in:
Laurent Mazare
2023-07-28 14:02:31 +01:00
committed by GitHub
parent fb84ead8f7
commit a0e47aba98
2 changed files with 6 additions and 9 deletions

View File

@@ -316,7 +316,7 @@ impl GPTBigCode {
.map(|i| Block::load(vb_t.pp(&format!("h.{i}")), &cfg))
.collect::<Result<Vec<_>>>()?;
let ln_f = layer_norm(hidden_size, cfg.layer_norm_epsilon, vb_t.pp("ln_f"))?;
let lm_head = linear(hidden_size, cfg.vocab_size, false, vb.pp("lm_head"))?;
let lm_head = linear(hidden_size, cfg.vocab_size, false, vb_t.pp("wte"))?;
let bias = make_causal_mask(cfg.max_position_embeddings, vb.device())?;
Ok(Self {
wte,