StableLM-2 models were updated to use GPT-2 tokenization. (#1847)

This commit is contained in:
Jani Monoses
2024-03-14 22:01:36 +02:00
committed by GitHub
parent 3318fe30fb
commit e1f9c3776d
2 changed files with 1 addition and 13 deletions

View File

@@ -239,14 +239,7 @@ fn main() -> Result<()> {
));
let tokenizer_filename = match args.tokenizer_file {
Some(file) => std::path::PathBuf::from(file),
None => match args.which {
Which::V1Orig | Which::V1 | Which::V1Zephyr | Which::Code => {
repo.get("tokenizer.json")?
}
Which::V2 | Which::V2Zephyr => api
.model("lmz/candle-stablelm".to_string())
.get("tokenizer-gpt4.json")?,
},
None => repo.get("tokenizer.json")?,
};
let filenames = match args.weight_files {
Some(files) => files