mirror of
https://github.com/huggingface/candle.git
synced 2025-06-17 19:18:50 +00:00
88 lines
3.1 KiB
Rust
88 lines
3.1 KiB
Rust
use candle::{safetensors::Load, DType, Device, Result, Shape, Tensor, Var};
|
|
use std::collections::HashMap;
|
|
use std::sync::{Arc, Mutex};
|
|
|
|
/// A `VarMap` is a store that holds named variables. Variables can be retrieved from the stores
|
|
/// and new variables can be added by providing some initialization config in case they are
|
|
/// missing.
|
|
/// `VarMap` structures can be serialized in the safetensors format.
|
|
#[derive(Clone)]
|
|
pub struct VarMap {
|
|
data: Arc<Mutex<HashMap<String, Var>>>,
|
|
}
|
|
|
|
impl VarMap {
|
|
/// Create a new empty `VarMap`.
|
|
#[allow(clippy::new_without_default)]
|
|
pub fn new() -> Self {
|
|
let data = Arc::new(Mutex::new(HashMap::new()));
|
|
Self { data }
|
|
}
|
|
|
|
/// Retrieve all the variables currently stored in the map.
|
|
pub fn all_vars(&self) -> Vec<Var> {
|
|
let tensor_data = self.data.lock().unwrap();
|
|
#[allow(clippy::map_clone)]
|
|
tensor_data.values().map(|c| c.clone()).collect::<Vec<_>>()
|
|
}
|
|
|
|
/// Save the map in the safetensors format.
|
|
pub fn save<P: AsRef<std::path::Path>>(&self, path: P) -> Result<()> {
|
|
let tensor_data = self.data.lock().unwrap();
|
|
let data = tensor_data.iter().map(|(k, v)| (k, v.as_tensor()));
|
|
safetensors::tensor::serialize_to_file(data, &None, path.as_ref())?;
|
|
Ok(())
|
|
}
|
|
|
|
/// Load some values from a safetensors file and modify the existing variables to have these
|
|
/// values.
|
|
///
|
|
/// Note that values for variables that are currently not in the map are not kept.
|
|
pub fn load<P: AsRef<std::path::Path>>(&mut self, path: P) -> Result<()> {
|
|
let path = path.as_ref();
|
|
let data = unsafe { candle::safetensors::MmapedFile::new(path)? };
|
|
let data = data.deserialize()?;
|
|
let mut tensor_data = self.data.lock().unwrap();
|
|
for (name, var) in tensor_data.iter_mut() {
|
|
match data.tensor(name) {
|
|
Ok(data) => {
|
|
let data: Tensor = data.load(var.device())?;
|
|
if let Err(err) = var.set(&data) {
|
|
candle::bail!("error setting {name} using data from {path:?}: {err}",)
|
|
}
|
|
}
|
|
Err(_) => candle::bail!("cannot find tensor for {name}"),
|
|
}
|
|
}
|
|
Ok(())
|
|
}
|
|
|
|
/// Retrieve or add a new variable.
|
|
pub fn get<S: Into<Shape>>(
|
|
&self,
|
|
shape: S,
|
|
path: &str,
|
|
init: crate::Init,
|
|
dtype: DType,
|
|
device: &Device,
|
|
) -> Result<Tensor> {
|
|
let shape = shape.into();
|
|
let mut tensor_data = self.data.lock().unwrap();
|
|
if let Some(tensor) = tensor_data.get(path) {
|
|
let tensor_shape = tensor.shape();
|
|
if &shape != tensor_shape {
|
|
candle::bail!("shape mismatch on {path}: {shape:?} <> {tensor_shape:?}")
|
|
}
|
|
return Ok(tensor.as_tensor().clone());
|
|
}
|
|
let var = init.var(shape, dtype, device)?;
|
|
let tensor = var.as_tensor().clone();
|
|
tensor_data.insert(path.to_string(), var);
|
|
Ok(tensor)
|
|
}
|
|
|
|
pub fn data(&self) -> &Mutex<HashMap<String, Var>> {
|
|
&self.data
|
|
}
|
|
}
|