Another tweak.

This commit is contained in:
laurent
2024-09-26 10:14:53 +02:00
parent 43a8cbe244
commit ab12425bff

View File

@ -445,13 +445,16 @@ impl QCudaStorage {
} }
_ => crate::bail!("only f32 can be quantized"), _ => crate::bail!("only f32 can be quantized"),
}; };
let src_len = pad_for_alloc(src.len()); let src_len = src.len();
let src = crate::Storage::Cpu(crate::CpuStorage::F32(src)); let src = crate::Storage::Cpu(crate::CpuStorage::F32(src));
let mut qcpu_storage = crate::Device::Cpu.qzeros(src_len, self.dtype)?; let mut qcpu_storage = crate::Device::Cpu.qzeros(src_len, self.dtype)?;
qcpu_storage.quantize(&src)?; qcpu_storage.quantize(&src)?;
let data = qcpu_storage.data()?; let data = qcpu_storage.data()?;
let data = self.device.htod_sync_copy(data.as_ref()).w()?; let mut dst = self.device.alloc_zeros::<u8>(pad_for_alloc(src_len)).w()?;
self.data = data; self.device
.htod_sync_copy_into(data.as_ref(), &mut dst.slice_mut(..src_len))
.w()?;
self.data = dst;
Ok(()) Ok(())
} }