mirror of
https://github.com/huggingface/candle.git
synced 2025-06-16 02:38:10 +00:00
Separate quantized phi-3 implementation. (#2157)
* Separate quantized phi-3 implementation. * Integrate the quantized phi3 model. * Small fixes, get the generation to work properly. * Keep the old llama implementation around. * Change the default.
This commit is contained in:
@ -676,9 +676,6 @@ impl BackendStorage for MetalStorage {
|
||||
}
|
||||
}
|
||||
|
||||
if layout.is_contiguous() {
|
||||
} else {
|
||||
}
|
||||
Ok(Self::new(buffer, device.clone(), el_count, dtype))
|
||||
}
|
||||
|
||||
|
@ -178,7 +178,7 @@ impl crate::CustomOp1 for ArgSort {
|
||||
device.metal_device(),
|
||||
&command_buffer,
|
||||
kernels,
|
||||
&name,
|
||||
name,
|
||||
nrows,
|
||||
ncols,
|
||||
ncols_pad,
|
||||
|
Reference in New Issue
Block a user