mirror of
https://github.com/huggingface/candle.git
synced 2025-06-15 18:28:24 +00:00
Sketch a simd128 optimized q4k vecdot. (#977)
* Sketch a simd128 optimized q4k vecdot.
* Simdify.
* More quantization optimizations.
* Again more simdification.
* Simdify the splitting loop.
This commit is contained in:
@ -133,6 +133,12 @@ fn quantized_matmul_q40() -> Result<()> {
|
||||
Ok(())
|
||||
}
|
||||
|
||||
/// Q4K variant of the quantized matmul test: runs the generic
/// `ggml_matmul_error_test` helper with `BlockQ4K` as the block type.
///
/// An error returned by the helper is propagated to the caller via `?`;
/// otherwise the function returns `Ok(())`.
#[wasm_bindgen_test]
|
||||
fn quantized_matmul_q4k() -> Result<()> {
|
||||
// NOTE(review): `ggml_matmul_error_test` is defined outside this view; what it
// actually checks (presumably a matmul error bound) should be confirmed there.
ggml_matmul_error_test::<candle::quantized::k_quants::BlockQ4K>()?;
|
||||
Ok(())
|
||||
}
|
||||
|
||||
#[wasm_bindgen_test]
|
||||
fn quantized_matmul_q80() -> Result<()> {
|
||||
ggml_matmul_error_test::<candle::quantized::k_quants::BlockQ8_0>()?;
|
||||
|
Reference in New Issue
Block a user