mirror of
https://github.com/huggingface/candle.git
synced 2025-06-19 03:54:56 +00:00
Faster matmul when we can fall back to gemv.
This commit is contained in:
@ -111,6 +111,7 @@ impl TransformerWeights {
|
||||
// matrix column major rather than row major. This ends up speeding up text generation from
|
||||
// 120 token/s to 220 token/s on a Ryzen 2600X.
|
||||
let tr = device.is_cpu() && !candle::utils::has_mkl();
|
||||
let tr = false;
|
||||
let tr = |x: Tensor| if tr { x.t()?.contiguous()?.t() } else { Ok(x) };
|
||||
let mut ws = std::collections::HashMap::new();
|
||||
let mut insert = |name: &str, t: Tensor| {
|
||||
|
Reference in New Issue
Block a user