mirror of
https://github.com/huggingface/candle.git
synced 2025-06-19 03:54:56 +00:00
Quantized version of flux. (#2500)
* Quantized version of flux.
* More generic sampling.
* Hook the quantized model.
* Use the newly minted gguf file.
* Fix for the quantized model.
* Default to avoid the faster cuda kernels.
This commit is contained in:
@@ -92,8 +92,8 @@ pub fn unpack(xs: &Tensor, height: usize, width: usize) -> Result<Tensor> {
|
||||
}
|
||||
|
||||
#[allow(clippy::too_many_arguments)]
|
||||
pub fn denoise(
|
||||
model: &super::model::Flux,
|
||||
pub fn denoise<M: super::WithForward>(
|
||||
model: &M,
|
||||
img: &Tensor,
|
||||
img_ids: &Tensor,
|
||||
txt: &Tensor,
|
||||
|
Reference in New Issue
Block a user