diff --git a/examples/cli/README.md b/examples/cli/README.md index d6c36b8..78f8821 100644 --- a/examples/cli/README.md +++ b/examples/cli/README.md @@ -52,7 +52,8 @@ Context Options: --control-net-cpu keep controlnet in cpu (for low vram) --clip-on-cpu keep clip in cpu (for low vram) --vae-on-cpu keep vae in cpu (for low vram) - --diffusion-fa use flash attention in the diffusion model + --fa use flash attention + --diffusion-fa use flash attention in the diffusion model only --diffusion-conv-direct use ggml_conv2d_direct in the diffusion model --vae-conv-direct use ggml_conv2d_direct in the vae model --circular enable circular padding for convolutions diff --git a/examples/server/README.md b/examples/server/README.md index 354075c..8a2f2e9 100644 --- a/examples/server/README.md +++ b/examples/server/README.md @@ -44,7 +44,8 @@ Context Options: --clip-on-cpu keep clip in cpu (for low vram) --vae-on-cpu keep vae in cpu (for low vram) --mmap whether to memory-map model - --diffusion-fa use flash attention in the diffusion model + --fa use flash attention + --diffusion-fa use flash attention in the diffusion model only --diffusion-conv-direct use ggml_conv2d_direct in the diffusion model --vae-conv-direct use ggml_conv2d_direct in the vae model --circular enable circular padding for convolutions