feat: use Euler sampling by default for SD3 and Flux (#753)

Thank you for your contribution.
2026-02-04 10:53:34 +00:00 · 2025-09-14 01:34:41 -03:00 · 2025-09-14 01:34:41 -03:00 · c607fc3ed4
commit c607fc3ed4
parent b54bec3f18
4 changed files with 33 additions and 9 deletions
--- a/README.md
+++ b/README.md
@ -334,9 +334,9 @@ arguments:
  --skip-layers LAYERS               Layers to skip for SLG steps: (default: [7,8,9])
  --skip-layer-start START           SLG enabling point: (default: 0.01)
  --skip-layer-end END               SLG disabling point: (default: 0.2)
-  --scheduler {discrete, karras, exponential, ays, gits} Denoiser sigma scheduler (default: discrete)
+  --scheduler {discrete, karras, exponential, ays, gits, smoothstep} Denoiser sigma scheduler (default: discrete)
  --sampling-method {euler, euler_a, heun, dpm2, dpm++2s_a, dpm++2m, dpm++2mv2, ipndm, ipndm_v, lcm, ddim_trailing, tcd}
-                                     sampling method (default: "euler_a")
+                                     sampling method (default: "euler" for Flux/SD3/Wan, "euler_a" otherwise)
  --steps  STEPS                     number of sample steps (default: 20)
  --high-noise-cfg-scale SCALE       (high noise) unconditional guidance scale: (default: 7.0)
  --high-noise-img-cfg-scale SCALE   (high noise) image guidance scale for inpaint or instruct-pix2pix models: (default: same as --cfg-scale)
@ -347,7 +347,7 @@ arguments:
  --high-noise-skip-layers LAYERS    (high noise) Layers to skip for SLG steps: (default: [7,8,9])
  --high-noise-skip-layer-start      (high noise) SLG enabling point: (default: 0.01)
  --high-noise-skip-layer-end END    (high noise) SLG disabling point: (default: 0.2)
-  --high-noise-scheduler {discrete, karras, exponential, ays, gits} Denoiser sigma scheduler (default: discrete)
+  --high-noise-scheduler {discrete, karras, exponential, ays, gits, smoothstep} Denoiser sigma scheduler (default: discrete)
  --high-noise-sampling-method {euler, euler_a, heun, dpm2, dpm++2s_a, dpm++2m, dpm++2mv2, ipndm, ipndm_v, lcm, ddim_trailing, tcd}
                                     (high noise) sampling method (default: "euler_a")
  --high-noise-steps  STEPS          (high noise) number of sample steps (default: -1 = auto)
--- a/examples/cli/main.cpp
+++ b/examples/cli/main.cpp
@ -240,7 +240,7 @@ void print_usage(int argc, const char* argv[]) {
    printf("  --skip-layer-end END               SLG disabling point: (default: 0.2)\n");
    printf("  --scheduler {discrete, karras, exponential, ays, gits, smoothstep} Denoiser sigma scheduler (default: discrete)\n");
    printf("  --sampling-method {euler, euler_a, heun, dpm2, dpm++2s_a, dpm++2m, dpm++2mv2, ipndm, ipndm_v, lcm, ddim_trailing, tcd}\n");
-    printf("                                     sampling method (default: \"euler_a\")\n");
+    printf("                                     sampling method (default: \"euler\" for Flux/SD3/Wan, \"euler_a\" otherwise)\n");
    printf("  --steps  STEPS                     number of sample steps (default: 20)\n");
    printf("  --high-noise-cfg-scale SCALE       (high noise) unconditional guidance scale: (default: 7.0)\n");
    printf("  --high-noise-img-cfg-scale SCALE   (high noise) image guidance scale for inpaint or instruct-pix2pix models: (default: same as --cfg-scale)\n");
@ -1202,6 +1202,10 @@ int main(int argc, const char* argv[]) {
        return 1;
    }

+    if (params.sample_params.sample_method == SAMPLE_METHOD_DEFAULT) {
+        params.sample_params.sample_method = sd_get_default_sample_method(sd_ctx);
+    }
+
    sd_image_t* results;
    int num_results = 1;
    if (params.mode == IMG_GEN) {
--- a/stable-diffusion.cpp
+++ b/stable-diffusion.cpp
@ -43,7 +43,7 @@ const char* model_version_to_str[] = {
 };

 const char* sampling_methods_str[] = {
-    "Euler A",
+    "default",
    "Euler",
    "Heun",
    "DPM2",
@ -55,6 +55,7 @@ const char* sampling_methods_str[] = {
    "LCM",
    "DDIM \"trailing\"",
    "TCD",
+    "Euler A",
 };

 /*================================================== Helper Functions ================================================*/
@ -1500,7 +1501,7 @@ enum rng_type_t str_to_rng_type(const char* str) {
 }

 const char* sample_method_to_str[] = {
-    "euler_a",
+    "default",
    "euler",
    "heun",
    "dpm2",
@ -1512,6 +1513,7 @@ const char* sample_method_to_str[] = {
    "lcm",
    "ddim_trailing",
    "tcd",
+    "euler_a",
 };

 const char* sd_sample_method_name(enum sample_method_t sample_method) {
@ -1650,7 +1652,7 @@ void sd_sample_params_init(sd_sample_params_t* sample_params) {
    sample_params->guidance.slg.layer_end      = 0.2f;
    sample_params->guidance.slg.scale          = 0.f;
    sample_params->scheduler                   = DEFAULT;
-    sample_params->sample_method               = EULER_A;
+    sample_params->sample_method               = SAMPLE_METHOD_DEFAULT;
    sample_params->sample_steps                = 20;
 }

@ -1792,6 +1794,17 @@ void free_sd_ctx(sd_ctx_t* sd_ctx) {
    free(sd_ctx);
 }

+enum sample_method_t sd_get_default_sample_method(const sd_ctx_t* sd_ctx) {
+    if (sd_ctx != NULL && sd_ctx->sd != NULL) {
+        SDVersion version = sd_ctx->sd->version;
+        if (sd_version_is_dit(version))
+            return EULER;
+        else
+            return EULER_A;
+    }
+    return SAMPLE_METHOD_COUNT;
+}
+
 sd_image_t* generate_image_internal(sd_ctx_t* sd_ctx,
                                    struct ggml_context* work_ctx,
                                    ggml_tensor* init_latent,
@ -2356,6 +2369,11 @@ sd_image_t* generate_image(sd_ctx_t* sd_ctx, const sd_img_gen_params_t* sd_img_g
        LOG_INFO("encode_first_stage completed, taking %.2fs", (t1 - t0) * 1.0f / 1000);
    }

+    enum sample_method_t sample_method = sd_img_gen_params->sample_params.sample_method;
+    if (sample_method == SAMPLE_METHOD_DEFAULT) {
+        sample_method = sd_get_default_sample_method(sd_ctx);
+    }
+
    sd_image_t* result_images = generate_image_internal(sd_ctx,
                                                        work_ctx,
                                                        init_latent,
@ -2366,7 +2384,7 @@ sd_image_t* generate_image(sd_ctx_t* sd_ctx, const sd_img_gen_params_t* sd_img_g
                                                        sd_img_gen_params->sample_params.eta,
                                                        width,
                                                        height,
-                                                        sd_img_gen_params->sample_params.sample_method,
+                                                        sample_method,
                                                        sigmas,
                                                        seed,
                                                        sd_img_gen_params->batch_count,
--- a/stable-diffusion.h
+++ b/stable-diffusion.h
@ -35,7 +35,7 @@ enum rng_type_t {
 };

 enum sample_method_t {
-    EULER_A,
+    SAMPLE_METHOD_DEFAULT,
    EULER,
    HEUN,
    DPM2,
@ -47,6 +47,7 @@ enum sample_method_t {
    LCM,
    DDIM_TRAILING,
    TCD,
+    EULER_A,
    SAMPLE_METHOD_COUNT
 };

@ -238,6 +239,7 @@ SD_API char* sd_ctx_params_to_str(const sd_ctx_params_t* sd_ctx_params);

 SD_API sd_ctx_t* new_sd_ctx(const sd_ctx_params_t* sd_ctx_params);
 SD_API void free_sd_ctx(sd_ctx_t* sd_ctx);
+SD_API enum sample_method_t sd_get_default_sample_method(const sd_ctx_t* sd_ctx);

 SD_API void sd_sample_params_init(sd_sample_params_t* sample_params);
 SD_API char* sd_sample_params_to_str(const sd_sample_params_t* sample_params);