Oysiyl committed on
Commit
3490b07
·
1 Parent(s): 1652ae0

Switch torch.compile mode from 'reduce-overhead' to 'max-autotune' for faster inference

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -365,7 +365,7 @@ def _apply_torch_compile_optimizations():
365
  set_torch_compile_wrapper(
366
  model=standard_model,
367
  backend="inductor",
368
- mode="reduce-overhead", # Best for iterative sampling
369
  fullgraph=False, # Allow SAG to capture attention maps (disabled in SAG code)
370
  dynamic=True, # Handle variable batch sizes during CFG without recompiling
371
  keys=["diffusion_model"], # Compile UNet only
@@ -377,7 +377,7 @@ def _apply_torch_compile_optimizations():
377
  set_torch_compile_wrapper(
378
  model=artistic_model,
379
  backend="inductor",
380
- mode="reduce-overhead",
381
  fullgraph=False, # Allow SAG to capture attention maps (disabled in SAG code)
382
  dynamic=True, # Handle variable batch sizes during CFG without recompiling
383
  keys=["diffusion_model"], # Compile UNet only
 
365
  set_torch_compile_wrapper(
366
  model=standard_model,
367
  backend="inductor",
368
+ mode="max-autotune", # Maximum runtime speed (longer compile time is OK during warmup)
369
  fullgraph=False, # Allow SAG to capture attention maps (disabled in SAG code)
370
  dynamic=True, # Handle variable batch sizes during CFG without recompiling
371
  keys=["diffusion_model"], # Compile UNet only
 
377
  set_torch_compile_wrapper(
378
  model=artistic_model,
379
  backend="inductor",
380
+ mode="max-autotune", # Maximum runtime speed (longer compile time is OK during warmup)
381
  fullgraph=False, # Allow SAG to capture attention maps (disabled in SAG code)
382
  dynamic=True, # Handle variable batch sizes during CFG without recompiling
383
  keys=["diffusion_model"], # Compile UNet only