Turn off CUDA malloc by default when --fast autotune is turned on. (#10393)

This commit is contained in:
comfyanonymous
2025-10-18 19:35:46 -07:00
committed by GitHub
parent 9da397ea2f
commit 5b80addafd
3 changed files with 7 additions and 6 deletions

View File

@@ -371,6 +371,9 @@ try:
except:
pass
if torch.cuda.is_available() and torch.backends.cudnn.is_available() and PerformanceFeature.AutoTune in args.fast:
torch.backends.cudnn.benchmark = True
try:
if torch_version_numeric >= (2, 5):
torch.backends.cuda.allow_fp16_bf16_reduction_math_sdp(True)