Allow TF32 in CUDA for increased performance #279

2022-09-12 16:34:13 +03:00 · 2022-09-12 16:34:13 +03:00 · b70b51cc72
parent 11e648f6c7
commit b70b51cc72
2 changed files with 21 additions and 0 deletions
--- a/modules/devices.py
+++ b/modules/devices.py
@ -1,6 +1,8 @@
 import torch
 # has_mps is only available in nightly pytorch (for now), `getattr` for compatibility
 from modules import errors
 has_mps = getattr(torch, 'has_mps', False)
 cpu = torch.device("cpu")
@ -20,3 +22,12 @@ def torch_gc():
    if torch.cuda.is_available():
        torch.cuda.empty_cache()
        torch.cuda.ipc_collect()
 def enable_tf32():
    if torch.cuda.is_available():
        torch.backends.cuda.matmul.allow_tf32 = True
        torch.backends.cudnn.allow_tf32 = True
 errors.run(enable_tf32, "Enabling TF32")
--- a/modules/errors.py
+++ b/modules/errors.py
@ -0,0 +1,10 @@
 import sys
 import traceback
 def run(code, task):
    try:
        code()
    except Exception as e:
        print(f"{task}: {type(e).__name__}", file=sys.stderr)
        print(traceback.format_exc(), file=sys.stderr)