Merge branch 'AUTOMATIC1111:master' into master

author: Zac Liu <liuguang@baai.ac.cn> 2022-12-06 09:16:15 +0800
committer: GitHub <noreply@github.com> 2022-12-06 09:16:15 +0800
commit: 3ebf977a6e4f478ab918e44506974beee32da276 (patch)
tree: f68456207e5cd78718ec1e9c588ecdc22d568d81 /modules/devices.py
parent: 231fb72872191ffa8c446af1577c9003b3d19d4f (diff)
parent: 44c46f0ed395967cd3830dd481a2db759fda5b3b (diff)
1 file changed, 20 insertions, 13 deletions
diff --git a/modules/devices.py b/modules/devices.py
index e69c1fe3..397b4b95 100644
--- a/modules/devices.py
+++ b/modules/devices.py
@@ -44,6 +44,15 @@ def get_optimal_device():
     return cpu
 
 
+def get_device_for(task):
+    from modules import shared
+
+    if task in shared.cmd_opts.use_cpu:
+        return cpu
+
+    return get_optimal_device()
+
+
 def torch_gc():
     if torch.cuda.is_available():
         with torch.cuda.device(get_cuda_device_string()):
@@ -53,37 +62,35 @@ def torch_gc():
 
 def enable_tf32():
     if torch.cuda.is_available():
+
+        # enabling benchmark option seems to enable a range of cards to do fp16 when they otherwise can't
+        # see https://github.com/AUTOMATIC1111/stable-diffusion-webui/pull/4407
+        if any([torch.cuda.get_device_capability(devid) == (7, 5) for devid in range(0, torch.cuda.device_count())]):
+            torch.backends.cudnn.benchmark = True
+
         torch.backends.cuda.matmul.allow_tf32 = True
         torch.backends.cudnn.allow_tf32 = True
 
 
+
 errors.run(enable_tf32, "Enabling TF32")
 
 cpu = torch.device("cpu")
-device = device_interrogate = device_gfpgan = device_swinir = device_esrgan = device_scunet = device_codeformer = None
+device = device_interrogate = device_gfpgan = device_esrgan = device_codeformer = None
 dtype = torch.float16
 dtype_vae = torch.float16
 
 
 def randn(seed, shape):
-    # Pytorch currently doesn't handle setting randomness correctly when the metal backend is used.
-    if device.type == 'mps':
-        generator = torch.Generator(device=cpu)
-        generator.manual_seed(seed)
-        noise = torch.randn(shape, generator=generator, device=cpu).to(device)
-        return noise
-
     torch.manual_seed(seed)
+    if device.type == 'mps':
+        return torch.randn(shape, device=cpu).to(device)
     return torch.randn(shape, device=device)
 
 
 def randn_without_seed(shape):
-    # Pytorch currently doesn't handle setting randomness correctly when the metal backend is used.
     if device.type == 'mps':
-        generator = torch.Generator(device=cpu)
-        noise = torch.randn(shape, generator=generator, device=cpu).to(device)
-        return noise
-
+        return torch.randn(shape, device=cpu).to(device)
     return torch.randn(shape, device=device)
author	Zac Liu <liuguang@baai.ac.cn>	2022-12-06 09:16:15 +0800
committer	GitHub <noreply@github.com>	2022-12-06 09:16:15 +0800
commit	3ebf977a6e4f478ab918e44506974beee32da276 (patch)
tree	f68456207e5cd78718ec1e9c588ecdc22d568d81 /modules/devices.py
parent	231fb72872191ffa8c446af1577c9003b3d19d4f (diff)
parent	44c46f0ed395967cd3830dd481a2db759fda5b3b (diff)