Merge branch 'dev' into master

author: AUTOMATIC1111 <16777216c@gmail.com> 2023-11-05 19:30:57 +0300
committer: GitHub <noreply@github.com> 2023-11-05 19:30:57 +0300
commit: ff805d8d0eb8e3de42f04747de0d1c7354491810 (patch)
tree: c6e557895ff3172bad42da469a6912ac718078a1 /modules/devices.py
parent: 44c5097375ae4cf40300c09473bb46cf6c5d6cb7 (diff)
parent: c3699d4fd185d5a7285c5519f9bb4b6fec236d9f (diff)
1 file changed, 2 insertions, 1 deletion
diff --git a/modules/devices.py b/modules/devices.py
index c01f0602..1d4eb563 100644
--- a/modules/devices.py
+++ b/modules/devices.py
@@ -60,7 +60,8 @@ def enable_tf32():
 
         # enabling benchmark option seems to enable a range of cards to do fp16 when they otherwise can't
         # see https://github.com/AUTOMATIC1111/stable-diffusion-webui/pull/4407
-        if any(torch.cuda.get_device_capability(devid) == (7, 5) for devid in range(0, torch.cuda.device_count())):
+        device_id = (int(shared.cmd_opts.device_id) if shared.cmd_opts.device_id is not None and shared.cmd_opts.device_id.isdigit() else 0) or torch.cuda.current_device()
+        if torch.cuda.get_device_capability(device_id) == (7, 5) and torch.cuda.get_device_name(device_id).startswith("NVIDIA GeForce GTX 16"):
             torch.backends.cudnn.benchmark = True
 
         torch.backends.cuda.matmul.allow_tf32 = True
author	AUTOMATIC1111 <16777216c@gmail.com>	2023-11-05 19:30:57 +0300
committer	GitHub <noreply@github.com>	2023-11-05 19:30:57 +0300
commit	ff805d8d0eb8e3de42f04747de0d1c7354491810 (patch)
tree	c6e557895ff3172bad42da469a6912ac718078a1 /modules/devices.py
parent	44c5097375ae4cf40300c09473bb46cf6c5d6cb7 (diff)
parent	c3699d4fd185d5a7285c5519f9bb4b6fec236d9f (diff)