Skip to content

Commit

Permalink
Merge pull request #12924 from catboxanon/fix/cudnn
Browse files (browse the repository at this point in the history)
More accurate check for enabling cuDNN benchmark on 16XX cards
  • Loading branch information
AUTOMATIC1111 authored Sep 9, 2023
2 parents 4ebed49 + 5681bf8 commit 558baff
Showing 1 changed file with 2 additions and 1 deletion.
3 changes: 2 additions & 1 deletion modules/devices.py
Original file line number Diff line number Diff line change
@@ -60,7 +60,8 @@ def enable_tf32():

# enabling benchmark option seems to enable a range of cards to do fp16 when they otherwise can't
# see https://github.com/AUTOMATIC1111/stable-diffusion-webui/pull/4407
- if any(torch.cuda.get_device_capability(devid) == (7, 5) for devid in range(0, torch.cuda.device_count())):
+ device_id = (int(shared.cmd_opts.device_id) if shared.cmd_opts.device_id.isdigit() else 0) or torch.cuda.current_device()
+ if torch.cuda.get_device_capability(device_id) == (7, 5) and torch.cuda.get_device_name(device_id).startswith("NVIDIA GeForce GTX 16"):
torch.backends.cudnn.benchmark = True

torch.backends.cuda.matmul.allow_tf32 = True
Expand Down

0 comments on commit 558baff

Please sign in to comment.