stable-diffusion-webui/modules/devices.py

import torch

# has_mps is only available in nightly pytorch (for now), `getattr` for compatibility
from modules import errors

def _detect_mps():
    """Report whether the Metal (MPS) backend can actually be used.

    The legacy ``torch.has_mps`` attribute describes how PyTorch was built,
    not whether a usable Metal device is present, so it can be true on
    machines that cannot run MPS kernels. Prefer
    ``torch.backends.mps.is_available()`` when the running PyTorch exposes it
    and fall back to the legacy attribute otherwise.

    Returns:
        bool: True when the MPS backend is reported as usable.
    """
    mps_backend = getattr(torch.backends, 'mps', None)
    is_available = getattr(mps_backend, 'is_available', None)
    if callable(is_available):
        return bool(is_available())

    # Older builds: `has_mps` may be missing entirely, hence `getattr`.
    return bool(getattr(torch, 'has_mps', False))


has_mps = _detect_mps()

# Shared CPU device handle reused by the helpers in this module.
cpu = torch.device("cpu")


def get_optimal_device():
    """Pick the torch device this process should run on.

    Preference order: CUDA when ``torch.cuda.is_available()`` is true, then
    MPS when the module-level ``has_mps`` flag is truthy, otherwise the
    module-level ``cpu`` device.

    Returns:
        torch.device: the selected device.
    """
    if torch.cuda.is_available():
        chosen = torch.device("cuda")
    elif has_mps:
        chosen = torch.device("mps")
    else:
        chosen = cpu

    return chosen


def torch_gc():
    """Ask PyTorch to release cached CUDA memory; does nothing without CUDA."""
    if not torch.cuda.is_available():
        return

    # Drop cached allocator blocks first, then collect memory held for CUDA IPC.
    torch.cuda.empty_cache()
    torch.cuda.ipc_collect()


def enable_tf32():
    """Turn on TF32 for CUDA matmul and cuDNN; does nothing without CUDA."""
    if not torch.cuda.is_available():
        return

    torch.backends.cuda.matmul.allow_tf32 = True
    torch.backends.cudnn.allow_tf32 = True


# Enable TF32 at import time through `errors.run` (defined in modules.errors;
# presumably it reports a failure under the given label instead of raising --
# confirm against that module).
errors.run(enable_tf32, "Enabling TF32")

# Device selected once at import time and used by the helpers below.
device = get_optimal_device()

# When the MPS flag is set, the codeformer device is pinned to the CPU;
# otherwise it shares the main device.
if has_mps:
    device_codeformer = cpu
else:
    device_codeformer = device

# Half-precision dtype exposed at module level; its consumers live outside this file.
dtype = torch.float16

def randn(seed, shape):
    """Return standard-normal noise of ``shape`` on ``device``, seeded with ``seed``.

    On every device type except MPS the global torch seed is set and the
    tensor is sampled directly on ``device``. On MPS the tensor is sampled on
    the CPU from a dedicated generator seeded with ``seed`` and then moved to
    ``device``.

    Args:
        seed: integer seed for the random number generator.
        shape: shape of the tensor to create.

    Returns:
        torch.Tensor: the sampled noise, located on ``device``.
    """
    if device.type != 'mps':
        torch.manual_seed(seed)
        return torch.randn(shape, device=device)

    # Pytorch currently doesn't handle setting randomness correctly when the metal backend is used.
    cpu_rng = torch.Generator(device=cpu)
    cpu_rng.manual_seed(seed)
    cpu_noise = torch.randn(shape, generator=cpu_rng, device=cpu)
    return cpu_noise.to(device)


def randn_without_seed(shape):
    """Return standard-normal noise of ``shape`` on ``device`` without reseeding.

    The tensor is drawn from the current state of torch's global random number
    generator, so successive calls yield different values.

    Args:
        shape: shape of the tensor to create.

    Returns:
        torch.Tensor: the sampled noise, located on ``device``.
    """
    # Pytorch currently doesn't handle setting randomness correctly when the metal backend is used.
    if device.type == 'mps':
        # Sample on the CPU from the global RNG, then move to the device.
        # A freshly constructed torch.Generator always starts from the same
        # default seed, so building one per call (as this function used to)
        # produced identical noise on every invocation.
        return torch.randn(shape, device=cpu).to(device)

    return torch.randn(shape, device=device)
Modular device management 2022-09-11 13:11:27 +08:00			`import torch`

			# has_mps is only available in nightly pytorch (for now), `getattr` for compatibility
Allow TF32 in CUDA for increased performance #279 2022-09-12 21:34:13 +08:00			`from modules import errors`

Modular device management 2022-09-11 13:11:27 +08:00			`has_mps = getattr(torch, 'has_mps', False)`

CLIP interrogator 2022-09-11 23:48:36 +08:00			`cpu = torch.device("cpu")`


Modular device management 2022-09-11 13:11:27 +08:00			`def get_optimal_device():`
CLIP interrogator 2022-09-11 23:48:36 +08:00			`if torch.cuda.is_available():`
			`return torch.device("cuda")`

			`if has_mps:`
			`return torch.device("mps")`

			`return cpu`
add half() support for CLIP interrogation 2022-09-12 04:24:24 +08:00

			`def torch_gc():`
			`if torch.cuda.is_available():`
			`torch.cuda.empty_cache()`
			`torch.cuda.ipc_collect()`
Allow TF32 in CUDA for increased performance #279 2022-09-12 21:34:13 +08:00

			`def enable_tf32():`
			`if torch.cuda.is_available():`
			`torch.backends.cuda.matmul.allow_tf32 = True`
			`torch.backends.cudnn.allow_tf32 = True`


			`errors.run(enable_tf32, "Enabling TF32")`
changes for #294 2022-09-13 01:09:32 +08:00
			`device = get_optimal_device()`
			`device_codeformer = cpu if has_mps else device`
initial support for training textual inversion 2022-10-02 20:03:39 +08:00			`dtype = torch.float16`
changes for #294 2022-09-13 01:09:32 +08:00
			`def randn(seed, shape):`
			`# Pytorch currently doesn't handle setting randomness correctly when the metal backend is used.`
			`if device.type == 'mps':`
			`generator = torch.Generator(device=cpu)`
			`generator.manual_seed(seed)`
			`noise = torch.randn(shape, generator=generator, device=cpu).to(device)`
			`return noise`

			`torch.manual_seed(seed)`
			`return torch.randn(shape, device=device)`

first attempt to produce correct seeds in batch 2022-09-14 02:49:58 +08:00
			`def randn_without_seed(shape):`
			`# Pytorch currently doesn't handle setting randomness correctly when the metal backend is used.`
			`if device.type == 'mps':`
			`generator = torch.Generator(device=cpu)`
			`noise = torch.randn(shape, generator=generator, device=cpu).to(device)`
			`return noise`

			`return torch.randn(shape, device=device)`