diffusers/run.py at docs · python273/diffusers

History

executable file

153 lines (115 loc) · 4.61 KB

Raw

100

101

102

103

104

105

106

107

108

109

110

111

112

113

114

115

116

117

118

119

120

121

122

123

124

125

126

127

128

129

130

131

132

133

134

135

136

137

138

139

140

141

142

143

144

145

146

147

148

149

150

151

152

153

#!/usr/bin/env python3

import numpy as np

import PIL

import torch

#from configs.ve import ffhq_ncsnpp_continuous as configs

# from configs.ve import cifar10_ncsnpp_continuous as configs

device = torch.device('cuda:0') if torch.cuda.is_available() else torch.device('cpu')

torch.backends.cuda.matmul.allow_tf32 = False

torch.manual_seed(0)

class NewReverseDiffusionPredictor:

def __init__(self, score_fn, probability_flow=False, sigma_min=0.0, sigma_max=0.0, N=0):

super().__init__()

self.sigma_min = sigma_min

self.sigma_max = sigma_max

self.N = N

self.discrete_sigmas = torch.exp(torch.linspace(np.log(self.sigma_min), np.log(self.sigma_max), N))

self.probability_flow = probability_flow

self.score_fn = score_fn

def discretize(self, x, t):

timestep = (t * (self.N - 1)).long()

sigma = self.discrete_sigmas.to(t.device)[timestep]

adjacent_sigma = torch.where(timestep == 0, torch.zeros_like(t),

self.discrete_sigmas[timestep - 1].to(t.device))

f = torch.zeros_like(x)

G = torch.sqrt(sigma ** 2 - adjacent_sigma ** 2)

labels = self.sigma_min * (self.sigma_max / self.sigma_min) ** t

result = self.score_fn(x, labels)

rev_f = f - G[:, None, None, None] ** 2 * result * (0.5 if self.probability_flow else 1.)

rev_G = torch.zeros_like(G) if self.probability_flow else G

return rev_f, rev_G

def update_fn(self, x, t):

f, G = self.discretize(x, t)

z = torch.randn_like(x)

x_mean = x - f

x = x_mean + G[:, None, None, None] * z

return x, x_mean

class NewLangevinCorrector:

def __init__(self, score_fn, snr, n_steps, sigma_min=0.0, sigma_max=0.0):

super().__init__()

self.score_fn = score_fn

self.snr = snr

self.n_steps = n_steps

self.sigma_min = sigma_min

self.sigma_max = sigma_max

def update_fn(self, x, t):

score_fn = self.score_fn

n_steps = self.n_steps

target_snr = self.snr

# if isinstance(sde, VPSDE) or isinstance(sde, subVPSDE):

# timestep = (t * (sde.N - 1) / sde.T).long()

# alpha = sde.alphas.to(t.device)[timestep]

# else:

alpha = torch.ones_like(t)

for i in range(n_steps):

labels = self.sigma_min * (self.sigma_max / self.sigma_min) ** t

grad = score_fn(x, labels)

noise = torch.randn_like(x)

grad_norm = torch.norm(grad.reshape(grad.shape[0], -1), dim=-1).mean()

noise_norm = torch.norm(noise.reshape(noise.shape[0], -1), dim=-1).mean()

step_size = (target_snr * noise_norm / grad_norm) ** 2 * 2 * alpha

x_mean = x + step_size[:, None, None, None] * grad

x = x_mean + torch.sqrt(step_size * 2)[:, None, None, None] * noise

return x, x_mean

def save_image(x):

image_processed = np.clip(x.permute(0, 2, 3, 1).cpu().numpy() * 255, 0, 255).astype(np.uint8)

image_pil = PIL.Image.fromarray(image_processed[0])

image_pil.save("../images/hey.png")

# ckpt_filename = "exp/ve/cifar10_ncsnpp_continuous/checkpoint_24.pth"

#ckpt_filename = "exp/ve/ffhq_1024_ncsnpp_continuous/checkpoint_60.pth"

# Note usually we need to restore ema etc...

# ema restored checkpoint used from below

N = 2

sigma_min = 0.01

sigma_max = 1348

sampling_eps = 1e-5

batch_size = 1

centered = False

from diffusers import NCSNpp

model = NCSNpp.from_pretrained("/home/patrick/ffhq_ncsnpp").to(device)

model = torch.nn.DataParallel(model)

img_size = model.module.config.image_size

channels = model.module.config.num_channels

shape = (batch_size, channels, img_size, img_size)

probability_flow = False

snr = 0.15

n_steps = 1

new_corrector = NewLangevinCorrector(score_fn=model, snr=snr, n_steps=n_steps, sigma_min=sigma_min, sigma_max=sigma_max)

new_predictor = NewReverseDiffusionPredictor(score_fn=model, sigma_min=sigma_min, sigma_max=sigma_max, N=N)

with torch.no_grad():

# Initial sample

x = torch.randn(*shape) * sigma_max

x = x.to(device)

timesteps = torch.linspace(1, sampling_eps, N, device=device)

for i in range(N):

t = timesteps[i]

vec_t = torch.ones(shape[0], device=t.device) * t

x, x_mean = new_corrector.update_fn(x, vec_t)

x, x_mean = new_predictor.update_fn(x, vec_t)

x = x_mean

if centered:

x = (x + 1.) / 2.

# save_image(x)

# for 5 cifar10

x_sum = 106071.9922

x_mean = 34.52864456176758

# for 1000 cifar10

x_sum = 461.9700

x_mean = 0.1504

# for 2 for 1024

x_sum = 3382810112.0

x_mean = 1075.366455078125

def check_x_sum_x_mean(x, x_sum, x_mean):

assert (x.abs().sum() - x_sum).abs().cpu().item() < 1e-2, f"sum wrong {x.abs().sum()}"

assert (x.abs().mean() - x_mean).abs().cpu().item() < 1e-4, f"mean wrong {x.abs().mean()}"

check_x_sum_x_mean(x, x_sum, x_mean)

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

FilesExpand file tree

run.py

Latest commit

History

run.py

File metadata and controls