PerturbDiff/src/models/diffusion/diffusion_core.py at main · DeepGraphLearning/PerturbDiff

History

264 lines (219 loc) · 9.83 KB

Raw

100

101

102

103

104

105

106

107

108

109

110

111

112

113

114

115

116

117

118

119

120

121

122

123

124

125

126

127

128

129

130

131

132

133

134

135

136

137

138

139

140

141

142

143

144

145

146

147

148

149

150

151

152

153

154

155

156

157

158

159

160

161

162

163

164

165

166

167

168

169

170

171

172

173

174

175

176

177

178

179

180

181

182

183

184

185

186

187

188

189

190

191

192

193

194

195

196

197

198

199

200

201

202

203

204

205

206

207

208

209

210

211

212

213

214

215

216

217

218

219

220

221

222

223

224

225

226

227

228

229

230

231

232

233

234

235

236

237

238

239

240

241

242

243

244

245

246

247

248

249

250

251

252

253

254

255

256

257

258

259

260

261

262

263

264

"""Core GaussianDiffusion class assembly (logic-preserving extraction)."""

import enum

import numpy as np

import torch as th

from src.common.utils import _extract_into_tensor

class ModelMeanType(enum.Enum):
    """
    Which quantity the model's output is interpreted as.

    Member values are assigned by ``enum.auto()`` in declaration order, so
    reordering the members changes their integer values.
    """

    # The model predicts x_{t-1}.
    PREVIOUS_X = enum.auto()
    # The model predicts x_0.
    START_X = enum.auto()
    # The model predicts epsilon (the noise).
    EPSILON = enum.auto()

class ModelVarType(enum.Enum):
    """
    What is used as the model's output variance.

    Only fixed (non-learned) variance choices are declared here. How each
    member maps to a concrete variance schedule is decided by the code that
    consumes this enum, not by this class.
    """

    FIXED_SMALL = enum.auto()
    FIXED_LARGE = enum.auto()

class LossType(enum.Enum):
    """
    Which loss the diffusion training code should use.

    Both members are mean-squared-error variants; the exact difference between
    them is defined by the training code that consumes this enum.
    """

    MSE = enum.auto()
    RESCALED_MSE = enum.auto()

    def is_vb(self):
        """
        Report whether this loss is a variational-bound loss.

        :return: always ``False``; no member of this enum is treated as a
                 variational-bound loss.
        """
        return False

from src.models.diffusion.diffusion_sampling import GaussianDiffusionSamplingMixin

from src.models.diffusion.diffusion_training import GaussianDiffusionTrainingMixin

class GaussianDiffusion(
    GaussianDiffusionSamplingMixin,
    GaussianDiffusionTrainingMixin,
):
    """
    Utilities for training and sampling diffusion models.

    Ported directly from here, and then adapted over time to further experimentation.
    https://github.com/hojonathanho/diffusion/blob/1e0dceb3b3495bbe19116a5e1b3596cd0706c543/diffusion_tf/diffusion_utils_2.py#L42

    This class precomputes the per-timestep schedule constants and provides
    the forward-process (q) helpers; sampling and training entry points come
    from the two mixin base classes.

    :param betas: a 1-D array-like of betas, one per diffusion timestep; every
                  value must lie in (0, 1].
                  NOTE(review): the upstream docstring says "starting at T and
                  going to 1", but here index 0 is the first step
                  (``alphas_cumprod_prev[0]`` is 1.0) - confirm the intended
                  ordering with callers.
    :param model_mean_type: a ModelMeanType determining what the model outputs.
    :param model_var_type: a ModelVarType determining how variance is output.
    :param loss_type: a LossType determining the loss function to use.
    :param rescale_timesteps: if True, pass floating point timesteps into the
                              model so that they are always scaled like in the
                              original paper (0 to 1000).
    """

    def __init__(
        self,
        betas,
        model_mean_type,
        model_var_type,
        loss_type,
        rescale_timesteps=False,
    ):
        """
        Store the configuration and precompute all schedule constants.

        All schedule arrays are float64 NumPy arrays of length
        ``num_timesteps``.

        :param betas: 1-D array-like of per-timestep betas in (0, 1].
        :param model_mean_type: stored as ``self.model_mean_type``.
        :param model_var_type: stored as ``self.model_var_type``.
        :param loss_type: stored as ``self.loss_type``.
        :param rescale_timesteps: stored as ``self.rescale_timesteps``; read by
                                  ``_scale_timesteps``.
        :return: None.
        :raises AssertionError: if ``betas`` is not 1-D or has a value outside
                                (0, 1].
        """
        self.model_mean_type = model_mean_type
        self.model_var_type = model_var_type
        self.loss_type = loss_type
        self.rescale_timesteps = rescale_timesteps

        # Use float64 for accuracy.
        betas = np.array(betas, dtype=np.float64)
        self.betas = betas
        assert len(betas.shape) == 1, "betas must be 1-D"
        assert (betas > 0).all() and (betas <= 1).all()

        self.num_timesteps = int(betas.shape[0])

        alphas = 1.0 - betas
        self.alphas_cumprod = np.cumprod(alphas, axis=0)
        # Shifted copies: "prev" is padded with 1.0 at the front, "next" with
        # 0.0 at the end, so both keep length num_timesteps.
        self.alphas_cumprod_prev = np.append(1.0, self.alphas_cumprod[:-1])
        self.alphas_cumprod_next = np.append(self.alphas_cumprod[1:], 0.0)
        assert self.alphas_cumprod_prev.shape == (self.num_timesteps,)

        # calculations for diffusion q(x_t | x_{t-1}) and others
        self.sqrt_alphas_cumprod = np.sqrt(self.alphas_cumprod)
        self.sqrt_one_minus_alphas_cumprod = np.sqrt(1.0 - self.alphas_cumprod)
        self.log_one_minus_alphas_cumprod = np.log(1.0 - self.alphas_cumprod)
        self.sqrt_recip_alphas_cumprod = np.sqrt(1.0 / self.alphas_cumprod)
        self.sqrt_recipm1_alphas_cumprod = np.sqrt(1.0 / self.alphas_cumprod - 1)

        # calculations for posterior q(x_{t-1} | x_t, x_0)
        self.posterior_variance = (
            betas * (1.0 - self.alphas_cumprod_prev) / (1.0 - self.alphas_cumprod)
        )
        # log calculation clipped because the posterior variance is 0 at the
        # beginning of the diffusion chain.
        # NOTE: entry 0 is replaced by entry 1, so this indexing needs at
        # least two timesteps.
        self.posterior_log_variance_clipped = np.log(
            np.append(self.posterior_variance[1], self.posterior_variance[1:])
        )
        self.posterior_mean_coef1 = (
            betas * np.sqrt(self.alphas_cumprod_prev) / (1.0 - self.alphas_cumprod)
        )
        self.posterior_mean_coef2 = (
            (1.0 - self.alphas_cumprod_prev)
            * np.sqrt(alphas)
            / (1.0 - self.alphas_cumprod)
        )

    def _predict_xstart_from_eps(self, x_t, t, eps):
        """
        Recover the x_0 estimate from x_t and a noise estimate.

        Computes ``sqrt(1 / alpha_bar_t) * x_t - sqrt(1 / alpha_bar_t - 1) * eps``.
        The per-timestep coefficients are looked up with
        ``_extract_into_tensor`` (presumably indexed by ``t`` and broadcast to
        ``x_t.shape`` - confirm against that helper).

        :param x_t: the noisy sample at timestep ``t``.
        :param t: timestep indices passed to ``_extract_into_tensor``.
        :param eps: noise estimate; must have the same shape as ``x_t``.
        :return: the x_0 estimate.
        """
        assert x_t.shape == eps.shape
        return (
            _extract_into_tensor(self.sqrt_recip_alphas_cumprod, t, x_t.shape) * x_t
            - _extract_into_tensor(self.sqrt_recipm1_alphas_cumprod, t, x_t.shape) * eps
        )

    def _predict_xstart_from_xprev(self, x_t, t, xprev):
        """
        Recover the x_0 estimate from x_t and an x_{t-1} estimate.

        Inverts the posterior-mean formula used in
        ``q_posterior_mean_variance``: ``(xprev - coef2 * x_t) / coef1``.

        :param x_t: the noisy sample at timestep ``t``.
        :param t: timestep indices passed to ``_extract_into_tensor``.
        :param xprev: x_{t-1} estimate; must have the same shape as ``x_t``.
        :return: the x_0 estimate.
        """
        assert x_t.shape == xprev.shape
        return (  # (xprev - coef2*x_t) / coef1
            _extract_into_tensor(1.0 / self.posterior_mean_coef1, t, x_t.shape) * xprev
            - _extract_into_tensor(
                self.posterior_mean_coef2 / self.posterior_mean_coef1, t, x_t.shape
            )
            * x_t
        )

    def _predict_eps_from_xstart(self, x_t, t, pred_xstart):
        """
        Recover the noise estimate from x_t and an x_0 estimate.

        Algebraic inverse of ``_predict_xstart_from_eps``.

        :param x_t: the noisy sample at timestep ``t``.
        :param t: timestep indices passed to ``_extract_into_tensor``.
        :param pred_xstart: the x_0 estimate.
        :return: the noise estimate.
        """
        return (
            _extract_into_tensor(self.sqrt_recip_alphas_cumprod, t, x_t.shape) * x_t
            - pred_xstart
        ) / _extract_into_tensor(self.sqrt_recipm1_alphas_cumprod, t, x_t.shape)

    def _scale_timesteps(self, t):
        """
        Optionally rescale timestep indices to a 0-1000 range.

        :param t: timestep tensor.
        :return: ``t.float() * (1000.0 / num_timesteps)`` when
                 ``rescale_timesteps`` is set, otherwise ``t`` unchanged.
        """
        if self.rescale_timesteps:
            return t.float() * (1000.0 / self.num_timesteps)
        return t

    def condition_mean(self, cond_fn, p_mean_var, x, t, model_kwargs=None):
        """
        Compute the mean for the previous step, given a function cond_fn that
        computes the gradient of a conditional log probability with respect to
        x. In particular, cond_fn computes grad(log(p(y|x))), and we want to
        condition on y.

        This uses the conditioning strategy from Sohl-Dickstein et al. (2015).

        :param cond_fn: callable invoked as ``cond_fn(x, t_scaled, **model_kwargs)``.
        :param p_mean_var: mapping with at least ``"mean"`` and ``"variance"``.
        :param x: the current sample.
        :param t: timestep tensor; passed through ``_scale_timesteps`` first.
        :param model_kwargs: extra keyword arguments for ``cond_fn``; ``None``
                             is treated as no extra arguments.
        :return: ``mean + variance * gradient``.
        """
        # The default None cannot be unpacked with **, so normalise it first.
        kwargs = {} if model_kwargs is None else model_kwargs
        gradient = cond_fn(x, self._scale_timesteps(t), **kwargs)
        new_mean = (
            p_mean_var["mean"].float() + p_mean_var["variance"] * gradient.float()
        )
        return new_mean

    def condition_score(self, cond_fn, p_mean_var, x, t, model_kwargs=None):
        """
        Compute what the p_mean_variance output would have been, should the
        model's score function be conditioned by cond_fn.

        See condition_mean() for details on cond_fn.

        Unlike condition_mean(), this instead uses the conditioning strategy
        from Song et al (2020).

        :param cond_fn: callable invoked as ``cond_fn(x, t_scaled, **model_kwargs)``.
        :param p_mean_var: mapping with at least ``"pred_xstart"``; it is
                           copied with ``.copy()`` and not mutated.
        :param x: the current sample.
        :param t: timestep tensor.
        :param model_kwargs: extra keyword arguments for ``cond_fn``; ``None``
                             is treated as no extra arguments.
        :return: a copy of ``p_mean_var`` with ``"pred_xstart"`` and ``"mean"``
                 replaced by their conditioned values.
        """
        # The default None cannot be unpacked with **, so normalise it first.
        kwargs = {} if model_kwargs is None else model_kwargs
        alpha_bar = _extract_into_tensor(self.alphas_cumprod, t, x.shape)

        eps = self._predict_eps_from_xstart(x, t, p_mean_var["pred_xstart"])
        eps = eps - (1 - alpha_bar).sqrt() * cond_fn(
            x, self._scale_timesteps(t), **kwargs
        )

        out = p_mean_var.copy()
        out["pred_xstart"] = self._predict_xstart_from_eps(x, t, eps)
        out["mean"], _, _ = self.q_posterior_mean_variance(
            x_start=out["pred_xstart"], x_t=x, t=t
        )
        return out

    def q_mean_variance(self, x_start, t, x_control=None):
        """
        Get the distribution q(x_t | x_0).

        :param x_start: the [N x C x ...] tensor of noiseless inputs.
        :param t: the number of diffusion steps (minus 1). Here, 0 means one step.
        :param x_control: accepted for interface compatibility; not used by
                          this method.
        :return: A tuple (mean, variance, log_variance), all of x_start's shape.
        """
        mean = (
            _extract_into_tensor(self.sqrt_alphas_cumprod, t, x_start.shape) * x_start
        )
        variance = _extract_into_tensor(1.0 - self.alphas_cumprod, t, x_start.shape)
        log_variance = _extract_into_tensor(
            self.log_one_minus_alphas_cumprod, t, x_start.shape
        )
        return mean, variance, log_variance

    def q_sample(self, x_start, t, noise=None, x_control=None):
        """
        Diffuse the data for a given number of diffusion steps.

        In other words, sample from q(x_t | x_0).

        :param x_start: the initial data batch.
        :param t: the number of diffusion steps (minus 1). Here, 0 means one step.
        :param noise: if specified, the split-out normal noise; otherwise
                      fresh noise is drawn with ``th.randn_like(x_start)``.
        :param x_control: accepted for interface compatibility; not used by
                          this method.
        :return: A noisy version of x_start.
        """
        if noise is None:
            noise = th.randn_like(x_start)
        assert noise.shape == x_start.shape
        return (
            _extract_into_tensor(self.sqrt_alphas_cumprod, t, x_start.shape) * x_start
            + _extract_into_tensor(self.sqrt_one_minus_alphas_cumprod, t, x_start.shape)
            * noise
        )

    def q_posterior_mean_variance(self, x_start, x_t, t):
        """
        Compute the mean and variance of the diffusion posterior:

            q(x_{t-1} | x_t, x_0)

        :param x_start: the x_0 tensor (or an estimate of it); must have the
                        same shape as ``x_t``.
        :param x_t: the noisy sample at timestep ``t``.
        :param t: timestep indices passed to ``_extract_into_tensor``.
        :return: A tuple (posterior_mean, posterior_variance,
                 posterior_log_variance_clipped).
        """
        assert x_start.shape == x_t.shape
        posterior_mean = (
            _extract_into_tensor(self.posterior_mean_coef1, t, x_t.shape) * x_start
            + _extract_into_tensor(self.posterior_mean_coef2, t, x_t.shape) * x_t
        )
        posterior_variance = _extract_into_tensor(self.posterior_variance, t, x_t.shape)
        posterior_log_variance_clipped = _extract_into_tensor(
            self.posterior_log_variance_clipped, t, x_t.shape
        )
        # Sanity check: all outputs share the batch dimension of x_start.
        assert (
            posterior_mean.shape[0]
            == posterior_variance.shape[0]
            == posterior_log_variance_clipped.shape[0]
            == x_start.shape[0]
        )
        return posterior_mean, posterior_variance, posterior_log_variance_clipped

# Names exported by `from <this module> import *`: the three configuration
# enums followed by the diffusion class itself.
__all__ = ["LossType", "ModelMeanType", "ModelVarType", "GaussianDiffusion"]

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

FilesExpand file tree

diffusion_core.py

Latest commit

History

diffusion_core.py

File metadata and controls