mirror of
https://github.com/Laurent2916/Diffusers.jl.git
synced 2024-11-09 23:12:03 +00:00
🚚 move DDPM's step from Schedulers.jl to DDPM.jl
This commit is contained in:
parent
cfd090b6e2
commit
b4ed6e3c99
49
src/DDPM.jl
49
src/DDPM.jl
|
@ -19,7 +19,6 @@ struct DDPM{V<:AbstractVector} <: Scheduler
|
||||||
sqrt_one_minus_α_cumprods::V
|
sqrt_one_minus_α_cumprods::V
|
||||||
end
|
end
|
||||||
|
|
||||||
|
|
||||||
function DDPM(V::DataType, βs::AbstractVector)
|
function DDPM(V::DataType, βs::AbstractVector)
|
||||||
αs = 1 .- βs
|
αs = 1 .- βs
|
||||||
α_cumprods = cumprod(αs)
|
α_cumprods = cumprod(αs)
|
||||||
|
@ -39,6 +38,50 @@ function DDPM(V::DataType, βs::AbstractVector)
|
||||||
)
|
)
|
||||||
end
|
end
|
||||||
|
|
||||||
function DDPM(V::DataType, beta_scheduler)
|
function step(
|
||||||
DDPM(V, beta_scheduler)
|
scheduler::DDPM,
|
||||||
|
sample::AbstractArray,
|
||||||
|
model_output::AbstractArray,
|
||||||
|
timesteps::AbstractArray,
|
||||||
|
)
|
||||||
|
"""
|
||||||
|
Remove noise from model output using the backward diffusion process.
|
||||||
|
|
||||||
|
Args:
|
||||||
|
scheduler (`Scheduler`): scheduler object.
|
||||||
|
sample (`AbstractArray`): sample to remove noise from, i.e. model_input.
|
||||||
|
model_output (`AbstractArray`): predicted noise from the model.
|
||||||
|
timesteps (`AbstractArray`): timesteps to remove noise from.
|
||||||
|
|
||||||
|
Returns:
|
||||||
|
`AbstractArray`: denoised model output at the given timestep.
|
||||||
|
"""
|
||||||
|
# 1. compute alphas, betas
|
||||||
|
α_cumprod_t = scheduler.α_cumprods[timesteps]
|
||||||
|
α_cumprod_t_prev = scheduler.α_cumprods[timesteps.-1]
|
||||||
|
β_cumprod_t = 1 .- α_cumprod_t
|
||||||
|
β_cumprod_t_prev = 1 .- α_cumprod_t_prev
|
||||||
|
current_α_t = α_cumprod_t ./ α_cumprod_t_prev
|
||||||
|
current_β_t = 1 .- current_α_t
|
||||||
|
|
||||||
|
# 2. compute predicted original sample from predicted noise also called
|
||||||
|
# "predicted x_0" of formula (15) from https://arxiv.org/pdf/2006.11239.pdf
|
||||||
|
# epsilon prediction type
|
||||||
|
# print shapes of thingies
|
||||||
|
x_0_pred = (sample - sqrt.(β_cumprod_t)' .* model_output) ./ sqrt.(α_cumprod_t)'
|
||||||
|
|
||||||
|
# 4. Compute coefficients for pred_original_sample x_0 and current sample x_t
|
||||||
|
# See formula (7) from https://arxiv.org/pdf/2006.11239.pdf
|
||||||
|
pred_original_sample_coeff = (sqrt.(α_cumprod_t_prev) .* current_β_t) ./ β_cumprod_t
|
||||||
|
current_sample_coeff = sqrt.(current_α_t) .* β_cumprod_t_prev ./ β_cumprod_t
|
||||||
|
|
||||||
|
# 5. Compute predicted previous sample µ_t
|
||||||
|
# See formula (7) from https://arxiv.org/pdf/2006.11239.pdf
|
||||||
|
pred_prev_sample = pred_original_sample_coeff' .* x_0_pred + current_sample_coeff' .* sample
|
||||||
|
|
||||||
|
# 6. Add noise
|
||||||
|
variance = sqrt.(scheduler.βs[timesteps])' .* randn(size(model_output))
|
||||||
|
pred_prev_sample = pred_prev_sample + variance
|
||||||
|
|
||||||
|
return pred_prev_sample, x_0_pred
|
||||||
end
|
end
|
||||||
|
|
|
@ -25,51 +25,3 @@ function add_noise(
|
||||||
|
|
||||||
return noisy_data
|
return noisy_data
|
||||||
end
|
end
|
||||||
|
|
||||||
function step(
|
|
||||||
scheduler::Scheduler,
|
|
||||||
sample::AbstractArray,
|
|
||||||
model_output::AbstractArray,
|
|
||||||
timesteps::AbstractArray,
|
|
||||||
)
|
|
||||||
"""
|
|
||||||
Remove noise from model output using the backward diffusion process.
|
|
||||||
|
|
||||||
Args:
|
|
||||||
scheduler (`Scheduler`): scheduler object.
|
|
||||||
sample (`AbstractArray`): sample to remove noise from, i.e. model_input.
|
|
||||||
model_output (`AbstractArray`): predicted noise from the model.
|
|
||||||
timesteps (`AbstractArray`): timesteps to remove noise from.
|
|
||||||
|
|
||||||
Returns:
|
|
||||||
`AbstractArray`: denoised model output at the given timestep.
|
|
||||||
"""
|
|
||||||
# 1. compute alphas, betas
|
|
||||||
α_cumprod_t = scheduler.α_cumprods[timesteps]
|
|
||||||
α_cumprod_t_prev = scheduler.α_cumprods[timesteps.-1]
|
|
||||||
β_cumprod_t = 1 .- α_cumprod_t
|
|
||||||
β_cumprod_t_prev = 1 .- α_cumprod_t_prev
|
|
||||||
current_α_t = α_cumprod_t ./ α_cumprod_t_prev
|
|
||||||
current_β_t = 1 .- current_α_t
|
|
||||||
|
|
||||||
# 2. compute predicted original sample from predicted noise also called
|
|
||||||
# "predicted x_0" of formula (15) from https://arxiv.org/pdf/2006.11239.pdf
|
|
||||||
# epsilon prediction type
|
|
||||||
# print shapes of thingies
|
|
||||||
x_0_pred = (sample - sqrt.(β_cumprod_t)' .* model_output) ./ sqrt.(α_cumprod_t)'
|
|
||||||
|
|
||||||
# 4. Compute coefficients for pred_original_sample x_0 and current sample x_t
|
|
||||||
# See formula (7) from https://arxiv.org/pdf/2006.11239.pdf
|
|
||||||
pred_original_sample_coeff = (sqrt.(α_cumprod_t_prev) .* current_β_t) ./ β_cumprod_t
|
|
||||||
current_sample_coeff = sqrt.(current_α_t) .* β_cumprod_t_prev ./ β_cumprod_t
|
|
||||||
|
|
||||||
# 5. Compute predicted previous sample µ_t
|
|
||||||
# See formula (7) from https://arxiv.org/pdf/2006.11239.pdf
|
|
||||||
pred_prev_sample = pred_original_sample_coeff' .* x_0_pred + current_sample_coeff' .* sample
|
|
||||||
|
|
||||||
# 6. Add noise
|
|
||||||
variance = sqrt.(scheduler.βs[timesteps])' .* randn(size(model_output))
|
|
||||||
pred_prev_sample = pred_prev_sample + variance
|
|
||||||
|
|
||||||
return pred_prev_sample
|
|
||||||
end
|
|
||||||
|
|
Loading…
Reference in a new issue