当前位置：首页 > wzjs >正文

泉州网站建设工程宣传软文是什么意思

wzjs 2025/8/11 1:37:46

泉州网站建设工程,宣传软文是什么意思,yusi wordpress,初做淘宝客选哪个网站 简介：生成式扩散模型已经成为生成式人工智能的基础。对于工程上常见的数据生成任务（曲线、向量并非图像），并不需要用到相对复杂的U-Net和注意力机制，只需要普通的全连接神经网络即可搭建扩散模型。本文则提供一个简易的代码……

简介

生成式扩散模型已经成为生成式人工智能的基础。对于工程上常见的数据生成任务（曲线、向量并非图像），并不需要用到相对复杂的U-Net和注意力机制，只需要普通的全连接神经网络即可搭建扩散模型。

本文则提供一个简易的代码，仅使用全连接神经网络实现Sine正弦曲线的生成任务。所搭建的扩散模型需要输入振幅、频率和相位三个条件（Condition），可从高斯噪声出发，一步一步去噪，并使用Classifier-free guidance技术，得到近似符合条件的Sine函数。

本文的代码可以作为一个学习案例，读者可根据具体工程问题，将三个条件（Condition）扩充，实现其他数据生成任务。

方法

代码改编自：
https://github.com/cloneofsimo/minDiffusion
和
https://github.com/TeaPearce/Conditional_Diffusion_MNIST
扩散模型理论源于：
https://arxiv.org/abs/2006.11239
条件引导的理论源于：
https://arxiv.org/abs/2207.12598

代码

代码由dataset.py、generation.py、network.py、train.py四个文件构成，文件目录如下：
在这里插入图片描述
dataset.py用于定义训练用的数据集，也就是随机生成的正弦曲线，曲线由数列表示。

from torch.utils.data import Dataset
import numpy as np# 自定义数据集类
class SinWaveDataset(Dataset):
    """Synthetic dataset of randomly parameterised sine curves.

    Every sample is ``amplitude * sin(freq * t + phase)`` evaluated at
    ``sequence_length`` evenly spaced points ``t`` in ``[0, 4*pi]``.  Its
    label is the vector ``[amplitude, freq, phase]``.  All curves are
    generated once, at construction time, with NumPy's global RNG.

    Args:
        num_samples: Number of curves to generate.
        sequence_length: Number of points per curve.

    Attributes:
        data: float32 array of shape ``(num_samples, sequence_length)``.
        labels: float32 array of shape ``(num_samples, 3)``.
    """

    def __init__(self, num_samples, sequence_length):
        self.num_samples = num_samples
        self.sequence_length = sequence_length
        self.data, self.labels = self.generate_data()

    def generate_data(self):
        """Generate all curves and their ``[amplitude, freq, phase]`` labels.

        Returns:
            A ``(data, labels)`` tuple of float32 arrays with shapes
            ``(num_samples, sequence_length)`` and ``(num_samples, 3)``.
            The shapes hold for an empty dataset as well.
        """
        # The time grid is the same for every sample, so build it only once.
        t = np.linspace(0, 4 * np.pi, self.sequence_length)

        # Preallocating keeps the 2-D shape even when num_samples == 0.
        data = np.empty((self.num_samples, self.sequence_length), dtype=np.float32)
        labels = np.empty((self.num_samples, 3), dtype=np.float32)

        for i in range(self.num_samples):
            # Draw order (freq, amplitude, phase) is kept so that seeded runs
            # reproduce the same curves as before.
            freq = np.random.uniform(1.0, 10.0)  # random frequency
            amplitude = np.random.uniform(0.5, 2.0)  # random amplitude
            phase = np.random.uniform(0, 2 * np.pi)  # random phase
            data[i] = amplitude * np.sin(freq * t + phase)
            labels[i] = (amplitude, freq, phase)

        return data, labels

    def __len__(self):
        return self.num_samples

    def __getitem__(self, idx):
        return self.data[idx], self.labels[idx]

network.py用于定义神经网络：FCNN是全连接神经网络，EmbedFC是全连接嵌入层，ddpm_schedules定义了扩散模型的加噪规律，DDPM的forward用于预测噪声，DDPM的sample用于完成训练后的数据生成。

import torch
import torch.nn as nn
import numpy as np# GPU or CPU
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")


class FCNN(nn.Module):
    """Fully connected network that predicts noise from a noisy signal.

    The time embedding and the condition embedding are concatenated to the
    input of every linear layer, not only the first one, so each layer sees
    the conditioning directly.

    Args:
        hidden_sizes: Width of each hidden layer (at least one entry).
        x_size: Length of the signal vector; also the output width.
        time_embed_size: Width of the time embedding.
        condition_size: Number of raw condition values.
        condition_embed_size: Width of the condition embedding.
    """

    def __init__(self, hidden_sizes, x_size, time_embed_size, condition_size, condition_embed_size):
        super().__init__()
        # Extra width every layer receives from the two embeddings.
        bypass_size = time_embed_size + condition_embed_size

        # Linear layers are created in the order first -> hidden -> output.
        linear_layers = [nn.Linear(x_size + bypass_size, hidden_sizes[0])]
        for prev_width, width in zip(hidden_sizes[:-1], hidden_sizes[1:]):
            linear_layers.append(nn.Linear(prev_width + bypass_size, width))
        linear_layers.append(nn.Linear(hidden_sizes[-1] + bypass_size, x_size))

        self.layers = nn.ModuleList(linear_layers)
        # One batch-norm per hidden layer; the output layer has none.
        self.bn_layers = nn.ModuleList([nn.BatchNorm1d(width) for width in hidden_sizes])

        self.leaky_relu = nn.LeakyReLU(0.01)
        self.dropout = nn.Dropout(0.05)

        self.time_embeding = EmbedFC(1, time_embed_size)
        self.condition_embeding = EmbedFC(condition_size, condition_embed_size)

    def forward(self, x, time, condition, context_mask):
        """Predict the noise for ``x``.

        Args:
            x: Noisy signal batch.
            time: Time value per sample, fed to the time embedding.
            condition: Raw condition values per sample.
            context_mask: Per-sample mask; a value of 1 zeroes the condition
                embedding for that sample, a value of 0 keeps it.

        Returns:
            The output of the final linear layer (width ``x_size``).
        """
        time_embed = self.time_embeding(time)
        condition_embed = self.condition_embeding(condition) * (1.0 - context_mask)
        # The same embeddings are appended in front of every layer.
        bypass = torch.cat((time_embed, condition_embed), 1)

        hidden = x
        for linear, batch_norm in zip(self.layers[:-1], self.bn_layers):
            hidden = linear(torch.cat((hidden, bypass), 1))
            hidden = self.dropout(batch_norm(self.leaky_relu(hidden)))

        return self.layers[-1](torch.cat((hidden, bypass), 1))


# A fully connected neural network for embed
class EmbedFC(nn.Module):
    """Single linear layer that embeds a flat feature vector.

    Args:
        input_dim: Number of input features per sample.
        emb_dim: Width of the embedding.
    """

    def __init__(self, input_dim, emb_dim):
        super().__init__()
        self.input_dim = input_dim
        layers = [nn.Linear(input_dim, emb_dim)]
        self.model = nn.Sequential(*layers)

    def forward(self, x):
        # Flatten to (N, input_dim) so that 1-D inputs such as a vector of
        # time values are accepted as well.
        x = x.view(-1, self.input_dim)
        return self.model(x)


def ddpm_schedules(beta1, beta2, T):
    """Return the pre-computed schedules for DDPM training and sampling.

    ``beta_t`` grows linearly from ``beta1`` (index 0) to ``beta2`` (index
    ``T``); every returned tensor has ``T + 1`` entries.

    Args:
        beta1: First value of the noise schedule.
        beta2: Last value of the noise schedule.
        T: Number of diffusion steps.

    Returns:
        Dict of 1-D float32 tensors keyed by schedule name.
    """
    # The lower bound is checked too, so the check matches its message.
    assert 0.0 < beta1 < beta2 < 1.0, "beta1 and beta2 must be in (0, 1)"

    beta_t = (beta2 - beta1) * torch.arange(0, T + 1, dtype=torch.float32) / T + beta1
    sqrt_beta_t = torch.sqrt(beta_t)
    alpha_t = 1 - beta_t
    log_alpha_t = torch.log(alpha_t)
    # Cumulative product of alpha_t, computed in log space.
    alphabar_t = torch.cumsum(log_alpha_t, dim=0).exp()

    sqrtab = torch.sqrt(alphabar_t)
    oneover_sqrta = 1 / torch.sqrt(alpha_t)

    sqrtmab = torch.sqrt(1 - alphabar_t)
    mab_over_sqrtmab_inv = (1 - alpha_t) / sqrtmab

    return {
        "alpha_t": alpha_t,  # \alpha_t
        "oneover_sqrta": oneover_sqrta,  # 1/\sqrt{\alpha_t}
        "sqrt_beta_t": sqrt_beta_t,  # \sqrt{\beta_t}
        "alphabar_t": alphabar_t,  # \bar{\alpha_t}
        "sqrtab": sqrtab,  # \sqrt{\bar{\alpha_t}}
        "sqrtmab": sqrtmab,  # \sqrt{1-\bar{\alpha_t}}
        "mab_over_sqrtmab": mab_over_sqrtmab_inv,  # (1-\alpha_t)/\sqrt{1-\bar{\alpha_t}}
    }


class DDPM(nn.Module):
    """Conditional DDPM wrapper around a noise-prediction network.

    Args:
        nn_model: Network called as ``nn_model(x_t, t, condition, context_mask)``
            that returns the predicted noise.
        betas: ``(beta1, beta2)`` pair passed to ``ddpm_schedules``.
        n_T: Number of diffusion steps.
        device: Device the network is moved to and on which training
            tensors are created.
        drop_prob: Probability, per training sample, of masking out the
            condition.
    """

    def __init__(self, nn_model, betas, n_T, device, drop_prob=0.1):
        super().__init__()
        self.nn_model = nn_model.to(device)
        num_params = sum(p.numel() for p in nn_model.parameters())
        print(f"Parameter number: {num_params*1e-6}M")

        # register_buffer exposes each schedule as an attribute
        # (e.g. self.sqrtab) and lets it follow the module across devices.
        for k, v in ddpm_schedules(betas[0], betas[1], n_T).items():
            self.register_buffer(k, v)

        self.n_T = n_T
        self.device = device
        self.drop_prob = drop_prob
        self.loss_mse = nn.MSELoss()

    def forward(self, x, condition):
        """Return the training loss for one batch.

        A random time step and random noise are drawn per sample; the loss is
        the MSE between the added noise and the network's prediction.

        Args:
            x: Batch of clean signals.
            condition: Batch of condition vectors, one row per sample.
        """
        # t is drawn uniformly from the integers 1..n_T (both inclusive).
        _ts = torch.randint(1, self.n_T + 1, (x.shape[0],)).to(self.device)
        noise = torch.randn_like(x)  # eps ~ N(0, 1)

        # x_t = sqrt(alphabar) * x_0 + sqrt(1 - alphabar) * eps
        x_t = self.sqrtab[_ts, None] * x + self.sqrtmab[_ts, None] * noise

        # Mask out the condition with probability drop_prob (one draw per sample).
        context_mask = torch.bernoulli(
            torch.zeros_like(condition[:, 0:1]) + self.drop_prob
        ).to(self.device)

        # MSE between the added noise and the predicted noise.
        return self.loss_mse(noise, self.nn_model(x_t, _ts / self.n_T, condition, context_mask))

    def sample(self, n_sample, x_size, device, guide_w=0.0, condition=None):
        """Generate samples with classifier-free guidance.

        Each step runs the network on a doubled batch: the first half keeps
        the condition (mask 0), the second half has it masked out (mask 1).
        The two predictions are mixed as ``(1 + w) * eps_cond - w * eps_uncond``.

        Args:
            n_sample: Number of samples to generate.
            x_size: Length of each generated vector.
            device: Device on which sampling tensors are created.
            guide_w: Guidance weight ``w``; larger means stronger guidance.
            condition: 1-D tensor of condition values shared by all samples.
                Required, despite the ``None`` default.

        Returns:
            ``(x_i, x_i_store)``: the final samples of shape
            ``(n_sample, x_size)`` and a tensor of every intermediate step,
            ordered so that index 0 is the final step.

        Raises:
            ValueError: If ``condition`` is ``None``.
        """
        if condition is None:
            raise ValueError("condition is required: pass a 1-D tensor of condition values")

        # x_T ~ N(0, 1): start from pure noise.
        x_i = torch.randn(n_sample, x_size).to(device)
        condition = condition.unsqueeze(0).repeat(n_sample, 1).to(device)

        # Doubled batch: first half conditional, second half context-free.
        context_mask = torch.zeros_like(condition[:, 0:1]).to(device)
        condition = condition.repeat(2, 1)
        context_mask = context_mask.repeat(2, 1)
        context_mask[n_sample:] = 1.0

        x_i_store = []  # every intermediate step, kept for plotting
        for i in range(self.n_T, 0, -1):
            print(f'sampling timestep {i}\n')
            t_is = torch.tensor([i / self.n_T]).to(device).repeat(2 * n_sample)

            # No fresh noise is added on the last step.
            z = torch.randn(n_sample, x_size).to(device) if i > 1 else 0

            # Predict on the doubled batch, then mix the two halves.
            eps = self.nn_model(x_i.repeat(2, 1), t_is, condition, context_mask)
            eps_cond = eps[:n_sample]
            eps_uncond = eps[n_sample:]
            eps = (1.0 + guide_w) * eps_cond - guide_w * eps_uncond

            x_i = (
                self.oneover_sqrta[i] * (x_i - eps * self.mab_over_sqrtmab[i])
                + self.sqrt_beta_t[i] * z
            )
            x_i_store.append(x_i.detach().cpu().numpy())

        x_i_store.reverse()
        x_i_store = np.array(x_i_store)
        x_i_store = torch.Tensor(x_i_store)
        return x_i, x_i_store

train.py用于训练神经网络

'''
This script does conditional latent generation using a diffusion model.

This code is modified from,
https://github.com/cloneofsimo/minDiffusion
and
https://github.com/TeaPearce/Conditional_Diffusion_MNIST

Diffusion model is based on DDPM,
https://arxiv.org/abs/2006.11239

The conditioning idea is taken from 'Classifier-Free Diffusion Guidance',
https://arxiv.org/abs/2207.12598

This technique also features in Imagen 'Photorealistic Text-to-Image Diffusion Models
with Deep Language Understanding',
https://arxiv.org/abs/2205.11487
'''
from tqdm import tqdm
import torch
from torch.utils.data import DataLoader
import matplotlib.pyplot as plt
import math
from network import DDPM,FCNN
from dataset import SinWaveDataset


def main():
    """Train the conditional DDPM on random sine curves and save the model.

    All hyper-parameters are hard-coded below.  The log10 of the smoothed
    training loss is plotted as training proceeds, and the whole model object
    is written to ``DDPM/SineTest/ddpm.pth`` at the end.
    """
    import os  # local import: only needed to prepare the checkpoint directory

    device = torch.device("cuda") if torch.cuda.is_available() else torch.device("cpu")

    # Hard-coded training parameters.
    n_epoch = 2000
    batch_size = 512
    n_T = 1000
    lrate = 1e-3
    x_size = 128
    time_embed_size = 64
    condition_size = 3
    condition_embed_size = 64
    save_path = "DDPM/SineTest/ddpm.pth"

    # torch.save does not create missing directories.  Creating the target
    # directory up front means a bad path fails before training starts,
    # not after all epochs have run.
    os.makedirs(os.path.dirname(save_path), exist_ok=True)

    ddpm = DDPM(
        nn_model=FCNN(
            hidden_sizes=[4096, 4096, 4096, 4096],
            x_size=x_size,
            time_embed_size=time_embed_size,
            condition_size=condition_size,
            condition_embed_size=condition_embed_size,
        ),
        betas=(1e-4, 0.02),
        n_T=n_T,
        device=device,
        drop_prob=0.05,
    )
    # Also moves the schedule buffers registered by DDPM to the device.
    ddpm.to(device)

    # Create dataset.
    train_dataset = SinWaveDataset(5000, x_size)
    train_dataloader = DataLoader(train_dataset, batch_size=batch_size, shuffle=True, num_workers=5)
    optim = torch.optim.Adam(ddpm.parameters(), lr=lrate)

    # NOTE(review): the loop nesting below was reconstructed from source text
    # whose line breaks were lost: loss logged per step, curve redrawn per
    # epoch, model saved once after training. Confirm against the original.
    losses = []
    for ep in range(n_epoch):
        print(f'epoch {ep}')
        ddpm.train()

        # Linear learning-rate decay.
        optim.param_groups[0]['lr'] = lrate * (1 - ep / n_epoch)

        pbar = tqdm(train_dataloader)
        loss_ema = None
        for x, c in pbar:
            optim.zero_grad()
            x = x.to(device)
            c = c.to(device)
            loss = ddpm(x, c)
            loss.backward()
            # Exponential moving average of the loss, for display and plotting.
            if loss_ema is None:
                loss_ema = loss.item()
            else:
                loss_ema = 0.95 * loss_ema + 0.05 * loss.item()
            pbar.set_description(f"loss: {loss_ema:.4f}")
            optim.step()
            losses.append(math.log10(loss_ema))

        # Draw loss curve.
        plt.clf()
        plt.plot(losses)
        plt.xlabel('Steps')
        plt.ylabel('Loss')
        plt.title('Training Loss Curve')
        plt.pause(0.001)

    torch.save(ddpm, save_path)
    print('model saved model')


if __name__ == "__main__":
    main()

generation.py用于训练完成后生成数据

import numpy as np
import torch
import matplotlib.pyplot as plt# GPU or CPU
device = torch.device("cuda") if torch.cuda.is_available() else torch.device("cpu")


def generate_samples(n_sample, condition, guide_w):
    """Load the trained DDPM and generate curves for one condition.

    Args:
        n_sample: Number of curves to generate.
        condition: 1-D tensor ``[amplitude, frequency, phase]``.
        guide_w: Classifier-free guidance weight passed to ``sample``.

    Returns:
        The first value returned by ``ddpm.sample`` (the generated curves).
    """
    with torch.no_grad():
        # The checkpoint is a whole pickled module, not a state_dict, so it
        # must be loaded with weights_only=False. Since PyTorch 2.6,
        # torch.load defaults to weights_only=True and rejects such files.
        # NOTE: unpickling can run arbitrary code; only load trusted checkpoints.
        ddpm = torch.load("DDPM/SineTest/ddpm.pth", map_location=device, weights_only=False)
        ddpm.eval()
        x_gen, _ = ddpm.sample(
            n_sample=n_sample,
            x_size=128,
            device=device,
            guide_w=guide_w,
            condition=condition,
        )
    return x_gen


if __name__ == "__main__":
    # Requested amplitude, frequency and phase.
    condition = torch.tensor([1.5, 4.0, np.pi / 2])

    # Generate samples.
    out = generate_samples(n_sample=30, condition=condition, guide_w=1.0)
    out = out.cpu().numpy()

    # Plot every generated curve in one figure.
    plt.figure(figsize=(10, 6))
    for i, curve in enumerate(out, start=1):
        plt.plot(curve, label=f'Curve {i}')

    plt.legend()
    plt.title('30 Curves with 128 Data Points Each')
    plt.xlabel('Data Points')
    plt.ylabel('Values')
    plt.show()