#MNIST資料集上條件變分自編碼器#程式碼

阿新 • • 發佈：2021-11-27

import torch
from torch import nn
import torch.nn.functional as F
import torchvision
from torch.utils.data import DataLoader
import utils


class CVAE(nn.Module):
    """Conditional variational auto-encoder made of fully connected layers.

    The encoder takes a feature vector concatenated with its condition
    vector and produces the mean and log standard deviation of the latent
    code. The decoder takes a latent code concatenated with the same
    condition vector and produces a reconstruction in feature space.
    """

    def __init__(self, feature_size, class_size, latent_size):
        """Create the encoder and decoder layers.

        Args:
            feature_size: width of one flattened input sample.
            class_size: width of the condition (label) vector.
            latent_size: width of the latent code.
        """
        super().__init__()
        hidden_size = 200

        # Encoder: [features | condition] -> hidden -> (mu, log_std)
        self.fc1 = nn.Linear(feature_size + class_size, hidden_size)
        self.fc2_mu = nn.Linear(hidden_size, latent_size)
        self.fc2_log_std = nn.Linear(hidden_size, latent_size)
        # Decoder: [latent | condition] -> hidden -> features
        self.fc3 = nn.Linear(latent_size + class_size, hidden_size)
        self.fc4 = nn.Linear(hidden_size, feature_size)

    def encode(self, x, y):
        """Return ``(mu, log_std)`` for features ``x`` conditioned on ``y``."""
        conditioned = torch.cat([x, y], dim=1)  # join along the feature axis
        hidden = F.relu(self.fc1(conditioned))
        return self.fc2_mu(hidden), self.fc2_log_std(hidden)

    def decode(self, z, y):
        """Return the reconstruction for latent code ``z`` conditioned on ``y``."""
        conditioned = torch.cat([z, y], dim=1)  # join along the feature axis
        hidden = F.relu(self.fc3(conditioned))
        # Sigmoid keeps every output in (0, 1); the training data is
        # presumably scaled to that range as well.
        return torch.sigmoid(self.fc4(hidden))

    def reparametrize(self, mu, log_std):
        """Draw ``z = mu + eps * exp(log_std)`` with ``eps`` ~ N(0, 1)."""
        # Sampling eps separately keeps z differentiable w.r.t. mu and log_std.
        noise = torch.randn_like(log_std)
        return mu + noise * torch.exp(log_std)

    def forward(self, x, y):
        """Encode, sample a latent code, decode.

        Returns:
            Tuple ``(recon, mu, log_std)``.
        """
        mu, log_std = self.encode(x, y)
        latent = self.reparametrize(mu, log_std)
        return self.decode(latent, y), mu, log_std

    def loss_function(self, recon, x, mu, log_std) -> torch.Tensor:
        """Return summed squared reconstruction error plus the KL term.

        The KL term is the divergence between N(mu, exp(log_std)^2) and the
        standard normal, summed over every element of ``mu`` / ``log_std``.
        """
        # Summed (not averaged) so the reconstruction term is on the same
        # scale as the summed KL term.
        reconstruction_term = F.mse_loss(recon, x, reduction="sum")
        log_var = 2 * log_std
        kl_per_element = -0.5 * (1 + log_var - mu.pow(2) - torch.exp(log_var))
        kl_term = kl_per_element.sum()
        return reconstruction_term + kl_term


if __name__ == '__main__':
    # Train a CVAE on the MNIST training split, periodically saving a grid of
    # reconstructions, then save one raw input batch and the model weights.
    epochs = 100
    batch_size = 100

    # Pre-declared so the names exist after the loops for the save calls below.
    recon = None
    img = None

    utils.make_dir("./img/cvae")
    utils.make_dir("./model_weights/cvae")

    train_data = torchvision.datasets.MNIST(
        root='./mnist',
        train=True,
        transform=torchvision.transforms.ToTensor(),
        download=True
    )

    data_loader = DataLoader(train_data, batch_size=batch_size, shuffle=True)
    num_batches = len(data_loader)

    cvae = CVAE(feature_size=784, class_size=10, latent_size=10)

    optimizer = torch.optim.Adam(cvae.parameters(), lr=1e-3)

    for epoch in range(epochs):
        train_loss = 0
        for batch_id, (img, label) in enumerate(data_loader):
            # Flatten every image to one row so it matches feature_size.
            inputs = img.reshape(img.shape[0], -1)
            y = utils.to_one_hot(label.reshape(-1, 1), num_class=10)
            recon, mu, log_std = cvae(inputs, y)
            loss = cvae.loss_function(recon, inputs, mu, log_std)

            optimizer.zero_grad()
            loss.backward()
            optimizer.step()

            train_loss += loss.item()

            if batch_id % 100 == 0:
                print("Epoch[{}/{}], Batch[{}/{}], batch_loss:{:.6f}".format(
                    epoch+1, epochs, batch_id+1, num_batches, loss.item()))

        print("======>epoch:{},\t epoch_average_batch_loss:{:.6f}============".format(
            epoch+1, train_loss/num_batches), "\n")

        # Every 10th epoch, save the reconstructions of the epoch's last batch.
        if epoch % 10 == 0:
            imgs = utils.to_img(recon.detach())
            path = "./img/cvae/epoch{}.png".format(epoch+1)
            torchvision.utils.save_image(imgs, path, nrow=10)
            print("save:", path, "\n")

    # Save the raw inputs of the very last training batch for comparison.
    raw_path = "./img/cvae/raw.png"
    torchvision.utils.save_image(img, raw_path, nrow=10)
    print("save raw image:" + raw_path, "\n")

    # Save the trained weights.
    utils.save_model(cvae, "./model_weights/cvae/cvae_weights.pth")

　　utils.py（上面訓練程式以 `import utils` 匯入的輔助函式）

import torch
import torch.nn as nn
import os
import torch.nn.functional as F


def to_img(x):
    """Turn a batch of flattened images into a ``(batch, 1, 28, 28)`` tensor.

    Values are first limited to the range [0, 1]; each row of ``x`` must
    therefore hold exactly 28 * 28 elements.
    """
    batch = x.shape[0]
    return torch.clamp(x, 0, 1).reshape(batch, 1, 28, 28)


def to_one_hot(labels: torch.Tensor, num_class: int):
    """Build a one-hot (or multi-hot) float matrix from integer labels.

    Args:
        labels: tensor whose first dimension indexes samples, e.g. shape
            ``(N,)`` or ``(N, 1)``. Every value in row ``i`` marks a column
            of output row ``i``.
        num_class: number of columns in the result.

    Returns:
        A CPU ``float32`` tensor of shape ``(N, num_class)`` holding 1 at the
        labelled positions and 0 elsewhere.

    Raises:
        IndexError: if a label lies outside the valid column range.
    """
    n = labels.shape[0]
    y = torch.zeros(n, num_class)
    if labels.numel() == 0:
        # Nothing to mark; also avoids an ambiguous reshape(0, -1).
        return y
    # One indexed assignment instead of a Python loop over the samples.
    cols = labels.reshape(n, -1).to(device=y.device, dtype=torch.long)
    rows = torch.arange(n).unsqueeze(1)  # (N, 1), broadcasts against cols
    y[rows, cols] = 1
    return y


def save_model(model: nn.Module, path):
    """Write the model's ``state_dict`` to ``path`` and print a confirmation."""
    weights = model.state_dict()
    torch.save(weights, path)
    print("save model..........")


def load_model(model: nn.Module, path):
    """Load a ``state_dict`` stored at ``path`` into ``model`` in place.

    Args:
        model: module whose parameters and buffers are overwritten.
        path: file previously written with ``torch.save(model.state_dict(), ...)``.

    Raises:
        RuntimeError: from ``load_state_dict`` if the stored keys or shapes
            do not match ``model``.
    """
    # Deserialize onto CPU so a checkpoint written from a GPU still loads on
    # a CPU-only host; load_state_dict then copies the values into the
    # model's own tensors, whatever device they live on.
    state_dict = torch.load(path, map_location="cpu")
    model.load_state_dict(state_dict)
    print("load model..........")


def make_dir(path):
    """Create directory ``path`` (and missing parents) if it does not exist.

    Raises:
        FileExistsError: if ``path`` exists but is not a directory.
    """
    # exist_ok avoids the check-then-create race of a separate exists() test.
    os.makedirs(path, exist_ok=True)

　幾個結果

第一輪

11輪

21輪

31輪

41輪

51輪

61輪

71輪

81輪

最後

#MNIST資料集上條件變分自編碼器#程式碼

import torch from torch import nn import torch.nn.functional as F import torchvision from torch.utils.data import DataLoader

[tensorflow2.0]採用自定義層和模型在minist資料集上實現VAE(變分自編碼器)

技術標籤：tensorflow、python 使用keras的API進行搭建 from tensorflow.keras import layers

基於圖嵌入的高斯混合變分自編碼器的深度聚類(Deep Clustering by Gaussian Mixture Variational Autoencoders with Graph Embedding, DGG)

基於圖嵌入的高斯混合變分自編碼器的深度聚類 Deep Clustering by Gaussian Mixture Variational Autoencoders with Graph Embedding, DGG

pytorch-自編碼器與變分自編碼器-有損影象壓縮

筆記摘抄 import torch from torch import nn, optim from torch.utils.data import DataLoader from torchvision import transforms, datasets

VAE(變分自編碼器的torch實現) —— jupyter實現(注意tqdm模組不同)

簡單實現了torch版本的變分自編碼器參考大佬TensorFlow版本的VAE：膜拜大佬 import os

使用 PyTorch 實現 MLP 並在 MNIST 資料集上驗證方式

簡介這是深度學習課程的第一個實驗，主要目的就是熟悉 Pytorch 框架。MLP 是多層感知器，我這次實現的是四層感知器，程式碼和思路參考了網上的很多文章。個人認為，感知器的程式碼大同小異，尤其是用 Pytorch 實現，

變分自動編碼器

變分自動編碼器 Diederik Kingma和Max Welling於2013年推出了自動編碼器的另一個重要類別，並迅速成為最受歡迎的自動編碼器型別之一：變分自動編碼器

Pytorch 神經網路—自定義資料集上實現教程

第一步、匯入需要的包 import os import scipy.io as sio import numpy as np import torch import torch.nn as nn

如何在自定義資料集上訓練YOLOv5

作者|Jacob Solawetz, Joseph Nelson 編譯|Flin 來源|blog YOLO系列的目標檢測模型隨著YOLOv5的引入變得越來越強大。在這篇文章中，我們將介紹如何訓練YOLOv5為你的定製用例識別定製物件。

【北京大學】9 TensorFlow1.x的實現自定義Mnist資料集

技術標籤：機器學習Pythonpythontensorflowmnist資料集目錄 1 實現把任意圖片放進訓練好的網路進行測試2 實現製作資料2.1 簡介2.2 生成tfrecords檔案2.3 解析tfrecords檔案2.4 生成自定義資料的完整程式碼mni

pytorch GAN偽造手寫體mnist資料集方式

一，mnist資料集形如上圖的數字手寫體就是mnist資料集。二，GAN原理(生成對抗網路)

pytorch:實現簡單的GAN示例(MNIST資料集)

我就廢話不多說了，直接上程式碼吧！ # -*- coding: utf-8 -*- \"\"\" Created on Sat Oct 13 10:22:45 2018

Pytorch使用MNIST資料集實現CGAN和生成指定的數字方式

CGAN的全拼是Conditional Generative Adversarial Networks，條件生成對抗網路，在初始GAN的基礎上增加了圖片的相應資訊。

MNIST資料集轉化為二維圖片的實現示例

本文介紹了MNIST資料集轉化為二維圖片的實現示例，分享給大家，具體如下：

關於Pytorch的MNIST資料集的預處理詳解

關於Pytorch的MNIST資料集的預處理詳解 MNIST的準確率達到99.7% 用於MNIST的卷積神經網路（CNN）的實現，具有各種技術，例如資料增強，丟失，偽隨機化等。

Pytorch使用MNIST資料集實現基礎GAN和DCGAN詳解

原始生成對抗網路Generative Adversarial Networks GAN包含生成器Generator和判別器Discriminator，資料有真實資料groundtruth，還有需要網路生成的“fake”資料，目的是網路生成的fake資料可以“騙過”判別器，讓判

pytorch實現mnist資料集的影象視覺化及儲存

如何將pytorch中mnist資料集的影象視覺化及儲存匯出一些庫 import torch import torchvision

使用tensorflow實現VGG網路,訓練mnist資料集方式

VGG作為流行的幾個模型之一,訓練圖形資料效果不錯，在mnist資料集是常用的入門集資料，VGG層數非常多，如果嚴格按照規範來實現，並用來訓練mnist資料集，會出現各種問題，如，經過16層卷積後，28*28*1的圖片幾乎無法

tensorflow實現殘差網路方式(mnist資料集)

介紹殘差網路是何凱明大神的神作，效果非常好，深度可以達到1000層。但是，其實現起來並沒有那末難，在這裡以tensorflow作為框架，實現基於mnist資料集上的殘差網路，當然只是比較淺層的。

基於Tensorflow讀取MNIST資料集時網路超時的解決方式

最近在學習TensorFlow，比較煩人的是使用tensorflow.examples.tutorials.mnist.input_data讀取資料

#MNIST資料集上條件變分自編碼器#程式碼

相關推薦