目录
- 一、Generative Adversarial Nets
  - 1. GAN简介
  - 2. GAN训练过程
- 二、Deep Convolutional GANs (DCGAN)
  - 1. DCGAN 网络结构
  - 2. DCGAN caffe prototxt
  - 3. 生成结果
一、Generative Adversarial Nets
1. GAN简介
对抗生成网络(GAN)同时训练两个模型:刻画数据分布的生成模型(generative model G)和能够判别数据是生成的还是真实的判别模型(discriminative model D)。训练过程使得 G 生成的数据尽可能真实,同时又使得 D 尽可能能够区分生成的数据和真实的数据;最终 G 生成的数据足以以假乱真,而 D 对任意输入判为真实数据的概率均为 0.5。参考论文:Goodfellow 等人(Bengio 实验室)的 Generative Adversarial Networks。
2. GAN训练过程
注意:这里的 loss 在更新 D 时沿梯度上升方向;在 caffe 具体实现时,为了使 D 模型按梯度下降方向更新,loss 等价地改写为:$loss = -\left[\log D(x^{(i)}) + \log\left(1 - D(G(z^{(i)}))\right)\right]$。
二、Deep Convolutional GANs (DCGAN)
1. DCGAN 网络结构
DCGAN 用卷积神经网络(CNN)代替 GAN 中的多层感知器(MLP)来实现 D 和 G,生成图片效果显著提升。参考论文:Unsupervised Representation Learning with Deep Convolutional Generative Adversarial Networks。
- DCGAN网络结构图
- DCGAN结构内容
2. DCGAN caffe prototxt
1.train.prototxt
# Create on: 2016/10/22 ShanghaiTech
# Author: Yingying Zhang
# NOTE(review): every numeric field value in this prototxt was stripped when
# the post was extracted, which makes the file unparseable by Caffe. The
# values below are the standard DCGAN settings for 64x64 face images
# (Radford et al. 2015) — TODO confirm each against the original source.
name: "gan_newface"
# Real-image input: reads the face images listed in data/face_data.txt and
# normalizes pixels to [-1, 1], matching the generator's TanH output range.
layer {
  name: "images"
  type: "ImageData"
  top: "face_images"
  top: "label"
  include {
    phase: TRAIN
  }
  transform_param {
    mirror: true
    # (x - 127.5) * 0.0078431 ~= (x - 127.5) / 127.5  ->  [-1, 1]
    mean_value: 127.5
    mean_value: 127.5
    mean_value: 127.5
    scale: 0.0078431
  }
  image_data_param {
    source: "data/face_data.txt"
    root_folder: "data/"
    batch_size: 64   # must match rand_vec batch_size below
    new_height: 64
    new_width: 64
    is_color: true
    shuffle: true
  }
}
# Noise input for the generator: a batch of random vectors z drawn from a
# uniform distribution (custom RandVec layer, not stock Caffe).
layer {
  name: "rand_vec"
  type: "RandVec"
  top: "rand_vec"
  rand_vec_param {
    batch_size: 64   # must match the ImageData batch_size
    dim: 100         # DCGAN samples z from a 100-dim uniform distribution
    lower: -1        # original showed "lower: -", i.e. a negative bound
    upper: 1
    repeat: 1        # presumably iterations to reuse the same z — TODO confirm
  }
}
# The ImageData layer always emits a "label" top, but the GAN loss never
# consumes it; Silence absorbs the blob so Caffe does not complain about an
# unused top.
layer {
name: "silence"
type: "Silence"
bottom: "label"
}
#----------- generative -----------
# G stage 1: project z (100-d) to a 4x4x1024 feature map, then BN + Scale
# + ReLU. gen_mode is a custom flag marking layers whose weights are only
# updated on the generator's training turn.
# NOTE(review): numeric values were lost in extraction; these are the
# standard DCGAN settings — TODO confirm.
layer {
  name: "ip1"
  type: "InnerProduct"
  bottom: "rand_vec"
  top: "ip1"
  param {
    name: "ip_w_g"
    lr_mult: 1
  }
  param {
    name: "ip_b_g"
    lr_mult: 2   # common Caffe convention: bias learns at 2x — TODO confirm
  }
  inner_product_param{
    num_output: 16384   # 1024 * 4 * 4
    gen_mode: true
    weight_filler {
      type: "gaussian"
      std: 0.02         # DCGAN init: N(0, 0.02)
    }
    bias_filler {
      type: "constant"
      value: 0
    }
  }
}
# Reshape the flat projection into a 4x4 spatial map with 1024 channels.
layer {
  name: "ip1_reshape"
  type: "Reshape"
  bottom: "ip1"
  top: "ip1_reshape"
  reshape_param {
    shape {
      dim: 0      # 0 = keep the batch dimension
      dim: 1024
      dim: 4
      dim: 4
    }
  }
}
layer {
  name: "batch_norm_g1"
  type: "BatchNorm"
  bottom: "ip1_reshape"
  top: "ip1_reshape"
  # BatchNorm's three blobs (mean, variance, moving-average factor) are
  # accumulated statistics, not learned parameters: freeze them.
  param {
    lr_mult: 0
    decay_mult: 0
  }
  param {
    lr_mult: 0
    decay_mult: 0
  }
  param {
    lr_mult: 0
    decay_mult: 0
  }
  batch_norm_param {
    use_global_stats: false   # use per-batch statistics during training
  }
}
# Learned affine (gamma/beta) that Caffe's BatchNorm does not include.
layer {
  name: "scale_batch_g1"
  type: "Scale"
  bottom: "ip1_reshape"
  top: "ip1_reshape"
  param {
    name: "gen_s1"
    lr_mult: 1
    decay_mult: 0
  }
  param {
    name: "gen_b1"
    lr_mult: 1
    decay_mult: 0
  }
  scale_param {
    bias_term: true
    gen_mode: true
  }
}
layer {
  name: "relu_g1"
  type: "ReLU"
  bottom: "ip1_reshape"
  top: "ip1_reshape"
}
# G stage 2: fractionally-strided convolution 4x4x1024 -> 8x8x512,
# then BN + Scale + ReLU. kernel 4 / stride 2 / pad 1 doubles the spatial
# size. NOTE(review): values restored from the standard DCGAN recipe —
# TODO confirm against the original.
layer {
  name: "gen_conv2"
  type: "Deconvolution"
  bottom: "ip1_reshape"
  top: "gen_conv2"
  param {
    name: "gen_w_2"
    lr_mult: 1
  }
  param {
    name: "gen_b_2"
    lr_mult: 2
  }
  convolution_param {
    num_output: 512
    pad: 1
    kernel_size: 4
    stride: 2
    gen_mode: true
    # shape_offset is a custom field (H/W output correction) — TODO confirm
    shape_offset: [0, 0]
    weight_filler {
      type: "gaussian"
      std: 0.02
    }
    bias_filler {
      type: "constant"
      value: 0
    }
  }
}
layer {
  name: "batch_norm_g2"
  type: "BatchNorm"
  bottom: "gen_conv2"
  top: "gen_conv2"
  # statistics blobs are not learned: freeze all three
  param {
    lr_mult: 0
    decay_mult: 0
  }
  param {
    lr_mult: 0
    decay_mult: 0
  }
  param {
    lr_mult: 0
    decay_mult: 0
  }
  batch_norm_param {
    use_global_stats: false
  }
}
layer {
  name: "scale_batch_g2"
  type: "Scale"
  bottom: "gen_conv2"
  top: "gen_conv2"
  param {
    name: "gen_s2"
    lr_mult: 1
    decay_mult: 0
  }
  param {
    name: "gen_b2"
    lr_mult: 1
    decay_mult: 0
  }
  scale_param {
    gen_mode: true
    bias_term: true
  }
}
layer {
  name: "relu_g2"
  type: "ReLU"
  bottom: "gen_conv2"
  top: "gen_conv2"
}
# G stage 3: 8x8x512 -> 16x16x256, then BN + Scale + ReLU.
# NOTE(review): values restored from the standard DCGAN recipe — TODO confirm.
layer {
  name: "gen_conv3"
  type: "Deconvolution"
  bottom: "gen_conv2"
  top: "gen_conv3"
  param {
    name: "gen_w_3"
    lr_mult: 1
  }
  param {
    name: "gen_b_3"
    lr_mult: 2
  }
  convolution_param {
    num_output: 256
    pad: 1
    kernel_size: 4
    stride: 2
    gen_mode: true
    shape_offset: [0, 0]   # custom output-shape correction — TODO confirm
    weight_filler {
      type: "gaussian"
      std: 0.02
    }
    bias_filler {
      type: "constant"
      value: 0
    }
  }
}
layer {
  name: "batch_norm_g3"
  type: "BatchNorm"
  bottom: "gen_conv3"
  top: "gen_conv3"
  # statistics blobs are not learned: freeze all three
  param {
    lr_mult: 0
    decay_mult: 0
  }
  param {
    lr_mult: 0
    decay_mult: 0
  }
  param {
    lr_mult: 0
    decay_mult: 0
  }
  batch_norm_param {
    use_global_stats: false
  }
}
layer {
  name: "scale_batch_g3"
  type: "Scale"
  bottom: "gen_conv3"
  top: "gen_conv3"
  param {
    name: "gen_s3"
    lr_mult: 1
    decay_mult: 0
  }
  param {
    name: "gen_b3"
    lr_mult: 1
    decay_mult: 0
  }
  scale_param {
    gen_mode: true
    bias_term: true
  }
}
layer {
  name: "relu_g3"
  type: "ReLU"
  bottom: "gen_conv3"
  top: "gen_conv3"
}
# G stage 4: 16x16x256 -> 32x32x128, then BN + Scale + ReLU.
# NOTE(review): values restored from the standard DCGAN recipe — TODO confirm.
layer {
  name: "gen_conv4"
  type: "Deconvolution"
  bottom: "gen_conv3"
  top: "gen_conv4"
  param {
    name: "gen_w_4"
    lr_mult: 1
  }
  param {
    name: "gen_b_4"
    lr_mult: 2
  }
  convolution_param {
    num_output: 128
    pad: 1
    kernel_size: 4
    stride: 2
    gen_mode: true
    shape_offset: [0, 0]   # custom output-shape correction — TODO confirm
    weight_filler {
      type: "gaussian"
      std: 0.02
    }
    bias_filler {
      type: "constant"
      value: 0
    }
  }
}
layer {
  name: "batch_norm_g4"
  type: "BatchNorm"
  bottom: "gen_conv4"
  top: "gen_conv4"
  # statistics blobs are not learned: freeze all three
  param {
    lr_mult: 0
    decay_mult: 0
  }
  param {
    lr_mult: 0
    decay_mult: 0
  }
  param {
    lr_mult: 0
    decay_mult: 0
  }
  batch_norm_param {
    use_global_stats: false
  }
}
layer {
  name: "scale_batch_g4"
  type: "Scale"
  bottom: "gen_conv4"
  top: "gen_conv4"
  param {
    name: "gen_s4"
    lr_mult: 1
    decay_mult: 0
  }
  param {
    name: "gen_b4"
    lr_mult: 1
    decay_mult: 0
  }
  scale_param {
    gen_mode: true
    bias_term: true
  }
}
layer {
  name: "relu_g4"
  type: "ReLU"
  bottom: "gen_conv4"
  top: "gen_conv4"
}
# G output stage: 32x32x128 -> 64x64x3 RGB image. TanH squashes the output
# to [-1, 1], matching the normalization applied to the real images. DCGAN
# uses no BatchNorm on the generator's output layer.
# NOTE(review): values restored from the standard DCGAN recipe — TODO confirm.
layer {
  name: "gen_conv5"
  type: "Deconvolution"
  bottom: "gen_conv4"
  top: "gen_conv5"
  param {
    name: "gen_w_5"
    lr_mult: 1
  }
  param {
    name: "gen_b_5"
    lr_mult: 2
  }
  convolution_param {
    num_output: 3   # RGB, consistent with is_color: true in the data layer
    pad: 1
    kernel_size: 4
    stride: 2
    gen_mode: true
    shape_offset: [0, 0]   # custom output-shape correction — TODO confirm
    weight_filler {
      type: "gaussian"
      std: 0.02
    }
    bias_filler {
      type: "constant"
      value: 0
    }
  }
}
layer {
  name: "tanh_g5"
  type: "TanH"
  bottom: "gen_conv5"
  top: "gen_conv5"
}
#----------- gan gate ------------
# Custom layer: selects the discriminator's input between the real images
# ("face_images") and the generated images ("gen_conv5"), so a single D
# network serves both alternating training phases.
# NOTE(review): the exact switching rule lives in the custom GANGate C++
# implementation, which is not visible here — presumably it alternates with
# the dis_iter/gen_iter schedule of the GANDGLoss layer.
layer {
name: "gan_gate"
type: "GANGate"
bottom: "face_images"
bottom: "gen_conv5"
top: "dis_input"
}
#----------- discrimitive -----------
# D stage 1: strided conv 64x64x3 -> 32x32x128, BN + Scale + LeakyReLU.
# dis_mode is the custom flag marking layers updated on D's training turn.
# NOTE(review): numeric values were lost in extraction; these are the
# standard DCGAN settings — TODO confirm.
layer {
  name: "dis_conv_d1"
  type: "Convolution"
  bottom: "dis_input"
  top: "dis_conv_d1"
  param {
    name: "dis_w_1"
    lr_mult: 1
  }
  param {
    name: "dis_b_1"
    lr_mult: 2
  }
  convolution_param {
    num_output: 128
    pad: 1
    kernel_size: 4
    stride: 2
    dis_mode: true
    weight_filler {
      type: "gaussian"
      std: 0.02
    }
    bias_filler {
      type: "constant"
      value: 0
    }
  }
}
layer {
  name: "batch_norm_d1"
  type: "BatchNorm"
  bottom: "dis_conv_d1"
  top: "dis_conv_d1"
  # statistics blobs are not learned: freeze all three
  param {
    lr_mult: 0
    decay_mult: 0
  }
  param {
    lr_mult: 0
    decay_mult: 0
  }
  param {
    lr_mult: 0
    decay_mult: 0
  }
  batch_norm_param {
    use_global_stats: false
  }
}
layer {
  name: "scale_batch_d1"
  type: "Scale"
  bottom: "dis_conv_d1"
  top: "dis_conv_d1"
  param {
    name: "dis_s1"
    lr_mult: 1
    decay_mult: 0
  }
  param {
    name: "dis_b1"
    lr_mult: 1
    decay_mult: 0
  }
  scale_param {
    dis_mode: true
    bias_term: true
  }
}
# DCGAN uses LeakyReLU (slope 0.2) throughout the discriminator.
layer {
  name: "relu_d1"
  type: "ReLU"
  bottom: "dis_conv_d1"
  top: "dis_conv_d1"
  relu_param {
    negative_slope: 0.2
  }
}
# D stage 2: 32x32x128 -> 16x16x256, BN + Scale + LeakyReLU(0.2).
# NOTE(review): values restored from the standard DCGAN recipe — TODO confirm.
layer {
  name: "dis_conv_d2"
  type: "Convolution"
  bottom: "dis_conv_d1"
  top: "dis_conv_d2"
  param {
    name: "dis_w_2"
    lr_mult: 1
  }
  param {
    name: "dis_b_2"
    lr_mult: 2
  }
  convolution_param {
    num_output: 256
    pad: 1
    kernel_size: 4
    stride: 2
    dis_mode: true
    weight_filler {
      type: "gaussian"
      std: 0.02
    }
    bias_filler {
      type: "constant"
      value: 0
    }
  }
}
layer {
  name: "batch_norm_d2"
  type: "BatchNorm"
  bottom: "dis_conv_d2"
  top: "dis_conv_d2"
  # statistics blobs are not learned: freeze all three
  param {
    lr_mult: 0
    decay_mult: 0
  }
  param {
    lr_mult: 0
    decay_mult: 0
  }
  param {
    lr_mult: 0
    decay_mult: 0
  }
  batch_norm_param {
    use_global_stats: false
  }
}
layer {
  name: "scale_batch_d2"
  type: "Scale"
  bottom: "dis_conv_d2"
  top: "dis_conv_d2"
  param {
    name: "dis_s2"
    lr_mult: 1
    decay_mult: 0
  }
  param {
    name: "dis_b2"
    lr_mult: 1
    decay_mult: 0
  }
  scale_param {
    dis_mode: true
    bias_term: true
  }
}
layer {
  name: "relu_d2"
  type: "ReLU"
  bottom: "dis_conv_d2"
  top: "dis_conv_d2"
  relu_param {
    negative_slope: 0.2
  }
}
# D stage 3: 16x16x256 -> 8x8x512, BN + Scale + LeakyReLU(0.2).
# NOTE(review): values restored from the standard DCGAN recipe — TODO confirm.
layer {
  name: "dis_conv_d3"
  type: "Convolution"
  bottom: "dis_conv_d2"
  top: "dis_conv_d3"
  param {
    name: "dis_w_3"
    lr_mult: 1
  }
  param {
    name: "dis_b_3"
    lr_mult: 2
  }
  convolution_param {
    num_output: 512
    pad: 1
    kernel_size: 4
    stride: 2
    dis_mode: true
    weight_filler {
      type: "gaussian"
      std: 0.02
    }
    bias_filler {
      type: "constant"
      value: 0
    }
  }
}
layer {
  name: "batch_norm_d3"
  type: "BatchNorm"
  bottom: "dis_conv_d3"
  top: "dis_conv_d3"
  # statistics blobs are not learned: freeze all three
  param {
    lr_mult: 0
    decay_mult: 0
  }
  param {
    lr_mult: 0
    decay_mult: 0
  }
  param {
    lr_mult: 0
    decay_mult: 0
  }
  batch_norm_param {
    use_global_stats: false
  }
}
layer {
  name: "scale_batch_d3"
  type: "Scale"
  bottom: "dis_conv_d3"
  top: "dis_conv_d3"
  param {
    name: "dis_s3"
    lr_mult: 1
    decay_mult: 0
  }
  param {
    name: "dis_b3"
    lr_mult: 1
    decay_mult: 0
  }
  scale_param {
    dis_mode: true
    bias_term: true
  }
}
layer {
  name: "relu_d3"
  type: "ReLU"
  bottom: "dis_conv_d3"
  top: "dis_conv_d3"
  relu_param {
    negative_slope: 0.2
  }
}
# D stage 4: 8x8x512 -> 4x4x1024, BN + Scale + LeakyReLU(0.2).
# NOTE(review): values restored from the standard DCGAN recipe — TODO confirm.
layer {
  name: "dis_conv_d4"
  type: "Convolution"
  bottom: "dis_conv_d3"
  top: "dis_conv_d4"
  param {
    name: "dis_w_4"
    lr_mult: 1
  }
  param {
    name: "dis_b_4"
    lr_mult: 2
  }
  convolution_param {
    num_output: 1024
    pad: 1
    kernel_size: 4
    stride: 2
    dis_mode: true
    weight_filler {
      type: "gaussian"
      std: 0.02
    }
    bias_filler {
      type: "constant"
      value: 0
    }
  }
}
layer {
  name: "batch_norm_d4"
  type: "BatchNorm"
  bottom: "dis_conv_d4"
  top: "dis_conv_d4"
  # statistics blobs are not learned: freeze all three
  param {
    lr_mult: 0
    decay_mult: 0
  }
  param {
    lr_mult: 0
    decay_mult: 0
  }
  param {
    lr_mult: 0
    decay_mult: 0
  }
  batch_norm_param {
    use_global_stats: false
  }
}
layer {
  name: "scale_batch_d4"
  type: "Scale"
  bottom: "dis_conv_d4"
  top: "dis_conv_d4"
  param {
    name: "dis_s4"
    lr_mult: 1
    decay_mult: 0
  }
  param {
    name: "dis_b4"
    lr_mult: 1
    decay_mult: 0
  }
  scale_param {
    dis_mode: true
    bias_term: true
  }
}
layer {
  name: "relu_d4"
  type: "ReLU"
  bottom: "dis_conv_d4"
  top: "dis_conv_d4"
  relu_param {
    negative_slope: 0.2
  }
}
# D head: flatten 4x4x1024 to a single logit, squash with Sigmoid to get
# D(x) in (0, 1), then feed the custom alternating GAN loss.
# NOTE(review): numeric values were lost in extraction — TODO confirm.
layer {
  name: "score"
  type: "InnerProduct"
  bottom: "dis_conv_d4"
  top: "score"
  param {
    name: "score_w"
    lr_mult: 1
  }
  param {
    name: "score_b"
    lr_mult: 2
  }
  inner_product_param{
    num_output: 1   # single real/fake probability per sample
    dis_mode: true
    weight_filler {
      type: "gaussian"
      std: 0.02
    }
    bias_filler {
      type: "constant"
      value: 0
    }
  }
}
layer {
  name: "sigmoid"
  type: "Sigmoid"
  bottom: "score"
  top: "score"
}
# Custom loss implementing the alternating D/G objective described above:
# loss = -[log D(x) + log(1 - D(G(z)))] for D's turn, and the G objective
# on G's turn. dis_iter/gen_iter set how many iterations each side trains
# before switching.
layer {
  name: "gan_loss"
  type: "GANDGLoss"
  bottom: "score"
  top: "gan_loss"
  gan_loss_param {
    dis_iter: 1   # 1:1 alternation, as in the GAN paper — TODO confirm
    gen_iter: 1
  }
}
2.solver.prototxt
# Create on: 2016/10/22 ShanghaiTech
# Author: Yingying Zhang
# NOTE(review): numeric values were lost in extraction; restored to the
# DCGAN paper's recommended Adam settings — TODO confirm.
net: "gan_configs/train.prototxt"
debug_info: false
display: 100
solver_type: ADAM
average_loss: 100
base_lr: 0.0002    # DCGAN: Adam learning rate 0.0002
lr_policy: "fixed"
max_iter: 100000
momentum: 0.5      # DCGAN: Adam beta1 = 0.5 (0.9 was found unstable)
snapshot: 5000
gan_solver: true   # custom flag enabling the alternating D/G update schedule
snapshot_prefix: "models/gan_"
3.生成结果
未完待续!!!第二部分为caffe具体源码!