From 63d5df08ccaa37fd9d1fb390f32823f41b505e6c Mon Sep 17 00:00:00 2001
From: "Kwang Myung, Jeon" <lordet01@gmail.com>
Date: Sun, 23 Apr 2017 02:28:49 +0900
Subject: [PATCH 1/2] Compatible with Tensorflow 1.1.0rc1 + Python 3.5.2

---
 README.md         |    7 +-
 clean_wav.sh      |    2 +-
 generator.py      |    6 +-
 main.py           |    2 +-
 make_tfrecords.py |    2 +-
 model.py          | 1529 +++++++++++++++++++++++----------------------
 ops.py            |   22 +-
 requirements.txt  |    2 +-
 test_all.sh       |   19 +
 9 files changed, 809 insertions(+), 782 deletions(-)
 create mode 100644 test_all.sh

diff --git a/README.md b/README.md
index 3d57c58..5a3d5cd 100644
--- a/README.md
+++ b/README.md
@@ -15,11 +15,16 @@ This model deals with raw speech waveforms on many noise conditions at different
 * [improved-gan](https://github.com/openai/improved-gan): implementing improvements to train GANs in a more stable way
 *  [DCGAN-tensorflow](https://github.com/carpedm20/DCGAN-tensorflow): implementation of the DCGAN in tensorflow
 
-### Dependencies
+### Dependencies-Original
 
 * Python 2.7
 * TensorFlow 0.12
 
+### Dependencies-Forked by kmjeon, 2017-04-23
+
+* Python 3.5.2
+* TensorFlow 1.1.0rc1
+
 You can install the requirements either to your virtualenv or the system via pip with:
 
 ```
diff --git a/clean_wav.sh b/clean_wav.sh
index c04cfcb..ef5c786 100755
--- a/clean_wav.sh
+++ b/clean_wav.sh
@@ -20,5 +20,5 @@ echo "SAVE PATH: $SAVE_PATH"
 mkdir -p $SAVE_PATH
 
 CUDA_VISIBLE_DEVICES="" python main.py --init_noise_std 0. --save_path segan_v1 \
-                        --batch_size 100 --g_nl prelu --weights SEGAN-41800 \
+                        --batch_size 100 --g_nl prelu --weights SEGAN-72900 \
                         --test_wav $NOISY_WAVNAME --save_clean_path $SAVE_PATH
diff --git a/generator.py b/generator.py
index 5b8af4f..d2f325e 100644
--- a/generator.py
+++ b/generator.py
@@ -50,7 +50,7 @@ def make_z(shape, mean=0., std=1., name='z'):
         kwidth = 3
         z = make_z([segan.batch_size, h_i.get_shape().as_list()[1],
                     segan.g_enc_depths[-1]])
-        h_i = tf.concat(2, [h_i, z])
+        h_i = tf.concat([h_i, z], 2)
         skip_out = True
         skips = []
         for block_idx, dilation in enumerate(segan.g_dilated_blocks):
@@ -182,7 +182,7 @@ def make_z(shape, mean=0., std=1., name='z'):
                 # random code is fused with intermediate representation
                 z = make_z([segan.batch_size, h_i.get_shape().as_list()[1],
                             segan.g_enc_depths[-1]])
-                h_i = tf.concat(2, [z, h_i])
+                h_i = tf.concat([z, h_i], 2)
 
             #SECOND DECODER (reverse order)
             g_dec_depths = segan.g_enc_depths[:-1][::-1] + [1]
@@ -219,7 +219,7 @@ def make_z(shape, mean=0., std=1., name='z'):
                     if is_ref:
                         print('Fusing skip connection of '
                               'shape {}'.format(skip_.get_shape()))
-                    h_i = tf.concat(2, [h_i, skip_])
+                    h_i = tf.concat([h_i, skip_], 2)
 
                 else:
                     if is_ref:
diff --git a/main.py b/main.py
index 3350e57..ef96d9e 100644
--- a/main.py
+++ b/main.py
@@ -94,7 +94,7 @@ def main(_):
             print('test wave min:{}  max:{}'.format(np.min(wave), np.max(wave)))
             c_wave = se_model.clean(wave)
             print('c wave min:{}  max:{}'.format(np.min(c_wave), np.max(c_wave)))
-            wavfile.write(os.path.join(FLAGS.save_clean_path, wavname), 16e3, c_wave)
+            wavfile.write(os.path.join(FLAGS.save_clean_path, wavname), 16000, c_wave)
             print('Done cleaning {} and saved '
                   'to {}'.format(FLAGS.test_wav,
                                  os.path.join(FLAGS.save_clean_path, wavname)))
diff --git a/make_tfrecords.py b/make_tfrecords.py
index bc1f821..b0a8c01 100644
--- a/make_tfrecords.py
+++ b/make_tfrecords.py
@@ -89,7 +89,7 @@ def main(opts):
         beg_enc_t = timeit.default_timer()
         out_file = tf.python_io.TFRecordWriter(out_filepath)
         # process the acoustic and textual data now
-        for dset_i, (dset, dset_desc) in enumerate(cfg_desc.iteritems()):
+        for dset_i, (dset, dset_desc) in enumerate(cfg_desc.items()):
             print('-' * 50)
             wav_dir = dset_desc['clean']
             wav_files = [os.path.join(wav_dir, wav) for wav in
diff --git a/model.py b/model.py
index e5a6e66..8ef47de 100644
--- a/model.py
+++ b/model.py
@@ -1,763 +1,766 @@
-from __future__ import print_function
-import tensorflow as tf
-from tensorflow.contrib.layers import batch_norm, fully_connected, flatten
-from tensorflow.contrib.layers import xavier_initializer
-from scipy.io import wavfile
-from generator import *
-from discriminator import *
-import numpy as np
-from data_loader import read_and_decode
-from bnorm import VBN
-from ops import *
-import timeit
-import os
-
-
-class Model(object):
-
-    def __init__(self, name='BaseModel'):
-        self.name = name
-
-    def save(self, save_path, step):
-        model_name = self.name
-        if not os.path.exists(save_path):
-            os.makedirs(save_path)
-        if not hasattr(self, 'saver'):
-            self.saver = tf.train.Saver()
-        self.saver.save(self.sess,
-                        os.path.join(save_path, model_name),
-                        global_step=step)
-
-    def load(self, save_path, model_file=None):
-        if not os.path.exists(save_path):
-            print('[!] Checkpoints path does not exist...')
-            return False
-        print('[*] Reading checkpoints...')
-        if model_file is None:
-            ckpt = tf.train.get_checkpoint_state(save_path)
-            if ckpt and ckpt.model_checkpoint_path:
-                ckpt_name = os.path.basename(ckpt.model_checkpoint_path)
-            else:
-                return False
-        else:
-            ckpt_name = model_file
-        if not hasattr(self, 'saver'):
-            self.saver = tf.train.Saver()
-        self.saver.restore(self.sess, os.path.join(save_path, ckpt_name))
-        print('[*] Read {}'.format(ckpt_name))
-        return True
-
-
-
-class SEGAN(Model):
-    """ Speech Enhancement Generative Adversarial Network """
-    def __init__(self, sess, args, devices, infer=False, name='SEGAN'):
-        super(SEGAN, self).__init__(name)
-        self.args = args
-        self.sess = sess
-        self.keep_prob = 1.
-        if infer:
-            self.keep_prob_var = tf.Variable(self.keep_prob, trainable=False)
-        else:
-            self.keep_prob = 0.5
-            self.keep_prob_var = tf.Variable(self.keep_prob, trainable=False)
-        self.batch_size = args.batch_size
-        self.epoch = args.epoch
-        self.d_label_smooth = args.d_label_smooth
-        self.devices = devices
-        self.z_dim = args.z_dim
-        self.z_depth = args.z_depth
-        # clip D values
-        self.d_clip_weights = False
-        # apply VBN or regular BN?
-        self.disable_vbn = False
-        self.save_path = args.save_path
-        # num of updates to be applied to D before G
-        # this is k in original GAN paper (https://arxiv.org/abs/1406.2661)
-        self.disc_updates = 1
-        # canvas size
-        self.canvas_size = args.canvas_size
-        self.deactivated_noise = False
-        # dilation factors per layer (only in atrous conv G config)
-        self.g_dilated_blocks = [1, 2, 4, 8, 16, 32, 64, 128, 256, 512]
-        # num fmaps for AutoEncoder SEGAN (v1)
-        self.g_enc_depths = [16, 32, 32, 64, 64, 128, 128, 256, 256, 512, 1024]
-        # Define D fmaps
-        self.d_num_fmaps = [16, 32, 32, 64, 64, 128, 128, 256, 256, 512, 1024]
-        self.init_noise_std = args.init_noise_std
-        self.disc_noise_std = tf.Variable(self.init_noise_std, trainable=False)
-        self.disc_noise_std_summ = scalar_summary('disc_noise_std',
-                                                  self.disc_noise_std)
-        self.e2e_dataset = args.e2e_dataset
-        # G's supervised loss weight
-        self.l1_weight = args.init_l1_weight
-        self.l1_lambda = tf.Variable(self.l1_weight, trainable=False)
-        self.deactivated_l1 = False
-        # define the functions
-        self.discriminator = discriminator
-        # register G non linearity
-        self.g_nl = args.g_nl
-        if args.g_type == 'ae':
-            self.generator = AEGenerator(self)
-        elif args.g_type == 'dwave':
-            self.generator = Generator(self)
-        else:
-            raise ValueError('Unrecognized G type {}'.format(args.g_type))
-        self.build_model(args)
-
-    def build_model(self, config):
-        all_d_grads = []
-        all_g_grads = []
-        d_opt = tf.train.RMSPropOptimizer(config.d_learning_rate)
-        g_opt = tf.train.RMSPropOptimizer(config.g_learning_rate)
-        #d_opt = tf.train.AdamOptimizer(config.d_learning_rate,
-        #                               beta1=config.beta_1)
-        #g_opt = tf.train.AdamOptimizer(config.g_learning_rate,
-        #                               beta1=config.beta_1)
-
-        for idx, device in enumerate(self.devices):
-            with tf.device("/%s" % device):
-                with tf.name_scope("device_%s" % idx):
-                    with variables_on_gpu0():
-                        self.build_model_single_gpu(idx)
-                        d_grads = d_opt.compute_gradients(self.d_losses[-1],
-                                                          var_list=self.d_vars)
-                        g_grads = g_opt.compute_gradients(self.g_losses[-1],
-                                                          var_list=self.g_vars)
-                        all_d_grads.append(d_grads)
-                        all_g_grads.append(g_grads)
-                        tf.get_variable_scope().reuse_variables()
-        avg_d_grads = average_gradients(all_d_grads)
-        avg_g_grads = average_gradients(all_g_grads)
-        self.d_opt = d_opt.apply_gradients(avg_d_grads)
-        self.g_opt = g_opt.apply_gradients(avg_g_grads)
-
-
-    def build_model_single_gpu(self, gpu_idx):
-        if gpu_idx == 0:
-            # create the nodes to load for input pipeline
-            filename_queue = tf.train.string_input_producer([self.e2e_dataset])
-            self.get_wav, self.get_noisy = read_and_decode(filename_queue,
-                                                           2 ** 14)
-        # load the data to input pipeline
-        wavbatch, \
-        noisybatch = tf.train.shuffle_batch([self.get_wav,
-                                             self.get_noisy],
-                                             batch_size=self.batch_size,
-                                             num_threads=2,
-                                             capacity=1000 + 3 * self.batch_size,
-                                             min_after_dequeue=1000,
-                                             name='wav_and_noisy')
-        if gpu_idx == 0:
-            self.Gs = []
-            self.zs = []
-            self.gtruth_wavs = []
-            self.gtruth_noisy = []
-
-        self.gtruth_wavs.append(wavbatch)
-        self.gtruth_noisy.append(noisybatch)
-
-        # add channels dimension to manipulate in D and G
-        wavbatch = tf.expand_dims(wavbatch, -1)
-        noisybatch = tf.expand_dims(noisybatch, -1)
-        # by default leaky relu is used
-        do_prelu = False
-        if self.g_nl == 'prelu':
-            do_prelu = True
-        if gpu_idx == 0:
-            #self.sample_wavs = tf.placeholder(tf.float32, [self.batch_size,
-            #                                               self.canvas_size],
-            #                                  name='sample_wavs')
-            ref_Gs = self.generator(noisybatch, is_ref=True,
-                                    spk=None,
-                                    do_prelu=do_prelu)
-            print('num of G returned: ', len(ref_Gs))
-            self.reference_G = ref_Gs[0]
-            self.ref_z = ref_Gs[1]
-            if do_prelu:
-                self.ref_alpha = ref_Gs[2:]
-                self.alpha_summ = []
-                for m, ref_alpha in enumerate(self.ref_alpha):
-                    # add a summary per alpha
-                    self.alpha_summ.append(histogram_summary('alpha_{}'.format(m),
-                                                             ref_alpha))
-            # make a dummy copy of discriminator to have variables and then
-            # be able to set up the variable reuse for all other devices
-            # merge along channels and this would be a real batch
-            dummy_joint = tf.concat(2, [wavbatch, noisybatch])
-            dummy = discriminator(self, dummy_joint,
-                                  reuse=False)
-
-        G, z  = self.generator(noisybatch, is_ref=False, spk=None,
-                               do_prelu=do_prelu)
-        self.Gs.append(G)
-        self.zs.append(z)
-
-        # add new dimension to merge with other pairs
-        D_rl_joint = tf.concat(2, [wavbatch, noisybatch])
-        D_fk_joint = tf.concat(2, [G, noisybatch])
-        # build rl discriminator
-        d_rl_logits = discriminator(self, D_rl_joint, reuse=True)
-        # build fk G discriminator
-        d_fk_logits = discriminator(self, D_fk_joint, reuse=True)
-
-        # make disc variables summaries
-        self.d_rl_sum = histogram_summary("d_real", d_rl_logits)
-        self.d_fk_sum = histogram_summary("d_fake", d_fk_logits)
-        #self.d_nfk_sum = histogram_summary("d_noisyfake", d_nfk_logits)
-
-        self.rl_audio_summ = audio_summary('real_audio', wavbatch)
-        self.real_w_summ = histogram_summary('real_wav', wavbatch)
-        self.noisy_audio_summ = audio_summary('noisy_audio', noisybatch)
-        self.noisy_w_summ = histogram_summary('noisy_wav', noisybatch)
-        self.gen_audio_summ = audio_summary('G_audio', G)
-        self.gen_summ = histogram_summary('G_wav', G)
-
-        if gpu_idx == 0:
-            self.g_losses = []
-            self.g_l1_losses = []
-            self.g_adv_losses = []
-            self.d_rl_losses = []
-            self.d_fk_losses = []
-            #self.d_nfk_losses = []
-            self.d_losses = []
-
-        d_rl_loss = tf.reduce_mean(tf.squared_difference(d_rl_logits, 1.))
-        d_fk_loss = tf.reduce_mean(tf.squared_difference(d_fk_logits, 0.))
-        #d_nfk_loss = tf.reduce_mean(tf.squared_difference(d_nfk_logits, 0.))
-        g_adv_loss = tf.reduce_mean(tf.squared_difference(d_fk_logits, 1.))
-
-        d_loss = d_rl_loss + d_fk_loss
-
-        # Add the L1 loss to G
-        g_l1_loss = self.l1_lambda * tf.reduce_mean(tf.abs(tf.sub(G,
-                                                                  wavbatch)))
-
-        g_loss = g_adv_loss + g_l1_loss
-
-        self.g_l1_losses.append(g_l1_loss)
-        self.g_adv_losses.append(g_adv_loss)
-        self.g_losses.append(g_loss)
-        self.d_rl_losses.append(d_rl_loss)
-        self.d_fk_losses.append(d_fk_loss)
-        #self.d_nfk_losses.append(d_nfk_loss)
-        self.d_losses.append(d_loss)
-
-        self.d_rl_loss_sum = scalar_summary("d_rl_loss", d_rl_loss)
-        self.d_fk_loss_sum = scalar_summary("d_fk_loss",
-                                            d_fk_loss)
-        #self.d_nfk_loss_sum = scalar_summary("d_nfk_loss",
-        #                                     d_nfk_loss)
-        self.g_loss_sum = scalar_summary("g_loss", g_loss)
-        self.g_loss_l1_sum = scalar_summary("g_l1_loss", g_l1_loss)
-        self.g_loss_adv_sum = scalar_summary("g_adv_loss", g_adv_loss)
-        self.d_loss_sum = scalar_summary("d_loss", d_loss)
-
-        if gpu_idx == 0:
-            self.get_vars()
-
-
-    def get_vars(self):
-        t_vars = tf.trainable_variables()
-        self.d_vars_dict = {}
-        self.g_vars_dict = {}
-        for var in t_vars:
-            if var.name.startswith('d_'):
-                self.d_vars_dict[var.name] = var
-            if var.name.startswith('g_'):
-                self.g_vars_dict[var.name] = var
-        self.d_vars = self.d_vars_dict.values()
-        self.g_vars = self.g_vars_dict.values()
-        for x in self.d_vars:
-            assert x not in self.g_vars
-        for x in self.g_vars:
-            assert x not in self.d_vars
-        for x in t_vars:
-            assert x in self.g_vars or x in self.d_vars, x.name
-        self.all_vars = t_vars
-        if self.d_clip_weights:
-            print('Clipping D weights')
-            self.d_clip = [v.assign(tf.clip_by_value(v, -0.05, 0.05)) for v in self.d_vars]
-        else:
-            print('Not clipping D weights')
-
-    def vbn(self, tensor, name):
-        if self.disable_vbn:
-            class Dummy(object):
-                # Do nothing here, no bnorm
-                def __init__(self, tensor, ignored):
-                    self.reference_output=tensor
-                def __call__(self, x):
-                    return x
-            VBN_cls = Dummy
-        else:
-            VBN_cls = VBN
-        if not hasattr(self, name):
-            vbn = VBN_cls(tensor, name)
-            setattr(self, name, vbn)
-            return vbn.reference_output
-        vbn = getattr(self, name)
-        return vbn(tensor)
-
-    def train(self, config, devices):
-        """ Train the SEGAN """
-
-        print('Initializing optimizers...')
-        # init optimizers
-        d_opt = self.d_opt
-        g_opt = self.g_opt
-        num_devices = len(devices)
-
-        try:
-            init = tf.global_variables_initializer()
-        except AttributeError:
-            # fall back to old implementation
-            init = tf.initialize_all_variables()
-
-        print('Initializing variables...')
-        self.sess.run(init)
-        g_summs = [self.d_fk_sum,
-                   #self.d_nfk_sum,
-                   self.d_fk_loss_sum,
-                   #self.d_nfk_loss_sum,
-                   self.g_loss_sum,
-                   self.g_loss_l1_sum,
-                   self.g_loss_adv_sum,
-                   self.gen_summ,
-                   self.gen_audio_summ]
-        # if we have prelus, add them to summary
-        if hasattr(self, 'alpha_summ'):
-            g_summs += self.alpha_summ
-        self.g_sum = tf.summary.merge(g_summs)
-        self.d_sum = tf.summary.merge([self.d_loss_sum,
-                                       self.d_rl_sum,
-                                       self.d_rl_loss_sum,
-                                       self.rl_audio_summ,
-                                       self.real_w_summ,
-                                       self.disc_noise_std_summ])
-
-        if not os.path.exists(os.path.join(config.save_path, 'train')):
-            os.makedirs(os.path.join(config.save_path, 'train'))
-
-        self.writer = tf.summary.FileWriter(os.path.join(config.save_path,
-                                                         'train'),
-                                            self.sess.graph)
-
-        coord = tf.train.Coordinator()
-        threads = tf.train.start_queue_runners(coord=coord)
-
-        print('Sampling some wavs to store sample references...')
-        # Hang onto a copy of wavs so we can feed the same one every time
-        # we store samples to disk for hearing
-        # pick a single batch
-        sample_noisy, sample_wav, \
-        sample_z = self.sess.run([self.gtruth_noisy[0],
-                                  self.gtruth_wavs[0],
-                                  self.zs[0]])
-        print('sample noisy shape: ', sample_noisy.shape)
-        print('sample wav shape: ', sample_wav.shape)
-        print('sample z shape: ', sample_z.shape)
-
-        save_path = config.save_path
-        counter = 0
-        # count number of samples
-        num_examples = 0
-        for record in tf.python_io.tf_record_iterator(self.e2e_dataset):
-            num_examples += 1
-        print('total examples in TFRecords {}: {}'.format(self.e2e_dataset,
-                                                          num_examples))
-        # last samples (those not filling a complete batch) are discarded
-        num_batches = num_examples / self.batch_size
-
-        print('Batches per epoch: ', num_batches)
-
-        if self.load(self.save_path):
-            print('[*] Load SUCCESS')
-        else:
-            print('[!] Load failed')
-        batch_idx = 0
-        curr_epoch = 0
-        batch_timings = []
-        d_fk_losses = []
-        #d_nfk_losses = []
-        d_rl_losses = []
-        g_adv_losses = []
-        g_l1_losses = []
-        try:
-            while not coord.should_stop():
-                start = timeit.default_timer()
-                if counter % config.save_freq == 0:
-                    for d_iter in range(self.disc_updates):
-                        _d_opt, _d_sum, \
-                        d_fk_loss, \
-                        d_rl_loss = self.sess.run([d_opt, self.d_sum,
-                                                   self.d_fk_losses[0],
-                                                   #self.d_nfk_losses[0],
-                                                   self.d_rl_losses[0]])
-                        if self.d_clip_weights:
-                            self.sess.run(self.d_clip)
-                        #d_nfk_loss, \
-
-                    # now G iterations
-                    _g_opt, _g_sum, \
-                    g_adv_loss, \
-                    g_l1_loss = self.sess.run([g_opt, self.g_sum,
-                                               self.g_adv_losses[0],
-                                               self.g_l1_losses[0]])
-                else:
-                    for d_iter in range(self.disc_updates):
-                        _d_opt, \
-                        d_fk_loss, \
-                        d_rl_loss = self.sess.run([d_opt,
-                                                   self.d_fk_losses[0],
-                                                   #self.d_nfk_losses[0],
-                                                   self.d_rl_losses[0]])
-                        #d_nfk_loss, \
-                        if self.d_clip_weights:
-                            self.sess.run(self.d_clip)
-
-                    _g_opt, \
-                    g_adv_loss, \
-                    g_l1_loss = self.sess.run([g_opt, self.g_adv_losses[0],
-                                               self.g_l1_losses[0]])
-                end = timeit.default_timer()
-                batch_timings.append(end - start)
-                d_fk_losses.append(d_fk_loss)
-                #d_nfk_losses.append(d_nfk_loss)
-                d_rl_losses.append(d_rl_loss)
-                g_adv_losses.append(g_adv_loss)
-                g_l1_losses.append(g_l1_loss)
-                print('{}/{} (epoch {}), d_rl_loss = {:.5f}, '
-                      'd_fk_loss = {:.5f}, '#d_nfk_loss = {:.5f}, '
-                      'g_adv_loss = {:.5f}, g_l1_loss = {:.5f},'
-                      ' time/batch = {:.5f}, '
-                      'mtime/batch = {:.5f}'.format(counter,
-                                                    config.epoch * num_batches,
-                                                    curr_epoch,
-                                                    d_rl_loss,
-                                                    d_fk_loss,
-                                                    #d_nfk_loss,
-                                                    g_adv_loss,
-                                                    g_l1_loss,
-                                                    end - start,
-                                                    np.mean(batch_timings)))
-                batch_idx += num_devices
-                counter += num_devices
-                if (counter / num_devices) % config.save_freq == 0:
-                    self.save(config.save_path, counter)
-                    self.writer.add_summary(_g_sum, counter)
-                    self.writer.add_summary(_d_sum, counter)
-                    fdict = {self.gtruth_noisy[0]:sample_noisy,
-                             self.zs[0]:sample_z}
-                    canvas_w = self.sess.run(self.Gs[0],
-                                             feed_dict=fdict)
-                    swaves = sample_wav
-                    sample_dif = sample_wav - sample_noisy
-                    for m in range(min(20, canvas_w.shape[0])):
-                        print('w{} max: {} min: {}'.format(m, np.max(canvas_w[m]), np.min(canvas_w[m])))
-                        wavfile.write(os.path.join(save_path, 'sample_{}-{}.wav'.format(counter, m)), 16e3, canvas_w[m])
-                        if not os.path.exists(os.path.join(save_path, 'gtruth_{}.wav'.format(m))):
-                            wavfile.write(os.path.join(save_path, 'gtruth_{}.wav'.format(m)), 16e3, swaves[m])
-                            wavfile.write(os.path.join(save_path, 'noisy_{}.wav'.format(m)), 16e3, sample_noisy[m])
-                            wavfile.write(os.path.join(save_path, 'dif_{}.wav'.format(m)), 16e3, sample_dif[m])
-                        np.savetxt(os.path.join(save_path, 'd_rl_losses.txt'), d_rl_losses)
-                        np.savetxt(os.path.join(save_path, 'd_fk_losses.txt'), d_fk_losses)
-                        #np.savetxt(os.path.join(save_path, 'd_nfk_losses.txt'), d_nfk_losses)
-                        np.savetxt(os.path.join(save_path, 'g_adv_losses.txt'), g_adv_losses)
-                        np.savetxt(os.path.join(save_path, 'g_l1_losses.txt'), g_l1_losses)
-
-                if batch_idx >= num_batches:
-                    curr_epoch += 1
-                    # re-set batch idx
-                    batch_idx = 0
-                    # check if we have to deactivate L1
-                    if curr_epoch >= config.l1_remove_epoch and self.deactivated_l1 == False:
-                        print('** Deactivating L1 factor! **')
-                        self.sess.run(tf.assign(self.l1_lambda, 0.))
-                        self.deactivated_l1 = True
-                    # check if we have to start decaying noise (if any)
-                    if curr_epoch >= config.denoise_epoch and self.deactivated_noise == False:
-                        # apply noise std decay rate
-                        decay = config.noise_decay
-                        if not hasattr(self, 'curr_noise_std'):
-                            self.curr_noise_std = self.init_noise_std
-                        new_noise_std = decay * self.curr_noise_std
-                        if new_noise_std < config.denoise_lbound:
-                            print('New noise std {} < lbound {}, setting 0.'.format(new_noise_std, config.denoise_lbound))
-                            print('** De-activating noise layer **')
-                            # it it's lower than a lower bound, cancel out completely
-                            new_noise_std = 0.
-                            self.deactivated_noise = True
-                        else:
-                            print('Applying decay {} to noise std {}: {}'.format(decay, self.curr_noise_std, new_noise_std))
-                        self.sess.run(tf.assign(self.disc_noise_std, new_noise_std))
-                        self.curr_noise_std = new_noise_std
-                if curr_epoch >= config.epoch:
-                    # done training
-                    print('Done training; epoch limit {} '
-                          'reached.'.format(self.epoch))
-                    break
-        except tf.errors.OutOfRangeError:
-            print('Done training; epoch limit {} reached.'.format(self.epoch))
-        finally:
-            coord.request_stop()
-        coord.join(threads)
-
-    def clean(self, x):
-        """ clean a utterance x
-            x: numpy array containing the normalized noisy waveform
-        """
-        c_res = None
-        for beg_i in range(0, x.shape[0], 2 ** 14):
-            if x.shape[0] - beg_i  < 2 ** 14:
-                length = x.shape[0] - beg_i
-                pad = (2 ** 14) - length
-            else:
-                length = 2 ** 14
-                pad = 0
-            x_ = np.zeros((self.batch_size, 2 ** 14))
-            if pad > 0:
-                x_[0] = np.concatenate((x[beg_i:beg_i + length], np.zeros(pad)))
-            else:
-                x_[0] = x[beg_i:beg_i + length]
-            print('Cleaning chunk {} -> {}'.format(beg_i, beg_i + length))
-            fdict = {self.gtruth_noisy[0]:x_}
-            canvas_w = self.sess.run(self.Gs[0],
-                                     feed_dict=fdict)[0]
-            canvas_w = canvas_w.reshape((2 ** 14))
-            print('canvas w shape: ', canvas_w.shape)
-            if pad > 0:
-                print('Removing padding of {} samples'.format(pad))
-                # get rid of last padded samples
-                canvas_w = canvas_w[:-pad]
-            if c_res is None:
-                c_res = canvas_w
-            else:
-                c_res = np.concatenate((c_res, canvas_w))
-        return c_res
-
-
-class SEAE(Model):
-    """ Speech Enhancement Auto Encoder """
-    def __init__(self, sess, args, devices, infer=False):
-        self.args = args
-        self.sess = sess
-        self.keep_prob = 1.
-        if infer:
-            self.keep_prob_var = tf.Variable(self.keep_prob, trainable=False)
-        else:
-            self.keep_prob = 0.5
-            self.keep_prob_var = tf.Variable(self.keep_prob, trainable=False)
-        self.batch_size = args.batch_size
-        self.epoch = args.epoch
-        self.devices = devices
-        self.save_path = args.save_path
-        # canvas size
-        self.canvas_size = args.canvas_size
-        self.g_enc_depths = [16, 32, 32, 64, 64, 128, 128, 256, 256, 512, 1024]
-        self.e2e_dataset = args.e2e_dataset
-        # define the Generator
-        self.generator = AEGenerator(self)
-        self.build_model(args)
-
-    def build_model(self, config):
-        all_g_grads = []
-        g_opt = tf.train.AdamOptimizer(config.g_learning_rate, config.beta_1)
-
-        for idx, device in enumerate(self.devices):
-            with tf.device("/%s" % device):
-                with tf.name_scope("device_%s" % idx):
-                    with variables_on_gpu0():
-                        self.build_model_single_gpu(idx)
-                        g_grads = g_opt.compute_gradients(self.g_losses[-1],
-                                                          var_list=self.g_vars)
-                        all_g_grads.append(g_grads)
-                        tf.get_variable_scope().reuse_variables()
-        avg_g_grads = average_gradients(all_g_grads)
-        self.g_opt = g_opt.apply_gradients(avg_g_grads)
-
-
-    def build_model_single_gpu(self, gpu_idx):
-        if gpu_idx == 0:
-            # create the nodes to load for input pipeline
-            filename_queue = tf.train.string_input_producer([self.e2e_dataset])
-            self.get_wav, self.get_noisy = read_and_decode(filename_queue,
-                                                           2 ** 14)
-        # load the data to input pipeline
-        wavbatch, \
-        noisybatch = tf.train.shuffle_batch([self.get_wav,
-                                             self.get_noisy],
-                                             batch_size=self.batch_size,
-                                             num_threads=2,
-                                             capacity=1000 + 3 * self.batch_size,
-                                             min_after_dequeue=1000,
-                                             name='wav_and_noisy')
-        if gpu_idx == 0:
-            self.Gs = []
-            self.zs = []
-            self.gtruth_wavs = []
-            self.gtruth_noisy = []
-
-        self.gtruth_wavs.append(wavbatch)
-        self.gtruth_noisy.append(noisybatch)
-
-        # add channels dimension to manipulate in D and G
-        wavbatch = tf.expand_dims(wavbatch, -1)
-        noisybatch = tf.expand_dims(noisybatch, -1)
-        if gpu_idx == 0:
-            #self.sample_wavs = tf.placeholder(tf.float32, [self.batch_size,
-            #                                               self.canvas_size],
-            #                                  name='sample_wavs')
-            self.reference_G = self.generator(noisybatch, is_ref=True,
-                                              spk=None, z_on=False)
-
-        G = self.generator(noisybatch, is_ref=False, spk=None, z_on=False)
-        print('GAE shape: ', G.get_shape())
-        self.Gs.append(G)
-
-        self.rl_audio_summ = audio_summary('real_audio', wavbatch)
-        self.real_w_summ = histogram_summary('real_wav', wavbatch)
-        self.noisy_audio_summ = audio_summary('noisy_audio', noisybatch)
-        self.noisy_w_summ = histogram_summary('noisy_wav', noisybatch)
-        self.gen_audio_summ = audio_summary('G_audio', G)
-        self.gen_summ = histogram_summary('G_wav', G)
-
-        if gpu_idx == 0:
-            self.g_losses = []
-
-        # Add the L1 loss to G
-        g_loss = tf.reduce_mean(tf.abs(tf.sub(G, wavbatch)))
-
-        self.g_losses.append(g_loss)
-
-        self.g_loss_sum = scalar_summary("g_loss", g_loss)
-
-        if gpu_idx == 0:
-            self.get_vars()
-
-    def get_vars(self):
-        t_vars = tf.trainable_variables()
-        self.g_vars = [var for var in t_vars if var.name.startswith('g_')]
-        for x in t_vars:
-            assert x in self.g_vars, x.name
-        self.all_vars = t_vars
-
-    def train(self, config, devices):
-        """ Train the SEAE """
-
-        print('Initializing optimizer...')
-        # init optimizer
-        g_opt = self.g_opt
-        num_devices = len(devices)
-
-        try:
-            init = tf.global_variables_initializer()
-        except AttributeError:
-            # fall back to old implementation
-            init = tf.initialize_all_variables()
-
-        print('Initializing variables...')
-        self.sess.run(init)
-        self.saver = tf.train.Saver()
-        self.g_sum = tf.summary.merge([self.g_loss_sum,
-                                       self.gen_summ,
-                                       self.rl_audio_summ,
-                                       self.real_w_summ,
-                                       self.gen_audio_summ])
-
-        if not os.path.exists(os.path.join(config.save_path, 'train')):
-            os.makedirs(os.path.join(config.save_path, 'train'))
-
-        self.writer = tf.summary.FileWriter(os.path.join(config.save_path,
-                                                         'train'),
-                                            self.sess.graph)
-
-        coord = tf.train.Coordinator()
-        threads = tf.train.start_queue_runners(coord=coord)
-
-        print('Sampling some wavs to store sample references...')
-        # Hang onto a copy of wavs so we can feed the same one every time
-        # we store samples to disk for hearing
-        # pick a single batch
-        sample_noisy, \
-        sample_wav = self.sess.run([self.gtruth_noisy[0],
-                                    self.gtruth_wavs[0]])
-        print('sample noisy shape: ', sample_noisy.shape)
-        print('sample wav shape: ', sample_wav.shape)
-        save_path = config.save_path
-        counter = 0
-        # count number of samples
-        num_examples = 0
-        for record in tf.python_io.tf_record_iterator(self.e2e_dataset):
-            num_examples += 1
-        print('total examples in TFRecords {}: {}'.format(self.e2e_dataset,
-                                                          num_examples))
-        # last samples (those not filling a complete batch) are discarded
-        num_batches = num_examples / self.batch_size
-
-        print('Batches per epoch: ', num_batches)
-
-        if self.load(self.save_path):
-            print('[*] Load SUCCESS')
-        else:
-            print('[!] Load failed')
-        batch_idx = 0
-        curr_epoch = 0
-        batch_timings = []
-        g_losses = []
-        try:
-            while not coord.should_stop():
-                start = timeit.default_timer()
-                if counter % config.save_freq == 0:
-                    # now G iterations
-                    _g_opt, _g_sum, \
-                    g_loss = self.sess.run([g_opt, self.g_sum,
-                                            self.g_losses[0]])
-                else:
-                    _g_opt, \
-                    g_loss = self.sess.run([g_opt, self.g_losses[0]])
-
-                end = timeit.default_timer()
-                batch_timings.append(end - start)
-                g_losses.append(g_loss)
-                print('{}/{} (epoch {}), g_loss = {:.5f},'
-                      ' time/batch = {:.5f}, '
-                      'mtime/batch = {:.5f}'.format(counter,
-                                                    config.epoch * num_batches,
-                                                    curr_epoch,
-                                                    g_loss,
-                                                    end - start,
-                                                    np.mean(batch_timings)))
-                batch_idx += num_devices
-                counter += num_devices
-                if (counter / num_devices) % config.save_freq == 0:
-                    self.save(config.save_path, counter)
-                    self.writer.add_summary(_g_sum, counter)
-                    fdict = {self.gtruth_noisy[0]:sample_noisy}
-                    canvas_w = self.sess.run(self.Gs[0],
-                                             feed_dict=fdict)
-                    swaves = sample_wav
-                    sample_dif = sample_wav - sample_noisy
-                    for m in range(min(20, canvas_w.shape[0])):
-                        print('w{} max: {} min: {}'.format(m, np.max(canvas_w[m]), np.min(canvas_w[m])))
-                        wavfile.write(os.path.join(save_path, 'sample_{}-{}.wav'.format(counter, m)), 16e3, canvas_w[m])
-                        if not os.path.exists(os.path.join(save_path, 'gtruth_{}.wav'.format(m))):
-                            wavfile.write(os.path.join(save_path, 'gtruth_{}.wav'.format(m)), 16e3, swaves[m])
-                            wavfile.write(os.path.join(save_path, 'noisy_{}.wav'.format(m)), 16e3, sample_noisy[m])
-                            wavfile.write(os.path.join(save_path, 'dif_{}.wav'.format(m)), 16e3, sample_dif[m])
-                        np.savetxt(os.path.join(save_path, 'g_losses.txt'), g_losses)
-
-                if batch_idx >= num_batches:
-                    curr_epoch += 1
-                    # re-set batch idx
-                    batch_idx = 0
-                if curr_epoch >= config.epoch:
-                    # done training
-                    print('Done training; epoch limit {} '
-                          'reached.'.format(self.epoch))
-                    break
-        except tf.errors.OutOfRangeError:
-            print('[!] Reached queues limits in training loop')
-        finally:
-            coord.request_stop()
-        coord.join(threads)
+from __future__ import print_function
+import tensorflow as tf
+from tensorflow.contrib.layers import batch_norm, fully_connected, flatten
+from tensorflow.contrib.layers import xavier_initializer
+from scipy.io import wavfile
+from generator import *
+from discriminator import *
+import numpy as np
+from data_loader import read_and_decode
+from bnorm import VBN
+from ops import *
+import timeit
+import os
+
+
+class Model(object):
+
+    def __init__(self, name='BaseModel'):
+        self.name = name
+
+    def save(self, save_path, step):
+        model_name = self.name
+        if not os.path.exists(save_path):
+            os.makedirs(save_path)
+        if not hasattr(self, 'saver'):
+            self.saver = tf.train.Saver()
+        self.saver.save(self.sess,
+                        os.path.join(save_path, model_name),
+                        global_step=step)
+
+    def load(self, save_path, model_file=None):
+        if not os.path.exists(save_path):
+            print('[!] Checkpoints path does not exist...')
+            return False
+        print('[*] Reading checkpoints...')
+        if model_file is None:
+            ckpt = tf.train.get_checkpoint_state(save_path)
+            if ckpt and ckpt.model_checkpoint_path:
+                ckpt_name = os.path.basename(ckpt.model_checkpoint_path)
+            else:
+                return False
+        else:
+            ckpt_name = model_file
+        if not hasattr(self, 'saver'):
+            self.saver = tf.train.Saver()
+        self.saver.restore(self.sess, os.path.join(save_path, ckpt_name))
+        print('[*] Read {}'.format(ckpt_name))
+        return True
+
+
+
+class SEGAN(Model):
+    """ Speech Enhancement Generative Adversarial Network """
+    def __init__(self, sess, args, devices, infer=False, name='SEGAN'):
+        super(SEGAN, self).__init__(name)
+        self.args = args
+        self.sess = sess
+        self.keep_prob = 1.
+        if infer:
+            self.keep_prob_var = tf.Variable(self.keep_prob, trainable=False)
+        else:
+            self.keep_prob = 0.5
+            self.keep_prob_var = tf.Variable(self.keep_prob, trainable=False)
+        self.batch_size = args.batch_size
+        self.epoch = args.epoch
+        self.d_label_smooth = args.d_label_smooth
+        self.devices = devices
+        self.z_dim = args.z_dim
+        self.z_depth = args.z_depth
+        # clip D values
+        self.d_clip_weights = False
+        # apply VBN or regular BN?
+        self.disable_vbn = False
+        self.save_path = args.save_path
+        # num of updates to be applied to D before G
+        # this is k in original GAN paper (https://arxiv.org/abs/1406.2661)
+        self.disc_updates = 1
+        # canvas size
+        self.canvas_size = args.canvas_size
+        self.deactivated_noise = False
+        # dilation factors per layer (only in atrous conv G config)
+        self.g_dilated_blocks = [1, 2, 4, 8, 16, 32, 64, 128, 256, 512]
+        # num fmaps for AutoEncoder SEGAN (v1)
+        self.g_enc_depths = [16, 32, 32, 64, 64, 128, 128, 256, 256, 512, 1024]
+        # Define D fmaps
+        self.d_num_fmaps = [16, 32, 32, 64, 64, 128, 128, 256, 256, 512, 1024]
+        self.init_noise_std = args.init_noise_std
+        self.disc_noise_std = tf.Variable(self.init_noise_std, trainable=False)
+        self.disc_noise_std_summ = scalar_summary('disc_noise_std',
+                                                  self.disc_noise_std)
+        self.e2e_dataset = args.e2e_dataset
+        # G's supervised loss weight
+        self.l1_weight = args.init_l1_weight
+        self.l1_lambda = tf.Variable(self.l1_weight, trainable=False)
+        self.deactivated_l1 = False
+        # define the functions
+        self.discriminator = discriminator
+        # register G non linearity
+        self.g_nl = args.g_nl
+        if args.g_type == 'ae':
+            self.generator = AEGenerator(self)
+        elif args.g_type == 'dwave':
+            self.generator = Generator(self)
+        else:
+            raise ValueError('Unrecognized G type {}'.format(args.g_type))
+        self.build_model(args)
+
+    def build_model(self, config):
+        all_d_grads = []
+        all_g_grads = []
+
+        #d_opt = tf.train.RMSPropOptimizer(config.d_learning_rate)
+        #g_opt = tf.train.RMSPropOptimizer(config.g_learning_rate)
+        d_opt = tf.train.AdamOptimizer(config.d_learning_rate,
+                                       beta1=config.beta_1)
+        g_opt = tf.train.AdamOptimizer(config.g_learning_rate,
+                                       beta1=config.beta_1)
+
+        with tf.variable_scope(tf.get_variable_scope()) as scope:
+          for idx, device in enumerate(self.devices):
+              with tf.device("/%s" % device):
+                  with tf.name_scope("device_%s" % idx):
+                      with variables_on_gpu0():
+                          self.build_model_single_gpu(idx)
+
+                          d_grads = d_opt.compute_gradients(self.d_losses[-1],
+                                                            var_list=self.d_vars)
+                          g_grads = g_opt.compute_gradients(self.g_losses[-1],
+                                                            var_list=self.g_vars)
+                          all_d_grads.append(d_grads)
+                          all_g_grads.append(g_grads)
+
+        avg_d_grads = average_gradients(all_d_grads)
+        avg_g_grads = average_gradients(all_g_grads)
+        self.d_opt = d_opt.apply_gradients(avg_d_grads)
+        self.g_opt = g_opt.apply_gradients(avg_g_grads)
+
+
+    def build_model_single_gpu(self, gpu_idx):
+        if gpu_idx == 0:
+            # create the nodes to load for input pipeline
+            filename_queue = tf.train.string_input_producer([self.e2e_dataset])
+            self.get_wav, self.get_noisy = read_and_decode(filename_queue,
+                                                           2 ** 14)
+        # load the data to input pipeline
+        wavbatch, \
+        noisybatch = tf.train.shuffle_batch([self.get_wav,
+                                             self.get_noisy],
+                                             batch_size=self.batch_size,
+                                             num_threads=2,
+                                             capacity=1000 + 3 * self.batch_size,
+                                             min_after_dequeue=1000,
+                                             name='wav_and_noisy')
+        if gpu_idx == 0:
+            self.Gs = []
+            self.zs = []
+            self.gtruth_wavs = []
+            self.gtruth_noisy = []
+
+        self.gtruth_wavs.append(wavbatch)
+        self.gtruth_noisy.append(noisybatch)
+
+        # add channels dimension to manipulate in D and G
+        wavbatch = tf.expand_dims(wavbatch, -1)
+        noisybatch = tf.expand_dims(noisybatch, -1)
+        # by default leaky relu is used
+        do_prelu = False
+        if self.g_nl == 'prelu':
+            do_prelu = True
+        if gpu_idx == 0:
+            #self.sample_wavs = tf.placeholder(tf.float32, [self.batch_size,
+            #                                               self.canvas_size],
+            #                                  name='sample_wavs')
+            ref_Gs = self.generator(noisybatch, is_ref=True,
+                                    spk=None,
+                                    do_prelu=do_prelu)
+            print('num of G returned: ', len(ref_Gs))
+            self.reference_G = ref_Gs[0]
+            self.ref_z = ref_Gs[1]
+            if do_prelu:
+                self.ref_alpha = ref_Gs[2:]
+                self.alpha_summ = []
+                for m, ref_alpha in enumerate(self.ref_alpha):
+                    # add a summary per alpha
+                    self.alpha_summ.append(histogram_summary('alpha_{}'.format(m),
+                                                             ref_alpha))
+            # make a dummy copy of discriminator to have variables and then
+            # be able to set up the variable reuse for all other devices
+            # merge along channels and this would be a real batch
+            dummy_joint = tf.concat(axis=2, values=[wavbatch, noisybatch])
+            dummy = discriminator(self, dummy_joint,
+                                  reuse=False)
+
+        G, z  = self.generator(noisybatch, is_ref=False, spk=None,
+                               do_prelu=do_prelu)
+        self.Gs.append(G)
+        self.zs.append(z)
+
+        # add new dimension to merge with other pairs
+        D_rl_joint = tf.concat(axis=2, values=[wavbatch, noisybatch])
+        D_fk_joint = tf.concat(axis=2, values=[G, noisybatch])
+        # build rl discriminator
+        d_rl_logits = discriminator(self, D_rl_joint, reuse=True)
+        # build fk G discriminator
+        d_fk_logits = discriminator(self, D_fk_joint, reuse=True)
+
+        # make disc variables summaries
+        self.d_rl_sum = histogram_summary("d_real", d_rl_logits)
+        self.d_fk_sum = histogram_summary("d_fake", d_fk_logits)
+        #self.d_nfk_sum = histogram_summary("d_noisyfake", d_nfk_logits)
+
+        self.rl_audio_summ = audio_summary('real_audio', wavbatch)
+        self.real_w_summ = histogram_summary('real_wav', wavbatch)
+        self.noisy_audio_summ = audio_summary('noisy_audio', noisybatch)
+        self.noisy_w_summ = histogram_summary('noisy_wav', noisybatch)
+        self.gen_audio_summ = audio_summary('G_audio', G)
+        self.gen_summ = histogram_summary('G_wav', G)
+
+        if gpu_idx == 0:
+            self.g_losses = []
+            self.g_l1_losses = []
+            self.g_adv_losses = []
+            self.d_rl_losses = []
+            self.d_fk_losses = []
+            #self.d_nfk_losses = []
+            self.d_losses = []
+
+        d_rl_loss = tf.reduce_mean(tf.squared_difference(d_rl_logits, 1.))
+        d_fk_loss = tf.reduce_mean(tf.squared_difference(d_fk_logits, 0.))
+        #d_nfk_loss = tf.reduce_mean(tf.squared_difference(d_nfk_logits, 0.))
+        g_adv_loss = tf.reduce_mean(tf.squared_difference(d_fk_logits, 1.))
+
+        d_loss = d_rl_loss + d_fk_loss
+
+        # Add the L1 loss to G
+        g_l1_loss = self.l1_lambda * tf.reduce_mean(tf.abs(tf.subtract(G, wavbatch)))
+
+        g_loss = g_adv_loss + g_l1_loss
+
+        self.g_l1_losses.append(g_l1_loss)
+        self.g_adv_losses.append(g_adv_loss)
+        self.g_losses.append(g_loss)
+        self.d_rl_losses.append(d_rl_loss)
+        self.d_fk_losses.append(d_fk_loss)
+        #self.d_nfk_losses.append(d_nfk_loss)
+        self.d_losses.append(d_loss)
+
+        self.d_rl_loss_sum = scalar_summary("d_rl_loss", d_rl_loss)
+        self.d_fk_loss_sum = scalar_summary("d_fk_loss",
+                                            d_fk_loss)
+        #self.d_nfk_loss_sum = scalar_summary("d_nfk_loss",
+        #                                     d_nfk_loss)
+        self.g_loss_sum = scalar_summary("g_loss", g_loss)
+        self.g_loss_l1_sum = scalar_summary("g_l1_loss", g_l1_loss)
+        self.g_loss_adv_sum = scalar_summary("g_adv_loss", g_adv_loss)
+        self.d_loss_sum = scalar_summary("d_loss", d_loss)
+
+        if gpu_idx == 0:
+            self.get_vars()
+
+
+    def get_vars(self):
+        t_vars = tf.trainable_variables()
+        self.d_vars_dict = {}
+        self.g_vars_dict = {}
+        for var in t_vars:
+            if var.name.startswith('d_'):
+                self.d_vars_dict[var.name] = var
+            if var.name.startswith('g_'):
+                self.g_vars_dict[var.name] = var
+        self.d_vars = list(self.d_vars_dict.values())
+        self.g_vars = list(self.g_vars_dict.values())
+
+        for x in self.d_vars:
+            assert x not in self.g_vars
+        for x in self.g_vars:
+            assert x not in self.d_vars
+        for x in t_vars:
+            assert x in self.g_vars or x in self.d_vars, x.name
+        self.all_vars = t_vars
+        if self.d_clip_weights:
+            print('Clipping D weights')
+            self.d_clip = [v.assign(tf.clip_by_value(v, -0.05, 0.05)) for v in self.d_vars]
+        else:
+            print('Not clipping D weights')
+
+    def vbn(self, tensor, name):
+        if self.disable_vbn:
+            class Dummy(object):
+                # Do nothing here, no bnorm
+                def __init__(self, tensor, ignored):
+                    self.reference_output=tensor
+                def __call__(self, x):
+                    return x
+            VBN_cls = Dummy
+        else:
+            VBN_cls = VBN
+        if not hasattr(self, name):
+            vbn = VBN_cls(tensor, name)
+            setattr(self, name, vbn)
+            return vbn.reference_output
+        vbn = getattr(self, name)
+        return vbn(tensor)
+
+    def train(self, config, devices):
+        """ Train the SEGAN """
+
+        print('Initializing optimizers...')
+        # init optimizers
+        d_opt = self.d_opt
+        g_opt = self.g_opt
+        num_devices = len(devices)
+
+        try:
+            init = tf.global_variables_initializer()
+        except AttributeError:
+            # fall back to old implementation
+            init = tf.global_variables_initializer()
+
+        print('Initializing variables...')
+        self.sess.run(init)
+        g_summs = [self.d_fk_sum,
+                   #self.d_nfk_sum,
+                   self.d_fk_loss_sum,
+                   #self.d_nfk_loss_sum,
+                   self.g_loss_sum,
+                   self.g_loss_l1_sum,
+                   self.g_loss_adv_sum,
+                   self.gen_summ,
+                   self.gen_audio_summ]
+        # if we have prelus, add them to summary
+        if hasattr(self, 'alpha_summ'):
+            g_summs += self.alpha_summ
+        self.g_sum = tf.summary.merge(g_summs)
+        self.d_sum = tf.summary.merge([self.d_loss_sum,
+                                       self.d_rl_sum,
+                                       self.d_rl_loss_sum,
+                                       self.rl_audio_summ,
+                                       self.real_w_summ,
+                                       self.disc_noise_std_summ])
+
+        if not os.path.exists(os.path.join(config.save_path, 'train')):
+            os.makedirs(os.path.join(config.save_path, 'train'))
+
+        self.writer = tf.summary.FileWriter(os.path.join(config.save_path,
+                                                         'train'),
+                                            self.sess.graph)
+
+        coord = tf.train.Coordinator()
+        threads = tf.train.start_queue_runners(coord=coord)
+
+        print('Sampling some wavs to store sample references...')
+        # Hang onto a copy of wavs so we can feed the same one every time
+        # we store samples to disk for hearing
+        # pick a single batch
+        sample_noisy, sample_wav, \
+        sample_z = self.sess.run([self.gtruth_noisy[0],
+                                  self.gtruth_wavs[0],
+                                  self.zs[0]])
+        print('sample noisy shape: ', sample_noisy.shape)
+        print('sample wav shape: ', sample_wav.shape)
+        print('sample z shape: ', sample_z.shape)
+
+        save_path = config.save_path
+        counter = 0
+        # count number of samples
+        num_examples = 0
+        for record in tf.python_io.tf_record_iterator(self.e2e_dataset):
+            num_examples += 1
+        print('total examples in TFRecords {}: {}'.format(self.e2e_dataset,
+                                                          num_examples))
+        # last samples (those not filling a complete batch) are discarded
+        num_batches = num_examples / self.batch_size
+
+        print('Batches per epoch: ', num_batches)
+
+        if self.load(self.save_path):
+            print('[*] Load SUCCESS')
+        else:
+            print('[!] Load failed')
+        batch_idx = 0
+        curr_epoch = 0
+        batch_timings = []
+        d_fk_losses = []
+        #d_nfk_losses = []
+        d_rl_losses = []
+        g_adv_losses = []
+        g_l1_losses = []
+        try:
+            while not coord.should_stop():
+                start = timeit.default_timer()
+                if counter % config.save_freq == 0:
+                    for d_iter in range(self.disc_updates):
+                        _d_opt, _d_sum, \
+                        d_fk_loss, \
+                        d_rl_loss = self.sess.run([d_opt, self.d_sum,
+                                                   self.d_fk_losses[0],
+                                                   #self.d_nfk_losses[0],
+                                                   self.d_rl_losses[0]])
+                        if self.d_clip_weights:
+                            self.sess.run(self.d_clip)
+                        #d_nfk_loss, \
+
+                    # now G iterations
+                    _g_opt, _g_sum, \
+                    g_adv_loss, \
+                    g_l1_loss = self.sess.run([g_opt, self.g_sum,
+                                               self.g_adv_losses[0],
+                                               self.g_l1_losses[0]])
+                else:
+                    for d_iter in range(self.disc_updates):
+                        _d_opt, \
+                        d_fk_loss, \
+                        d_rl_loss = self.sess.run([d_opt,
+                                                   self.d_fk_losses[0],
+                                                   #self.d_nfk_losses[0],
+                                                   self.d_rl_losses[0]])
+                        #d_nfk_loss, \
+                        if self.d_clip_weights:
+                            self.sess.run(self.d_clip)
+
+                    _g_opt, \
+                    g_adv_loss, \
+                    g_l1_loss = self.sess.run([g_opt, self.g_adv_losses[0],
+                                               self.g_l1_losses[0]])
+                end = timeit.default_timer()
+                batch_timings.append(end - start)
+                d_fk_losses.append(d_fk_loss)
+                #d_nfk_losses.append(d_nfk_loss)
+                d_rl_losses.append(d_rl_loss)
+                g_adv_losses.append(g_adv_loss)
+                g_l1_losses.append(g_l1_loss)
+                print('{}/{} (epoch {}), d_rl_loss = {:.5f}, '
+                      'd_fk_loss = {:.5f}, '#d_nfk_loss = {:.5f}, '
+                      'g_adv_loss = {:.5f}, g_l1_loss = {:.5f},'
+                      ' time/batch = {:.5f}, '
+                      'mtime/batch = {:.5f}'     .format(counter,
+                                                    config.epoch * num_batches,
+                                                    curr_epoch,
+                                                    d_rl_loss,
+                                                    d_fk_loss,
+                                                    #d_nfk_loss,
+                                                    g_adv_loss,
+                                                    g_l1_loss,
+                                                    end - start,
+                                                    np.mean(batch_timings)))
+                batch_idx += num_devices
+                counter += num_devices
+                if (counter / num_devices) % config.save_freq == 0:
+                    self.save(config.save_path, counter)
+                    self.writer.add_summary(_g_sum, counter)
+                    self.writer.add_summary(_d_sum, counter)
+                    fdict = {self.gtruth_noisy[0]:sample_noisy,
+                             self.zs[0]:sample_z}
+                    canvas_w = self.sess.run(self.Gs[0],
+                                             feed_dict=fdict)
+                    swaves = sample_wav
+                    sample_dif = sample_wav - sample_noisy
+                    for m in range(min(20, canvas_w.shape[0])):
+                        print('w{} max: {} min: {}'.format(m, np.max(canvas_w[m]), np.min(canvas_w[m])))
+                        wavfile.write(os.path.join(save_path, 'sample_{}-{}.wav'.format(counter, m)), 16000, canvas_w[m])
+                        if not os.path.exists(os.path.join(save_path, 'gtruth_{}.wav'.format(m))):
+                            wavfile.write(os.path.join(save_path, 'gtruth_{}.wav'.format(m)), 16000, swaves[m])
+                            wavfile.write(os.path.join(save_path, 'noisy_{}.wav'.format(m)), 16000, sample_noisy[m])
+                            wavfile.write(os.path.join(save_path, 'dif_{}.wav'.format(m)), 16000, sample_dif[m])
+                        np.savetxt(os.path.join(save_path, 'd_rl_losses.txt'), d_rl_losses)
+                        np.savetxt(os.path.join(save_path, 'd_fk_losses.txt'), d_fk_losses)
+                        #np.savetxt(os.path.join(save_path, 'd_nfk_losses.txt'), d_nfk_losses)
+                        np.savetxt(os.path.join(save_path, 'g_adv_losses.txt'), g_adv_losses)
+                        np.savetxt(os.path.join(save_path, 'g_l1_losses.txt'), g_l1_losses)
+
+                if batch_idx >= int(num_batches):
+                    curr_epoch += 1
+                    # re-set batch idx
+                    batch_idx = 0
+                    # check if we have to deactivate L1
+                    if curr_epoch >= config.l1_remove_epoch and self.deactivated_l1 == False:
+                        print('** Deactivating L1 factor! **')
+                        self.sess.run(tf.assign(self.l1_lambda, 0.))
+                        self.deactivated_l1 = True
+                    # check if we have to start decaying noise (if any)
+                    if curr_epoch >= config.denoise_epoch and self.deactivated_noise == False:
+                        # apply noise std decay rate
+                        decay = config.noise_decay
+                        if not hasattr(self, 'curr_noise_std'):
+                            self.curr_noise_std = self.init_noise_std
+                        new_noise_std = decay * self.curr_noise_std
+                        if new_noise_std < config.denoise_lbound:
+                            print('New noise std {} < lbound {}, setting 0.'.format(new_noise_std, config.denoise_lbound))
+                            print('** De-activating noise layer **')
+                            # it it's lower than a lower bound, cancel out completely
+                            new_noise_std = 0.
+                            self.deactivated_noise = True
+                        else:
+                            print('Applying decay {} to noise std {}: {}'.format(decay, self.curr_noise_std, new_noise_std))
+                        self.sess.run(tf.assign(self.disc_noise_std, new_noise_std))
+                        self.curr_noise_std = new_noise_std
+                if curr_epoch >= config.epoch:
+                    # done training
+                    print('Done training; epoch limit {} '
+                          'reached.'.format(self.epoch))
+                    break
+        except tf.errors.OutOfRangeError:
+            print('Done training; epoch limit {} reached.'.format(self.epoch))
+        finally:
+            coord.request_stop()
+        coord.join(threads)
+
+    def clean(self, x):
+        """ clean a utterance x
+            x: numpy array containing the normalized noisy waveform
+        """
+        c_res = None
+        for beg_i in range(0, x.shape[0], 2 ** 14):
+            if x.shape[0] - beg_i  < 2 ** 14:
+                length = x.shape[0] - beg_i
+                pad = (2 ** 14) - length
+            else:
+                length = 2 ** 14
+                pad = 0
+            x_ = np.zeros((self.batch_size, 2 ** 14))
+            if pad > 0:
+                x_[0] = np.concatenate((x[beg_i:beg_i + length], np.zeros(pad)))
+            else:
+                x_[0] = x[beg_i:beg_i + length]
+            print('Cleaning chunk {} -> {}'.format(beg_i, beg_i + length))
+            fdict = {self.gtruth_noisy[0]:x_}
+            canvas_w = self.sess.run(self.Gs[0],
+                                     feed_dict=fdict)[0]
+            canvas_w = canvas_w.reshape((2 ** 14))
+            print('canvas w shape: ', canvas_w.shape)
+            if pad > 0:
+                print('Removing padding of {} samples'.format(pad))
+                # get rid of last padded samples
+                canvas_w = canvas_w[:-pad]
+            if c_res is None:
+                c_res = canvas_w
+            else:
+                c_res = np.concatenate((c_res, canvas_w))
+        return c_res
+
+
+class SEAE(Model):
+    """ Speech Enhancement Auto Encoder """
+    def __init__(self, sess, args, devices, infer=False):
+        self.args = args
+        self.sess = sess
+        self.keep_prob = 1.
+        if infer:
+            self.keep_prob_var = tf.Variable(self.keep_prob, trainable=False)
+        else:
+            self.keep_prob = 0.5
+            self.keep_prob_var = tf.Variable(self.keep_prob, trainable=False)
+        self.batch_size = args.batch_size
+        self.epoch = args.epoch
+        self.devices = devices
+        self.save_path = args.save_path
+        # canvas size
+        self.canvas_size = args.canvas_size
+        self.g_enc_depths = [16, 32, 32, 64, 64, 128, 128, 256, 256, 512, 1024]
+        self.e2e_dataset = args.e2e_dataset
+        # define the Generator
+        self.generator = AEGenerator(self)
+        self.build_model(args)
+
+    def build_model(self, config):
+        all_g_grads = []
+        g_opt = tf.train.AdamOptimizer(config.g_learning_rate, config.beta_1)
+
+        for idx, device in enumerate(self.devices):
+            with tf.device("/%s" % device):
+                with tf.name_scope("device_%s" % idx):
+                    with variables_on_gpu0():
+                        self.build_model_single_gpu(idx)
+                        g_grads = g_opt.compute_gradients(self.g_losses[-1],
+                                                          var_list=self.g_vars)
+                        all_g_grads.append(g_grads)
+                        tf.get_variable_scope().reuse_variables()
+        avg_g_grads = average_gradients(all_g_grads)
+        self.g_opt = g_opt.apply_gradients(avg_g_grads)
+
+
+    def build_model_single_gpu(self, gpu_idx):
+        if gpu_idx == 0:
+            # create the nodes to load for input pipeline
+            filename_queue = tf.train.string_input_producer([self.e2e_dataset])
+            self.get_wav, self.get_noisy = read_and_decode(filename_queue,
+                                                           2 ** 14)
+        # load the data to input pipeline
+        wavbatch, \
+        noisybatch = tf.train.shuffle_batch([self.get_wav,
+                                             self.get_noisy],
+                                             batch_size=self.batch_size,
+                                             num_threads=2,
+                                             capacity=1000 + 3 * self.batch_size,
+                                             min_after_dequeue=1000,
+                                             name='wav_and_noisy')
+        if gpu_idx == 0:
+            self.Gs = []
+            self.zs = []
+            self.gtruth_wavs = []
+            self.gtruth_noisy = []
+
+        self.gtruth_wavs.append(wavbatch)
+        self.gtruth_noisy.append(noisybatch)
+
+        # add channels dimension to manipulate in D and G
+        wavbatch = tf.expand_dims(wavbatch, -1)
+        noisybatch = tf.expand_dims(noisybatch, -1)
+        if gpu_idx == 0:
+            #self.sample_wavs = tf.placeholder(tf.float32, [self.batch_size,
+            #                                               self.canvas_size],
+            #                                  name='sample_wavs')
+            self.reference_G = self.generator(noisybatch, is_ref=True,
+                                              spk=None, z_on=False)
+
+        G = self.generator(noisybatch, is_ref=False, spk=None, z_on=False)
+        print('GAE shape: ', G.get_shape())
+        self.Gs.append(G)
+
+        self.rl_audio_summ = audio_summary('real_audio', wavbatch)
+        self.real_w_summ = histogram_summary('real_wav', wavbatch)
+        self.noisy_audio_summ = audio_summary('noisy_audio', noisybatch)
+        self.noisy_w_summ = histogram_summary('noisy_wav', noisybatch)
+        self.gen_audio_summ = audio_summary('G_audio', G)
+        self.gen_summ = histogram_summary('G_wav', G)
+
+        if gpu_idx == 0:
+            self.g_losses = []
+
+        # Add the L1 loss to G
+        g_loss = tf.reduce_mean(tf.abs(tf.subtract(G, wavbatch)))
+
+        self.g_losses.append(g_loss)
+
+        self.g_loss_sum = scalar_summary("g_loss", g_loss)
+
+        if gpu_idx == 0:
+            self.get_vars()
+
+    def get_vars(self):
+        t_vars = tf.trainable_variables()
+        self.g_vars = [var for var in t_vars if var.name.startswith('g_')]
+        for x in t_vars:
+            assert x in self.g_vars, x.name
+        self.all_vars = t_vars
+
+    def train(self, config, devices):
+        """ Train the SEAE """
+
+        print('Initializing optimizer...')
+        # init optimizer
+        g_opt = self.g_opt
+        num_devices = len(devices)
+
+        try:
+            init = tf.global_variables_initializer()
+        except AttributeError:
+            # fall back to old implementation
+            init = tf.global_variables_initializer()
+
+        print('Initializing variables...')
+        self.sess.run(init)
+        self.saver = tf.train.Saver()
+        self.g_sum = tf.summary.merge([self.g_loss_sum,
+                                       self.gen_summ,
+                                       self.rl_audio_summ,
+                                       self.real_w_summ,
+                                       self.gen_audio_summ])
+
+        if not os.path.exists(os.path.join(config.save_path, 'train')):
+            os.makedirs(os.path.join(config.save_path, 'train'))
+
+        self.writer = tf.summary.FileWriter(os.path.join(config.save_path,
+                                                         'train'),
+                                            self.sess.graph)
+
+        coord = tf.train.Coordinator()
+        threads = tf.train.start_queue_runners(coord=coord)
+
+        print('Sampling some wavs to store sample references...')
+        # Hang onto a copy of wavs so we can feed the same one every time
+        # we store samples to disk for hearing
+        # pick a single batch
+        sample_noisy, \
+        sample_wav = self.sess.run([self.gtruth_noisy[0],
+                                    self.gtruth_wavs[0]])
+        print('sample noisy shape: ', sample_noisy.shape)
+        print('sample wav shape: ', sample_wav.shape)
+        save_path = config.save_path
+        counter = 0
+        # count number of samples
+        num_examples = 0
+        for record in tf.python_io.tf_record_iterator(self.e2e_dataset):
+            num_examples += 1
+        print('total examples in TFRecords {}: {}'.format(self.e2e_dataset,
+                                                          num_examples))
+        # last samples (those not filling a complete batch) are discarded
+        num_batches = num_examples / self.batch_size
+
+        print('Batches per epoch: ', num_batches)
+
+        if self.load(self.save_path):
+            print('[*] Load SUCCESS')
+        else:
+            print('[!] Load failed')
+        batch_idx = 0
+        curr_epoch = 0
+        batch_timings = []
+        g_losses = []
+        try:
+            while not coord.should_stop():
+                start = timeit.default_timer()
+                if counter % config.save_freq == 0:
+                    # now G iterations
+                    _g_opt, _g_sum, \
+                    g_loss = self.sess.run([g_opt, self.g_sum,
+                                            self.g_losses[0]])
+                else:
+                    _g_opt, \
+                    g_loss = self.sess.run([g_opt, self.g_losses[0]])
+
+                end = timeit.default_timer()
+                batch_timings.append(end - start)
+                g_losses.append(g_loss)
+                print('{}/{} (epoch {}), g_loss = {:.5f},'
+                      ' time/batch = {:.5f}, '
+                      'mtime/batch = {:.5f}'.format(counter,
+                                                    config.epoch * num_batches,
+                                                    curr_epoch,
+                                                    g_loss,
+                                                    end - start,
+                                                    np.mean(batch_timings)))
+                batch_idx += num_devices
+                counter += num_devices
+                if (counter / num_devices) % config.save_freq == 0:
+                    self.save(config.save_path, counter)
+                    self.writer.add_summary(_g_sum, counter)
+                    fdict = {self.gtruth_noisy[0]:sample_noisy}
+                    canvas_w = self.sess.run(self.Gs[0],
+                                             feed_dict=fdict)
+                    swaves = sample_wav
+                    sample_dif = sample_wav - sample_noisy
+                    for m in range(min(20, canvas_w.shape[0])):
+                        print('w{} max: {} min: {}'.format(m, np.max(canvas_w[m]), np.min(canvas_w[m])))
+                        wavfile.write(os.path.join(save_path, 'sample_{}-{}.wav'.format(counter, m)), 16000, canvas_w[m])
+                        if not os.path.exists(os.path.join(save_path, 'gtruth_{}.wav'.format(m))):
+                            wavfile.write(os.path.join(save_path, 'gtruth_{}.wav'.format(m)), 16000, swaves[m])
+                            wavfile.write(os.path.join(save_path, 'noisy_{}.wav'.format(m)), 16000, sample_noisy[m])
+                            wavfile.write(os.path.join(save_path, 'dif_{}.wav'.format(m)), 16000, sample_dif[m])
+                        np.savetxt(os.path.join(save_path, 'g_losses.txt'), g_losses)
+
+                if batch_idx >= int(num_batches):
+                    curr_epoch += 1
+                    # re-set batch idx
+                    batch_idx = 0
+                if curr_epoch >= config.epoch:
+                    # done training
+                    print('Done training; epoch limit {} '
+                          'reached.'.format(self.epoch))
+                    break
+        except tf.errors.OutOfRangeError:
+            print('[!] Reached queues limits in training loop')
+        finally:
+            coord.request_stop()
+        coord.join(threads)
diff --git a/ops.py b/ops.py
index 47d276c..8ce8e67 100644
--- a/ops.py
+++ b/ops.py
@@ -29,28 +29,28 @@ def scalar_summary(name, x):
     try:
         summ = tf.summary.scalar(name, x)
     except AttributeError:
-        summ = tf.scalar_summary(name, x)
+        summ = tf.summary.scalar(name, x)
     return summ
 
 def histogram_summary(name, x):
     try:
         summ = tf.summary.histogram(name, x)
     except AttributeError:
-        summ = tf.histogram_summary(name, x)
+        summ = tf.summary.histogram(name, x)
     return summ
 
 def tensor_summary(name, x):
     try:
         summ = tf.summary.tensor_summary(name, x)
     except AttributeError:
-        summ = tf.tensor_summary(name, x)
+        summ = tf.summary.tensor_summary(name, x)
     return summ
 
 def audio_summary(name, x, sampling_rate=16e3):
     try:
         summ = tf.summary.audio(name, x, sampling_rate)
     except AttributeError:
-        summ = tf.audio_summary(name, x, sampling_rate)
+        summ = tf.summary.audio(name, x, sampling_rate)
     return summ
 
 def minmax_normalize(x, x_min, x_max, o_min=-1., o_max=1.):
@@ -89,12 +89,12 @@ def highway(input_, size, layer_size=1, bias=-2, f=tf.nn.relu, name='hw'):
     where g is nonlinearity, t is transform gate, and (1 - t) is carry gate.
     """
     output = input_
-    for idx in xrange(layer_size):
+    for idx in range(layer_size):
         lin_scope = '{}_output_lin_{}'.format(name, idx)
-        output = f(tf.nn.rnn_cell._linear(output, size, 0, scope=lin_scope))
+        output = f(tf.contrib.rnn._linear(output, size, 0, scope=lin_scope))
         transform_scope = '{}_transform_lin_{}'.format(name, idx)
         transform_gate = tf.sigmoid(
-            tf.nn.rnn_cell._linear(input_, size, 0, scope=transform_scope) + bias)
+            tf.contrib.rnn._linear(input_, size, 0, scope=transform_scope) + bias)
         carry_gate = 1. - transform_gate
 
         output = transform_gate * output + carry_gate * input_
@@ -202,7 +202,7 @@ def residual_block(input_, dilation, kwidth, num_kernels=1,
         z = tf.nn.sigmoid(z_a)
         print('gate shape: ', z.get_shape())
         # element-wise apply the gate
-        gated_h = tf.mul(z, h)
+        gated_h = tf.multiply(z, h)
         print('gated h shape: ', gated_h.get_shape())
         #make res connection
         h_ = conv1d(gated_h, kwidth=1, num_kernels=1,
@@ -243,8 +243,8 @@ def deconv(x, output_shape, kwidth=5, dilation=2, init=None, uniform=False,
         except AttributeError:
             # support for versions of TF before 0.7.0
             # based on https://github.com/carpedm20/DCGAN-tensorflow
-            deconv = tf.nn.deconv2d(x2d, W, output_shape=o2d,
-                                    strides=[1, dilation, 1, 1])
+            deconv = tf.nn.conv2d_transpose(x2d, W, output_shape=o2d,
+                                            strides=[1, dilation, 1, 1])
         if bias_init is not None:
             b = tf.get_variable('b', [out_channels],
                                 initializer=tf.constant_initializer(0.))
@@ -302,7 +302,7 @@ def average_gradients(tower_grads):
             grads.append(expanded_g)
 
         # Build the tensor and average along tower dimension
-        grad = tf.concat(0, grads)
+        grad = tf.concat(grads, 0)
         grad = tf.reduce_mean(grad, 0)
 
         # The Variables are redundant because they are shared across towers
diff --git a/requirements.txt b/requirements.txt
index 8f06ea7..01a15c7 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -1,4 +1,4 @@
 numpy==1.12.1
 scipy==0.18.1
-tensorflow_gpu==0.12.1
+tensorflow_gpu==1.1.0rc1
 toml==0.9.2
diff --git a/test_all.sh b/test_all.sh
new file mode 100644
index 0000000..5621e5e
--- /dev/null
+++ b/test_all.sh
@@ -0,0 +1,19 @@
+#!/bin/bash
+
+# Set foler pathes for noisy and enhanced files
+if [ $# -lt 2 ]; then
+    echo 'ERROR: Noisy and Ehnahced Pathes should be provided!'
+    echo "Usage: $0 <noisy_path> <enhanced_path>"
+    exit 1
+fi
+
+NOISY_PATH="$1"
+ENHANCED_PATH="$2"
+mkdir -p $ENHANCED_PATH
+
+FILES=$NOISY_PATH/*.wav
+
+for f in $FILES 
+do 
+  clean_wav.sh $f $ENHANCED_PATH
+done

From b265a7bcd24aa723a3930285fe1df6df6b9b1b9b Mon Sep 17 00:00:00 2001
From: "Kwang Myung, Jeon" <lordet01@gmail.com>
Date: Tue, 26 May 2020 11:17:43 +0900
Subject: [PATCH 2/2] env updated for wavEnv

---
 .gitignore    | 106 ++++++++------------------------------------------
 clean_wav.bat |   5 +++
 2 files changed, 22 insertions(+), 89 deletions(-)
 create mode 100644 clean_wav.bat

diff --git a/.gitignore b/.gitignore
index 72364f9..0ac96a6 100644
--- a/.gitignore
+++ b/.gitignore
@@ -1,89 +1,17 @@
-# Byte-compiled / optimized / DLL files
-__pycache__/
-*.py[cod]
-*$py.class
-
-# C extensions
-*.so
-
-# Distribution / packaging
-.Python
-env/
-build/
-develop-eggs/
-dist/
-downloads/
-eggs/
-.eggs/
-lib/
-lib64/
-parts/
-sdist/
-var/
-*.egg-info/
-.installed.cfg
-*.egg
-
-# PyInstaller
-#  Usually these files are written by a python script from a template
-#  before PyInstaller builds the exe, so as to inject date/other infos into it.
-*.manifest
-*.spec
-
-# Installer logs
-pip-log.txt
-pip-delete-this-directory.txt
-
-# Unit test / coverage reports
-htmlcov/
-.tox/
-.coverage
-.coverage.*
-.cache
-nosetests.xml
-coverage.xml
-*,cover
-.hypothesis/
-
-# Translations
-*.mo
-*.pot
-
-# Django stuff:
-*.log
-local_settings.py
-
-# Flask stuff:
-instance/
-.webassets-cache
-
-# Scrapy stuff:
-.scrapy
-
-# Sphinx documentation
-docs/_build/
-
-# PyBuilder
-target/
-
-# IPython Notebook
-.ipynb_checkpoints
-
-# pyenv
-.python-version
-
-# celery beat schedule file
-celerybeat-schedule
-
-# dotenv
-.env
-
-# virtualenv
-venv/
-ENV/
-
-# Spyder project settings
-.spyderproject
-
-# Rope project settings
-.ropeproject
+*.feat
+*.feat.pickle
+*.train
+*.eval
+*.model
+*.pyc
+*.data-00000-of-00001
+*.data-00000-of-*
+speech2vec/
+*.mat
+debug/
+*.basis
+*.activation
+*.index
+*.h5
+*.GAN
+segan_v1/
diff --git a/clean_wav.bat b/clean_wav.bat
new file mode 100644
index 0000000..5f6d78b
--- /dev/null
+++ b/clean_wav.bat
@@ -0,0 +1,5 @@
+python main.py --init_noise_std 1. --save_path segan_v1 ^
+               --batch_size 100 --g_nl prelu --weights SEGAN-72900 ^
+               --preemph 0.95 --bias_deconv True ^
+               --bias_downconv True --bias_D_conv True ^
+               --test_wav %1 --save_clean_path %2