# Untitled

#!/usr/bin/env python
# -*- coding: utf-8 -*-
from __future__ import division
import tensorflow as tf
import numpy as np
from tensorflow.examples.tutorials.mnist import input_data
from PIL import Image
from utils import tile_raster_images, scale_to_unit_interval
import math
import matplotlib.pyplot as plt


def main():
    """Train a single-layer RBM on MNIST with contrastive divergence and plot it.

    Builds a TensorFlow graph for an RBM with 784 visible and 100 hidden
    units, trains it on mini-batches of the MNIST training set, and then
    visualizes the learned weights together with reconstructions of the
    first test images.
    """
    mnist = input_data.read_data_sets("../MNIST_data/", one_hot=True)
    teX = mnist.test.images

    Nv = 784
    v_shape = (28, 28)
    Nh = 100
    h1_shape = (10, 10)

    gibbs_sampling_steps = 1
    alpha = 0.1  # learning rate

    # draw_reconstructions plots the first 20 samples, so that many test
    # images have to be pushed through the network.
    n_reconstructions = 20

    g1 = tf.Graph()
    with g1.as_default():
        X1 = tf.placeholder("float", [None, Nv])                                # X1 [batch_size x 784]
        w1 = weights([Nv, Nh])                                                  # w1 [784 x 100]
        vb1 = bias([Nv])
        hb1 = bias([Nh])

        # Hidden activations must be conditioned on the data, p(h=1 | v=X1);
        # sampling them from unrelated noise would decouple the positive
        # phase (and the reconstructions) from the input.
        h0_prob = tf.sigmoid(tf.matmul(X1, w1) + hb1)                           # h0 [batch_size x 100]
        h0 = sample_prob(h0_prob)
        h1 = h0                                                                 # h1 [batch_size x 100]

        # Gibbs chain: alternate visible <- hidden and hidden <- visible.
        for _ in range(gibbs_sampling_steps):
            v1_prob = tf.sigmoid(tf.matmul(h1, tf.transpose(w1)) + vb1)         # v1 [batch_size x 784]
            v1 = sample_prob(v1_prob)

            h1_prob = tf.sigmoid(tf.matmul(v1, w1) + hb1)                       # h1 [batch_size x 100]
            h1 = sample_prob(h1_prob)

        # Only the state at the end of the chain enters the gradient, so the
        # statistics are computed once, after the loop.
        # positive phase
        w1_positive_grad = tf.matmul(tf.transpose(X1), h0)                      # [784, 100]
        # negative phase
        w1_negative_grad = tf.matmul(tf.transpose(v1_prob), h1)                 # [784, 100]

        dw1 = (w1_positive_grad - w1_negative_grad) / tf.to_float(tf.shape(X1)[0])

        # parameter update ops - running these is what trains the RBM
        update_w1 = tf.assign_add(w1, alpha * dw1)
        update_vb1 = tf.assign_add(vb1, alpha * tf.reduce_mean(X1 - v1_prob, 0))
        update_hb1 = tf.assign_add(hb1, alpha * tf.reduce_mean(h0 - h1, 0))

        out1 = (update_w1, update_vb1, update_hb1)

        # reconstruction of the input vector - uses the probability p(v=1)
        v1_prob = tf.sigmoid(tf.matmul(h1, tf.transpose(w1)) + vb1)

        err1 = X1 - v1_prob
        err_sum1 = tf.reduce_mean(err1 * err1)

        initialize1 = tf.initialize_all_variables()

    batch_size = 100
    epochs = 100
    n_samples = mnist.train.num_examples

    total_batch = (n_samples // batch_size) * epochs
    # Report roughly ten times per run; clamp to 1 so that a very short run
    # cannot produce a modulo-by-zero.
    report_every = max(1, total_batch // 10)

    with tf.Session(graph=g1) as sess:
        sess.run(initialize1)
        for i in range(total_batch):
            batch, _ = mnist.train.next_batch(batch_size)
            err, _ = sess.run([err_sum1, out1], feed_dict={X1: batch})

            if i % report_every == 0:
                # Single pre-formatted argument: prints the same text under
                # both the Python 2 print statement and the Python 3 function.
                print("%d %s" % (i, err))

        w1s = w1.eval()
        vr, h1s = sess.run([v1_prob, h1],
                           feed_dict={X1: teX[0:n_reconstructions, :]})

    # weight visualization
    draw_weights(w1s, v_shape, Nh)

    # visualization of reconstructions and hidden states
    draw_reconstructions(teX, vr, h1s, v_shape, h1_shape, Nh)

    # Without this the figures are never displayed when run as a script.
    plt.show()


def weights(shape):
    """Create a weight variable of the given shape.

    The variable is initialized from a truncated normal distribution with
    standard deviation 0.1.
    """
    return tf.Variable(tf.truncated_normal(shape, stddev=0.1))


def bias(shape):
    """Create a float32 bias variable of the given shape, initialized to zeros."""
    zeros = tf.zeros(shape, dtype=tf.float32)
    bias_var = tf.Variable(zeros)
    return bias_var


def sample_prob(probs):
    """Sample a vector x according to the probability vector p(x=1) = probs."""
    noise = tf.random_uniform(tf.shape(probs))
    # sign() gives +1 where probs exceeds the uniform noise and -1 (or 0)
    # otherwise; relu then clamps the non-positive cases to 0.
    above_noise = tf.sign(probs - noise)
    return tf.nn.relu(above_noise)


def draw_weights(W, shape, N, interpolation="bilinear"):
    """Visualize the weights as a grid of image tiles.

    W -- weight vectors
    shape -- tuple with the dimensions for the 2D display of each weight
             vector - usually the input image dimensions, e.g. (28,28)
    N -- number of weight vectors
    interpolation -- interpolation mode passed on to plt.imshow
    """
    tiles_per_row = 20
    # Enough rows to fit N tiles at 20 per row.
    n_tile_rows = int(math.ceil(N / tiles_per_row))

    tiled = tile_raster_images(
        X=W.T,
        img_shape=shape,
        tile_shape=(n_tile_rows, tiles_per_row),
        tile_spacing=(1, 1))
    image = Image.fromarray(tiled)

    plt.figure(figsize=(10, 14))
    plt.imshow(image, interpolation=interpolation)


def draw_reconstructions(ins, outs, states, shape_in, shape_state, Nh):
    """Visualize inputs with their reconstructions and hidden-layer states.

    Plots one row per sample (at most 20): the input, its reconstruction and
    the hidden state, each reshaped to a 2D image. Only as many rows are
    drawn as all three arrays provide; nothing is drawn if any is empty.

    ins -- input vectors
    outs -- reconstructed vectors
    states -- hidden-layer state vectors
    shape_in -- dimensions of the input images, e.g. (28,28)
    shape_state -- dimensions for the 2D display of the states
                   (e.g. (10,10) for 100 states)
    Nh -- number of leading state values to display per sample
    """
    max_rows = 20
    # Never index past the shortest of the three arrays.
    n_rows = min(max_rows, len(ins), len(outs), len(states))
    if n_rows == 0:
        return

    # Number of values that make up one input image (784 for (28,28)).
    n_pixels = int(np.prod(shape_in))

    # Keep the per-row height of the full 20-row layout (8 x 48 inches).
    plt.figure(figsize=(8, 12 * 4 * n_rows / float(max_rows)))
    for i in range(n_rows):
        plt.subplot(n_rows, 4, 4 * i + 1)
        plt.imshow(ins[i].reshape(shape_in), vmin=0,
                   vmax=1, interpolation="nearest")
        plt.title("Test input")

        plt.subplot(n_rows, 4, 4 * i + 2)
        plt.imshow(outs[i][0:n_pixels].reshape(shape_in),
                   vmin=0, vmax=1, interpolation="nearest")
        plt.title("Reconstruction")

        plt.subplot(n_rows, 4, 4 * i + 3)
        plt.imshow(states[i][0:Nh].reshape(shape_state),
                   vmin=0, vmax=1, interpolation="nearest")
        plt.title("States")
    plt.tight_layout()


# Run the training and visualization only when executed as a script,
# not when this module is imported.
if __name__ == '__main__':
    main()