comparative examples

parent c1ed3e477e
commit 8205402b66

examples/flux.jl (new file, 92 lines)
@@ -0,0 +1,92 @@

using Flux

# ––––––––––––––––––––––––––––––––––––––––––––––––––––––– #
# Logistic Regression from scratch #
# ––––––––––––––––––––––––––––––––––––––––––––––––––––––– #

W = param(zeros(10,784))
b = param(zeros(10))

pred(x) = softmax(W*x .+ b)

# Cross-entropy cost (note the minus sign, as in the TensorFlow version)
cost(x, y) = -mean(sum(log.(pred(x)).*y, 1))

# See an example prediction
pred(rand(784))
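
# Hypothetical usage sketch (not part of the original commit): evaluate the
# cost on a random batch of 100 examples; rand(10, 100) stands in for
# one-hot targets purely for illustration.
cost(rand(784, 100), rand(10, 100))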

# ––––––––––––––––––––––––––––––––––––––––––––––––––––––– #
# Custom Layer: Dense #
# ––––––––––––––––––––––––––––––––––––––––––––––––––––––– #

struct Dense
  σ
  W
  b
end

function Dense(in::Integer, out::Integer, σ = σ)
  W = param(randn(out, in))
  b = param(zeros(out))
  return Dense(σ, W, b)
end

# Note that Julia compiles:
# * Specialised code for the forward pass (wrt activation function,
#   number types, ...)
# * Including a single GPU/CPU kernel for the broadcast call
function (m::Dense)(x)
  σ, W, b = m.σ, m.W, m.b
  σ.(W*x .+ b)
end

d = Dense(10, 5, relu)
d(rand(10))
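
# Hypothetical follow-up (not in the original file): because each Dense is
# just a callable struct, layers compose with plain function application.
d1 = Dense(10, 5, relu)
d2 = Dense(5, 2)
d2(d1(rand(10)))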

# ––––––––––––––––––––––––––––––––––––––––––––––––––––––– #
# RNN from scratch #
# ––––––––––––––––––––––––––––––––––––––––––––––––––––––– #

in = 10
out = 5

Wi = param(randn(out, in))
Wh = param(randn(out, out))
b = param(zeros(out))

function rnn(h, x)
  h = tanh.(Wi*x .+ Wh*h .+ b)
  return h, h
end

h = rand(out)
xs = [rand(in) for i = 1:13] # Sequence of length 13
ys = []

for x in xs
  h, y = rnn(h, x)
  push!(ys, y)
end

# Output hidden state and sequence
h, ys

# ––––––––––––––––––––––––––––––––––––––––––––––––––––––– #
# Recursive Net #
# ––––––––––––––––––––––––––––––––––––––––––––––––––––––– #

N = 10

# Generate dummy data
tree() = rand() < 0.5 ? rand(N) : (tree(), tree())

# Model

shrink = Dense(2N, N)
combine(a, b) = shrink([a; b])

model(x) = x
model(x::Tuple) = combine(model(x[1]), model(x[2]))

# The model is able to compress an arbitrary tree into
# a single length N representation.
model(tree())

examples/pytorch.py (new file, 73 lines)
@@ -0,0 +1,73 @@

import torch
from torch.autograd import Variable
from torch import nn
from torch.nn import Parameter
from torch.nn.functional import softmax

# ------------------------------------------------------- #
# Logistic Regression from scratch #
# ------------------------------------------------------- #

W = Variable(torch.zeros(784, 10))
b = Variable(torch.zeros(1, 10))

def pred(x):
    return softmax(torch.matmul(x, W) + b)

# Cross-entropy cost (note the minus sign, as in the TensorFlow version)
def cost(x, y):
    return -(pred(x).log() * y).sum(1).mean()

# See an example prediction
pred(Variable(torch.rand(1,784), requires_grad = False))
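
# Hypothetical usage sketch (not part of the original file): evaluate the cost
# on a random batch of 100 examples with random stand-in targets.
cost(Variable(torch.rand(100, 784), requires_grad = False),
     Variable(torch.rand(100, 10), requires_grad = False))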

# ------------------------------------------------------- #
# Custom Layer: Dense #
# ------------------------------------------------------- #

class Dense(nn.Module):
    def __init__(self, input, out, act = torch.nn.functional.sigmoid):
        super(Dense, self).__init__()
        self.act = act
        self.W = Parameter(torch.randn(input, out))
        self.b = Parameter(torch.randn(1, out))

    def forward(self, x):
        return self.act(torch.matmul(x, self.W) + self.b)

d = Dense(10, 5, torch.nn.functional.relu)
x = Variable(torch.rand(1, 10), requires_grad = False)
d(x)
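
# Hypothetical follow-up (not in the original file): the custom layer is a
# regular nn.Module, so it stacks with nn.Sequential like any built-in layer.
model = nn.Sequential(Dense(10, 5, torch.nn.functional.relu), Dense(5, 2))
model(x)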

# ------------------------------------------------------- #
# RNN from scratch #
# ------------------------------------------------------- #

class RNN(nn.Module):
    def __init__(self, input, out):
        super(RNN, self).__init__()
        self.Wi = Parameter(torch.randn(input, out))
        self.Wh = Parameter(torch.randn(out, out))
        self.b = Parameter(torch.randn(1, out))

    def forward(self, h, x):
        Wi, Wh, b = self.Wi, self.Wh, self.b
        h = (torch.matmul(x, Wi) + torch.matmul(h, Wh) + b).tanh()
        return (h, h)

rnn = RNN(10, 5)
h = Variable(torch.rand(1, 5), requires_grad = False)
xs = [Variable(torch.rand(1, 10), requires_grad = False) for _ in range(10)]
ys = []

for x in xs:
    (h, y) = rnn(h, x)
    ys.append(y)

# Output hidden state and sequence
h, ys

# ------------------------------------------------------- #
# Recursive Net #
# ------------------------------------------------------- #

# TODO: similar to Julia
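
# A minimal sketch of how it could look, mirroring the Julia version above
# (an assumption added for illustration, not part of the original commit):

import random

N = 10

# Generate dummy data: a leaf is a random vector, otherwise a pair of subtrees
def tree():
    return Variable(torch.rand(1, N)) if random.random() < 0.5 else (tree(), tree())

# Model: shrink a concatenated pair back down to a length-N representation
shrink = Dense(2 * N, N)

def combine(a, b):
    return shrink(torch.cat([a, b], 1))

def model(x):
    return combine(model(x[0]), model(x[1])) if isinstance(x, tuple) else x

# Compress an arbitrary tree into a single length-N representation
model(tree())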

examples/tf.py (new file, 87 lines)
@@ -0,0 +1,87 @@

import tensorflow as tf
import numpy as np

# ------------------------------------------------------- #
# Logistic Regression from scratch #
# ------------------------------------------------------- #

sess = tf.Session()

x = tf.placeholder(tf.float32, [None, 784]) # mnist data image of shape 28*28=784
y = tf.placeholder(tf.float32, [None, 10])  # 0-9 digits recognition => 10 classes

W = tf.Variable(tf.zeros([784, 10]))
b = tf.Variable(tf.zeros([10]))

pred = tf.nn.softmax(tf.matmul(x, W) + b)

cost = tf.reduce_mean(-tf.reduce_sum(y*tf.log(pred), reduction_indices=1))

init = tf.global_variables_initializer()
sess.run(init)

# See an example prediction
sess.run(pred, feed_dict = {x: np.random.rand(1,784)})
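
# Hypothetical usage sketch (not part of the original file): evaluate the cost
# on a random batch of 100 examples with random stand-in targets.
sess.run(cost, feed_dict = {x: np.random.rand(100, 784), y: np.random.rand(100, 10)})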

sess.close()

# ------------------------------------------------------- #
# Custom Layer: Dense #
# ------------------------------------------------------- #

def dense_layer(x, input, out, act = tf.sigmoid):
    W = tf.get_variable("weights", [input, out],
                        initializer=tf.random_normal_initializer())
    b = tf.get_variable("bias", [1, out],
                        initializer=tf.random_normal_initializer())
    return act(tf.matmul(x, W) + b)

sess = tf.Session()

x = tf.placeholder(tf.float32, [None, 10])

with tf.variable_scope("layer1"):
    y = dense_layer(x, 10, 5)
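
# Hypothetical second layer (not part of the original file): each layer gets its
# own variable scope, otherwise the get_variable("weights"/"bias") names would collide.
with tf.variable_scope("layer2"):
    y2 = dense_layer(y, 5, 2)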

init = tf.global_variables_initializer()
sess.run(init)
sess.run(y, feed_dict = {x: np.random.rand(1,10)})

sess.close()

# ------------------------------------------------------- #
# RNN from scratch #
# ------------------------------------------------------- #

input = 10
hidden = 5
length = 13

def step(hprev, x):
    # params
    Wi = tf.get_variable('W', shape=[input, hidden], initializer=tf.random_normal_initializer())
    Wh = tf.get_variable('U', shape=[hidden, hidden], initializer=tf.random_normal_initializer())
    b = tf.get_variable('b', shape=[hidden], initializer=tf.constant_initializer(0.))
    # current hidden state
    h = tf.tanh(tf.matmul(hprev, Wh) + tf.matmul(x,Wi) + b)
    return h

sess = tf.Session()

# (seqlength, batch, features)
xs = tf.placeholder(tf.float32, [length, 1, input])
h = tf.placeholder(tf.float32, [None, hidden])

states = tf.scan(step, xs, initializer=h)

init = tf.global_variables_initializer()
sess.run(init)
sess.run(states, feed_dict = {xs: np.random.rand(length,1,input), h: np.random.randn(1,hidden)})

sess.close()

# ------------------------------------------------------- #
# Recursive Net #
# ------------------------------------------------------- #

# Too long to repeat here, see https://github.com/erickrf/treernn