Skip to content

Commit

Permalink
Neural networks
Browse files Browse the repository at this point in the history
  • Loading branch information
vinhkhuc committed Feb 13, 2017
1 parent 05f780e commit 48b8ec4
Show file tree
Hide file tree
Showing 2 changed files with 146 additions and 0 deletions.
71 changes: 71 additions & 0 deletions 3_neural_net.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,71 @@
import numpy as np

import torch
from torch.autograd import Variable
from torch import optim

from data_util import load_mnist


def build_model(input_dim, output_dim):
model = torch.nn.Sequential()
model.add_module("linear_1", torch.nn.Linear(input_dim, 512, bias=False))
model.add_module("sigmoid_1", torch.nn.Sigmoid())
model.add_module("linear_2", torch.nn.Linear(512, output_dim, bias=False))
model.add_module("softmax", torch.nn.Softmax())
return model


def train(model, loss, optimizer, x, y):
x = Variable(x, requires_grad=False)
y = Variable(y, requires_grad=False)

# Reset gradient
optimizer.zero_grad()

# Forward
fx = model.forward(x)
output = loss.forward(fx, y)

# Backward
output.backward()

# Update parameters
optimizer.step()

return output.data[0]


def predict(model, x):
var_x = Variable(x, requires_grad=False)
output = model.forward(var_x)
return output.data.numpy().argmax(axis=1)


def main():
torch.manual_seed(42)
trX, teX, trY, teY = load_mnist(onehot=False)
trX = torch.from_numpy(trX).float()
teX = torch.from_numpy(teX).float()
trY = torch.from_numpy(trY).long()

n_examples, n_features = trX.size()
n_classes = 10
model = build_model(n_features, n_classes)
loss = torch.nn.CrossEntropyLoss(size_average=True)
optimizer = optim.SGD(model.parameters(), lr=0.01, momentum=0.9)
batch_size = 100

for i in range(100):
cost = 0.
num_batches = n_examples / batch_size
for k in range(num_batches):
start, end = k * batch_size, (k + 1) * batch_size
cost += train(model, loss, optimizer, trX[start:end], trY[start:end])
predY = predict(model, teX)
print("Epoch %d, cost = %f, acc = %.2f%%"
% (i + 1, cost / num_batches, 100. * np.mean(predY == teY)))


if __name__ == "__main__":
main()
75 changes: 75 additions & 0 deletions 4_modern_neural_net.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,75 @@
import numpy as np

import torch
from torch.autograd import Variable
from torch import optim

from data_util import load_mnist


def build_model(input_dim, output_dim):
model = torch.nn.Sequential()
model.add_module("linear_1", torch.nn.Linear(input_dim, 512, bias=False))
model.add_module("relu_1", torch.nn.ReLU())
model.add_module("dropout_1", torch.nn.Dropout(0.2))
model.add_module("linear_2", torch.nn.Linear(512, 512, bias=False))
model.add_module("relu_2", torch.nn.ReLU())
model.add_module("dropout_2", torch.nn.Dropout(0.2))
model.add_module("linear_3", torch.nn.Linear(512, output_dim, bias=False))
model.add_module("softmax", torch.nn.Softmax())
return model


def train(model, loss, optimizer, x, y):
x = Variable(x, requires_grad=False)
y = Variable(y, requires_grad=False)

# Reset gradient
optimizer.zero_grad()

# Forward
fx = model.forward(x)
output = loss.forward(fx, y)

# Backward
output.backward()

# Update parameters
optimizer.step()

return output.data[0]


def predict(model, x):
var_x = Variable(x, requires_grad=False)
output = model.forward(var_x)
return output.data.numpy().argmax(axis=1)


def main():
torch.manual_seed(42)
trX, teX, trY, teY = load_mnist(onehot=False)
trX = torch.from_numpy(trX).float()
teX = torch.from_numpy(teX).float()
trY = torch.from_numpy(trY).long()

n_examples, n_features = trX.size()
n_classes = 10
model = build_model(n_features, n_classes)
loss = torch.nn.CrossEntropyLoss(size_average=True)
optimizer = optim.RMSprop(model.parameters(), lr=0.01)
batch_size = 100

for i in range(100):
cost = 0.
num_batches = n_examples / batch_size
for k in range(num_batches):
start, end = k * batch_size, (k + 1) * batch_size
cost += train(model, loss, optimizer, trX[start:end], trY[start:end])
predY = predict(model, teX)
print("Epoch %d, cost = %f, acc = %.2f%%"
% (i + 1, cost / num_batches, 100. * np.mean(predY == teY)))


if __name__ == "__main__":
main()

0 comments on commit 48b8ec4

Please sign in to comment.