Untitled

From Cute Tapir, 4 Years ago, written in Python.

Embed

Download Paste or View Raw
Hits: 90

import numpy as np

from scipy.special import expit

import sys

import struct

import os

class NeuralNetMLP(object):

def __init__(self, n_output, n_features, n_hidden=30

, l1=0.0, l2=0.0, epochs=500, eta=0.001,

alpha=0.0, decrease_const=0.0, shuffle=True,

minibatches=1, random_state=None):

np.random.seed(random_state)

self.n_output = n_output

self.n_features = n_features

self.n_hidden = n_hidden

self.w1, self.w2, = self._initialize_weights()

self.l1 = l1

self.l2 = l2

self.epochs = epochs

self.eta = eta

self.alpha = alpha

self.decrease_const = decrease_const

self.shuffle = shuffle

self.minibatches = minibatches

def _encode_labels(selfself, y, k):

onehot = np.zeros((k, y.shape[0]))

for idx, val in enumerate(y):

onehot[val, idx] = 1.0

return onehot

def _initialize_weights(self):

w1 = np.random.uniform(-1.0, 1.0,

size=self.n_hidden * (self.n_features + 1))

w1 = w1.reshape(self.n_hidden, self.n_features + 1)

w2 = np.random.uniform(-1.0, 1.0,

size=self.n_output * (self.n_hidden + 1))

w2 = w2.reshape(self.n_output, self.n_hidden + 1)

return w1, w2

def _sigmoid(self, z):

return expit(z)

def _sigmoid_gradient(self, z):

sg = self._sigmoid(z)

return sg * (1 - sg)

def _add_bias_unit(self, x, how='column'):

if how == 'column':

x_new = np.ones((x.shape[0], x.shape[1]+1))

x_new[:, 1:] = x

elif how == 'row':

x_new = np.ones((x.shape[0] + 1, x.shape[1]))

x_new[1:, :] = x

else:

raise AttributeError('Atrybut how musi miec wartosc column lub row')

return x_new

def _feedforward(self, X, w1, w2):

a1 = self._add_bias_unit(X, how='column')

z2 = w1.dot(a1.T)

a2 = self._sigmoid(z2)

a2 = self._add_bias_unit(a2, how='row')

z3 = w2.dot(a2)

a3 = self._sigmoid(z3)

return a1, z2, a2, z3, a3

def _L2_reg(self, lambda_, w1, w2):

return (lambda_ / 2.0) * (np.sum(w1[:, 1:] ** 2) + np.sum(w2[:, 1:]))

def _L1_reg(self, lambda_, w1, w2):

return (lambda_ / 2.0) * (np.abs(w1[:, 1:].sum() ** 2) + np.abs(w2[:, 1:]).sum())

def _get_cost(self, y_enc, output, w1, w2):

term1 = -y_enc * (np.log(output))

term2 = (1-y_enc) * np.log(1-output)

cost = np.sum(term1-term2)

L1_term = self._L1_reg(self.l1, w1, w2)

L2_term = self._L2_reg(self.l2, w1, w2)

cost = cost + L1_term + L2_term

return cost

def _get_gradient(self, a1, a2, a3, z2, y_enc, w1, w2):

sigma3 = a3 - y_enc

z2 = self._add_bias_unit(z2, how='row')

sigma2 = w2.T.dot(sigma3) * self._sigmoid_gradient(z2)

sigma2 = sigma2[1:, :]

grad1 = sigma2.dot(a1)

grad2 = sigma3.dot(a2.T)

grad1[:, 1:] += self.l2 * w1[:, 1:]

grad1[:, 1:] += self.l1 * np.sign(w1[:, 1:])

grad2[:, 1:] += self.l2 * w2[:, 1:]

grad2[:, 1:] += self.l1 * np.sign(w2[:, 1:])

return grad1, grad2

def predict(self, X):

a1, z2, a2, z3, a3 = self._feedforward(X, self.w1, self.w2)

y_pred = np.argmax(z3, axis=0)

return y_pred

def fit(self, X, y, print_progress = False):

self.cost_ = []

X_data, y_data = X.copy(), y.copy()

y_enc = self._encode_labels(y, self.n_output)

delta_w1_prev = np.zeros(self.w1.shape)

delta_w2_prev = np.zeros(self.w2.shape)

for i in range(self.epochs):

self.eta /= (1+self.decrease_const*i)

if print_progress:

sys.stderr.write('\rEpoka: %d/%d' % (i+1, self.epochs))

sys.stderr.flush()

if self.shuffle:

idx = np.random.permutation(y_data.shape[0])

X_data, y_enc = X_data[idx], y_enc[:,idx]

mini = np.array_split(range(y_data.shape[0]), self.minibatches)

for idx in mini:

a1, z2, a2, z3, a3 = self._feedforward(X_data[idx], self.w1, self.w2)

cost = self._get_cost(y_enc=y_enc[:, idx],

output=a3,

w1 = self.w1,

w2 = self.w2)

self.cost_.append(cost)

grad1, grad2 = self._get_gradient(a1=a1, a2=a2, a3=a3,z2=z2, y_enc=y_enc[:, idx], w1=self.w1, w2=self.w2)

delta_w1, delta_w2 = self.eta * grad1, self.eta*grad2

self.w1 -=(delta_w1+(self.alpha * delta_w1_prev))

self.w2 -= (delta_w2 + (self.alpha * delta_w2_prev))

delta_w1_prev, delta_w2_prev = delta_w1, delta_w2

return self

def load_mnist(path, kind='train'):

labels_path = os.path.join(path, '%s-labels.idx1-ubyte' % kind)

images_path = os.path.join(path, '%s-images.idx3-ubyte' % kind)

with open(labels_path, 'rb') as lbpath:

magic, n = struct.unpack('>II', lbpath.read(8))

labels = np.fromfile(lbpath, dtype=np.uint8)

with open(images_path, 'rb') as imgpath:

magic, num, rows, cols = struct.unpack(">IIII", imgpath.read(16))

images = np.fromfile(imgpath, dtype=np.uint8).reshape(len(labels), 784)

return images, labels

if __name__ == "__main__":

X_train, y_train = load_mnist(r'C:\Users\domin\Desktop\Python\mnist', kind='train')

X_test, y_test = load_mnist(r'C:\Users\domin\Desktop\Python\mnist', kind='t10k')

nn = NeuralNetMLP(n_output=10,

n_features=X_train.shape[1],

n_hidden=50,

l2=0.1,

l1=0.0,

epochs=1000,

eta=0.001,

alpha=0.001,

decrease_const=0.00001,

shuffle=True,

minibatches=50,

random_state=1)

nn.fit(X_train, y_train, print_progress=True)

Author

Title

Language

Your paste - Paste your paste here

import numpy as np
from scipy.special import expit
import sys
import struct
import os

class NeuralNetMLP(object):
    def __init__(self, n_output, n_features, n_hidden=30
                 , l1=0.0, l2=0.0, epochs=500, eta=0.001,
                 alpha=0.0, decrease_const=0.0, shuffle=True,
                 minibatches=1, random_state=None):
        np.random.seed(random_state)
        self.n_output = n_output
        self.n_features = n_features
        self.n_hidden = n_hidden
        self.w1, self.w2, = self._initialize_weights()
        self.l1 = l1
        self.l2 = l2
        self.epochs = epochs
        self.eta = eta
        self.alpha = alpha
        self.decrease_const = decrease_const
        self.shuffle = shuffle
        self.minibatches = minibatches

def _encode_labels(selfself, y, k):
        onehot = np.zeros((k, y.shape[0]))
        for idx, val in enumerate(y):
            onehot[val, idx] = 1.0
        return onehot

def _initialize_weights(self):
        w1 = np.random.uniform(-1.0, 1.0,
                               size=self.n_hidden * (self.n_features + 1))
        w1 = w1.reshape(self.n_hidden, self.n_features + 1)
        w2 = np.random.uniform(-1.0, 1.0,
                               size=self.n_output * (self.n_hidden + 1))
        w2 = w2.reshape(self.n_output, self.n_hidden + 1)
        return w1, w2

def _sigmoid(self, z):
        return expit(z)

def _sigmoid_gradient(self, z):
        sg = self._sigmoid(z)
        return sg * (1 - sg)

def _add_bias_unit(self, x, how='column'):
        if how == 'column':
            x_new = np.ones((x.shape[0], x.shape[1]+1))
            x_new[:, 1:] = x
        elif how == 'row':
            x_new = np.ones((x.shape[0] + 1, x.shape[1]))
            x_new[1:, :] = x
        else:
            raise AttributeError('Atrybut how musi miec wartosc column lub row')
        return x_new

def _feedforward(self, X, w1, w2):
        a1 = self._add_bias_unit(X, how='column')
        z2 = w1.dot(a1.T)
        a2 = self._sigmoid(z2)
        a2 = self._add_bias_unit(a2, how='row')
        z3 = w2.dot(a2)
        a3 = self._sigmoid(z3)
        return a1, z2, a2, z3, a3

def _L2_reg(self, lambda_, w1, w2):
        return (lambda_ / 2.0) * (np.sum(w1[:, 1:] ** 2) + np.sum(w2[:, 1:]))

def _L1_reg(self, lambda_, w1, w2):
        return (lambda_ / 2.0) * (np.abs(w1[:, 1:].sum() ** 2) + np.abs(w2[:, 1:]).sum())

def _get_cost(self, y_enc, output, w1, w2):
        term1 = -y_enc * (np.log(output))
        term2 = (1-y_enc) * np.log(1-output)
        cost = np.sum(term1-term2)
        L1_term = self._L1_reg(self.l1, w1, w2)
        L2_term = self._L2_reg(self.l2, w1, w2)
        cost = cost + L1_term + L2_term
        return cost

def _get_gradient(self, a1, a2, a3, z2, y_enc, w1, w2):
        sigma3 = a3 - y_enc
        z2 = self._add_bias_unit(z2, how='row')
        sigma2 = w2.T.dot(sigma3) * self._sigmoid_gradient(z2)
        sigma2 = sigma2[1:, :]
        grad1 = sigma2.dot(a1)
        grad2 = sigma3.dot(a2.T)

grad1[:, 1:] += self.l2 * w1[:, 1:]
        grad1[:, 1:] += self.l1 * np.sign(w1[:, 1:])
        grad2[:, 1:] += self.l2 * w2[:, 1:]
        grad2[:, 1:] += self.l1 * np.sign(w2[:, 1:])

return  grad1, grad2

def predict(self, X):
        a1, z2, a2, z3, a3 = self._feedforward(X, self.w1, self.w2)
        y_pred = np.argmax(z3, axis=0)
        return y_pred

def fit(self, X, y, print_progress = False):
        self.cost_ = []
        X_data, y_data = X.copy(), y.copy()
        y_enc = self._encode_labels(y, self.n_output)

delta_w1_prev = np.zeros(self.w1.shape)
        delta_w2_prev = np.zeros(self.w2.shape)

for i in range(self.epochs):

self.eta /= (1+self.decrease_const*i)

if print_progress:
                sys.stderr.write('\rEpoka: %d/%d' % (i+1, self.epochs))
                sys.stderr.flush()

if self.shuffle:
                idx = np.random.permutation(y_data.shape[0])
                X_data, y_enc = X_data[idx], y_enc[:,idx]

mini = np.array_split(range(y_data.shape[0]), self.minibatches)
            for idx in mini:
                a1, z2, a2, z3, a3 = self._feedforward(X_data[idx], self.w1, self.w2)
                cost = self._get_cost(y_enc=y_enc[:, idx],
                                      output=a3,
                                      w1 = self.w1,
                                      w2 = self.w2)
                self.cost_.append(cost)

grad1, grad2 = self._get_gradient(a1=a1, a2=a2, a3=a3,z2=z2, y_enc=y_enc[:, idx], w1=self.w1, w2=self.w2)

delta_w1, delta_w2 = self.eta * grad1, self.eta*grad2
                self.w1 -=(delta_w1+(self.alpha * delta_w1_prev))
                self.w2 -= (delta_w2 + (self.alpha * delta_w2_prev))
                delta_w1_prev, delta_w2_prev = delta_w1, delta_w2

return self

def load_mnist(path, kind='train'):
    labels_path = os.path.join(path, '%s-labels.idx1-ubyte' % kind)
    images_path = os.path.join(path, '%s-images.idx3-ubyte' % kind)

with open(labels_path, 'rb') as lbpath:
        magic, n = struct.unpack('&gt;II', lbpath.read(8))
        labels = np.fromfile(lbpath, dtype=np.uint8)

with open(images_path, 'rb') as imgpath:
        magic, num, rows, cols = struct.unpack(&quot;&gt;IIII&quot;, imgpath.read(16))
        images = np.fromfile(imgpath, dtype=np.uint8).reshape(len(labels), 784)

return images, labels

if __name__ == &quot;__main__&quot;:

X_train, y_train = load_mnist(r'C:\Users\domin\Desktop\Python\mnist', kind='train')
    X_test, y_test =  load_mnist(r'C:\Users\domin\Desktop\Python\mnist', kind='t10k')

nn = NeuralNetMLP(n_output=10,
                      n_features=X_train.shape[1],
                      n_hidden=50,
                      l2=0.1,
                      l1=0.0,
                      epochs=1000,
                      eta=0.001,
                      alpha=0.001,
                      decrease_const=0.00001,
                      shuffle=True,
                      minibatches=50,
                      random_state=1)
    nn.fit(X_train, y_train, print_progress=True)

Private - Private paste aren't shown in recent listings.

Delete After - When should we delete your paste?

Spam protection -

Reply to "Untitled"