import numpy as np
import matplotlib.pyplot as plt
from IPython.display import Image


# option 1
def AND(x1, x2):
    """Perceptron AND gate using an explicit threshold.

    Computes the weighted sum ``x1*w1 + x2*w2`` with both weights set to
    0.5 and compares it against the threshold 0.7.

    Args:
        x1: First input signal (0 or 1 in the truth table).
        x2: Second input signal (0 or 1 in the truth table).

    Returns:
        0 when the weighted sum is at or below the threshold, otherwise 1.
    """
    w1, w2, theta = 0.5, 0.5, 0.7
    weighted_sum = x1*w1 + x2*w2

    # A plain `else` ensures every input, including a NaN sum, yields an int
    # rather than an implicit None; this matches the bias-based gates, which
    # also fall through to 1 when the `<=` comparison is false.
    if weighted_sum <= theta:
        return 0
    else:
        return 1
    
# option 2
def AND(x1, x2):
    """Perceptron AND gate expressed with a weight vector and a bias.

    Args:
        x1: First input signal.
        x2: Second input signal.

    Returns:
        0 when ``sum(w * x) + b`` is at or below zero, otherwise 1.
    """
    inputs = np.array([x1, x2])
    weights = np.array([0.5, 0.5])
    bias = -0.7

    activation = np.sum(weights * inputs) + bias
    return 0 if activation <= 0 else 1

# Print the AND truth table for inputs (0,0), (0,1), (1,0), (1,1).
print(AND(0, 0), AND(0, 1), AND(1, 0), AND(1, 1))

0 0 0 1


def NAND(x1, x2):
    """Perceptron NAND gate: the AND gate with negated weights and bias.

    Args:
        x1: First input signal.
        x2: Second input signal.

    Returns:
        0 when ``sum(w * x) + b`` is at or below zero, otherwise 1.
    """
    inputs = np.array([x1, x2])
    weights = np.array([-0.5, -0.5])
    bias = 0.7
    activation = np.sum(weights * inputs) + bias
    return 0 if activation <= 0 else 1

# Print the NAND truth table for inputs (0,0), (0,1), (1,0), (1,1).
print(NAND(0, 0), NAND(0, 1), NAND(1, 0), NAND(1, 1))

1 1 1 0


def OR(x1, x2):
    """Perceptron OR gate: same weights as AND but a smaller bias magnitude.

    Args:
        x1: First input signal.
        x2: Second input signal.

    Returns:
        0 when ``sum(w * x) + b`` is at or below zero, otherwise 1.
    """
    inputs = np.array([x1, x2])
    weights = np.array([0.5, 0.5])
    bias = -0.2
    activation = np.sum(weights * inputs) + bias
    return 0 if activation <= 0 else 1

# Print the OR truth table for inputs (0,0), (0,1), (1,0), (1,1).
print(OR(0, 0), OR(0, 1), OR(1, 0), OR(1, 1))

0 1 1 1


def XOR(x1, x2):
    """XOR gate built as a two-layer combination of simpler gates.

    The first layer feeds the inputs to NAND and OR; the second layer
    combines those two intermediate signals with AND.

    Args:
        x1: First input signal.
        x2: Second input signal.

    Returns:
        The result of ``AND(NAND(x1, x2), OR(x1, x2))``.
    """
    return AND(NAND(x1, x2), OR(x1, x2))

# Print the XOR truth table for inputs (0,0), (0,1), (1,0), (1,1).
print(XOR(0, 0), XOR(0, 1), XOR(1, 0), XOR(1, 1))

0 1 1 0


def step_function(x):
    """Step activation: 1 where x is strictly positive, 0 elsewhere.

    Args:
        x: A number or NumPy array supporting ``x > 0``.

    Returns:
        An int32 NumPy array holding the element-wise result.
    """
    is_positive = np.asarray(x > 0)
    return is_positive.astype(np.int32)


# Sample the step function on [-5, 5) in steps of 0.1 and plot it.
X = np.arange(-5.0, 5.0, 0.1)
Y = step_function(X)

plt.plot(X, Y)
plt.ylim(-0.1, 1.1) # set the y-axis limits

(-0.1, 1.1)


def sigmoid(x):
    """Logistic sigmoid activation, ``1 / (1 + exp(-x))``.

    Args:
        x: A number or NumPy array.

    Returns:
        The element-wise sigmoid of x.
    """
    denominator = 1 + np.exp(-x)
    return 1 / denominator


# Sample the sigmoid on [-5, 5) in steps of 0.1 and plot it on the same
# y-range used for the step-function plot.
X = np.arange(-5.0, 5.0, 0.1)
Y = sigmoid(X)

plt.plot(X, Y)
plt.ylim(-0.1, 1.1)

(-0.1, 1.1)


def relu(x):
    """Rectified linear unit: the element-wise maximum of 0 and x.

    Args:
        x: A number or NumPy array.

    Returns:
        x with every value below zero replaced by zero.
    """
    rectified = np.maximum(0, x)
    return rectified


# Sample ReLU on [-5, 5) in steps of 0.1 and plot it; the y-range is widened
# because the output is not bounded by 1.
X = np.arange(-5.0, 5.0, 0.1)
Y = relu(X)

plt.plot(X, Y)
plt.ylim(-1.0, 6.0)

(-1.0, 6.0)


# Show the image file "fig 3-11.png" at width 400.
Image("fig 3-11.png", width=400)


# Matrix product of two 2x2 arrays using np.dot.
A = np.array([[1, 2], [3, 4]])
B = np.array([[5, 6], [7, 8]])
np.dot(A, B)

array([[19, 22],
       [43, 50]])

# The @ operator gives the same matrix product as np.dot(A, B).
A@B

array([[19, 22],
       [43, 50]])


# Show the image file "fig 3-12.png" at width 400.
Image("fig 3-12.png", width=400)


# Product of a (3, 2) and a (2, 4) array: the inner dimensions match and the
# result takes the outer dimensions, (3, 4).
A = np.array([[1, 2], [3, 4], [5, 6]])
B = np.array([[1, 2, 3, 4], [5, 6, 7, 8]])
C = np.dot(A, B)

print(C)
print(A.shape, B.shape, C.shape)

[[11 14 17 20]
 [23 30 37 44]
 [35 46 57 68]]
(3, 2) (2, 4) (3, 4)


# Show the image file "fig 3-13.png" at width 400.
Image("fig 3-13.png", width=400)


# Product of a (3, 2) array with a 1-D array of length 2: the result is a
# 1-D array of length 3.
A = np.array([[1, 2], [3, 4], [5, 6]])
B = np.array([1, 2])
C = np.dot(A, B)
print(C)
print(A.shape, B.shape, C.shape)

[ 5 11 17]
(3, 2) (2,) (3,)


# Show the image file "fig 3-14.png" at width 400.
Image("fig 3-14.png", width=400)


# A bias-free layer as a single matrix product: an input of length 2 times
# a (2, 3) weight matrix gives an output of length 3.
X = np.array([1, 2])
W = np.array([[1, 3, 5], [2, 4, 6]])
Y = np.dot(X, W)
print(Y)
print(X.shape, W.shape, Y.shape)

[ 5 11 17]
(2,) (2, 3) (3,)


# Show the image file "fig 3-17.png" at width 400.
Image("fig 3-17.png", width=400)


# Show the image file "e 3.9.png" at width 200.
Image("e 3.9.png", width=200)


# First layer: weighted sum of the 2-element input with a (2, 3) weight
# matrix, plus a 3-element bias.
X = np.array([1.0, 0.5])
W1 = np.array([[0.1, 0.3, 0.5], [0.2, 0.4, 0.6]])
B1 = np.array([0.1, 0.2, 0.3])

A1 = np.dot(X, W1) + B1
A1

array([0.3, 0.7, 1.1])


# Show the image file "fig 3-18.png" at width 400.
Image("fig 3-18.png", width=400)


# Apply the sigmoid activation to the first layer's weighted sum.
Z1 = sigmoid(A1)

Z1, Z1.shape

(array([0.57444252, 0.66818777, 0.75026011]), (3,))


# Show the image file "fig 3-19.png" at width 400.
Image("fig 3-19.png", width=400)


# Second layer: the 3 activations from layer 1 go through a (3, 2) weight
# matrix plus bias, followed by sigmoid.
W2 = np.array([[0.1, 0.4], [0.2, 0.5], [0.3, 0.6]])
B2 = np.array([0.1, 0.2])

A2 = np.dot(Z1, W2) + B2 
Z2 = sigmoid(A2)

Z2, Z2.shape

(array([0.62624937, 0.7710107 ]), (2,))


# Show the image file "fig 3-20.png" at width 400.
Image("fig 3-20.png", width=400)


def identity_function(x):
    """Return x unchanged; used here as the output-layer activation."""
    return x


# Output layer: weighted sum of the layer-2 activations passed through the
# identity function instead of sigmoid.
W3 = np.array([[0.1, 0.3], [0.2, 0.4]])
B3 = np.array([0.1, 0.2])

A3 = np.dot(Z2, W3) + B3
Y = identity_function(A3)

Y, Y.shape

(array([0.31682708, 0.69627909]), (2,))


def init_network():
    """Build the hand-written parameters of the three-layer example network.

    Returns:
        A dict with weight matrices 'W1' (2x3), 'W2' (3x2), 'W3' (2x2) and
        bias vectors 'B1' (3), 'B2' (2), 'B3' (2).
    """
    return {
        'W1': np.array([[0.1, 0.3, 0.5], [0.2, 0.4, 0.6]]),
        'W2': np.array([[0.1, 0.4], [0.2, 0.5], [0.3, 0.6]]),
        'W3': np.array([[0.1, 0.3], [0.2, 0.4]]),
        'B1': np.array([0.1, 0.2, 0.3]),
        'B2': np.array([0.1, 0.2]),
        'B3': np.array([0.1, 0.2]),
    }

def forward(network, X):
    """Propagate X through the three-layer network and return its output.

    The two hidden layers apply ``sigmoid``; the output layer applies
    ``identity_function``.

    Args:
        network: Mapping holding weights 'W1'-'W3' and biases 'B1'-'B3'.
        X: Input signal compatible with ``np.dot(X, network['W1'])``.

    Returns:
        The output-layer activation.
    """
    weights = [network[key] for key in ('W1', 'W2', 'W3')]
    biases = [network[key] for key in ('B1', 'B2', 'B3')]

    signal = X
    # Hidden layers: affine transform followed by sigmoid.
    for W, B in zip(weights[:2], biases[:2]):
        signal = sigmoid(np.dot(signal, W) + B)

    # Output layer: affine transform passed through the identity activation.
    return identity_function(np.dot(signal, weights[2]) + biases[2])


# Run the same three-layer computation end to end through forward().
network = init_network()
X = np.array([1.0, 0.5])
Y = forward(network, X)
Y

array([0.31682708, 0.69627909])


def softmax(a):
    """Softmax of ``a``, normalised along the last axis.

    A 1-D (or scalar) input is normalised over all of its elements. For an
    input with two or more dimensions (e.g. a batch of score vectors) each
    slice along the last axis is normalised independently, so every row of a
    batch sums to 1 instead of the whole batch sharing a single sum.

    Args:
        a: Scores as a NumPy array or array-like.

    Returns:
        An array of the same shape as ``a`` containing the softmax values.
    """
    a = np.asarray(a)
    # Only reduce per-row when there is a batch dimension; lower-rank inputs
    # keep the plain whole-array reduction.
    reduce_kwargs = {"axis": -1, "keepdims": True} if a.ndim >= 2 else {}

    # Subtract the maximum before exponentiating to prevent overflow.
    exp_a = np.exp(a - np.max(a, **reduce_kwargs))
    return exp_a / np.sum(exp_a, **reduce_kwargs)


# Softmax of a 3-element score vector.
a = np.array([0.3, 2.9, 4.0])

softmax(a)

array([0.01821127, 0.24519181, 0.73659691])


import pickle
from dataset.mnist import load_mnist


def get_data():
    """Load MNIST through ``load_mnist`` and return only the test split.

    ``load_mnist`` is called with ``normalize=True``, ``flatten=True`` and
    ``one_hot_label=False``; the training split it returns is discarded.

    Returns:
        A tuple ``(x_test, t_test)`` of test inputs and test labels.
    """
    (_, _), (x_test, t_test) = load_mnist(
        normalize=True,
        flatten=True,
        one_hot_label=False,
    )
    return x_test, t_test

def init_network():
    """Load the pre-trained network parameters from 'sample_weight.pkl'.

    The path is relative, so the file is looked up in the current working
    directory.

    Returns:
        The object unpickled from the file.
    """
    # NOTE: pickle.load can execute arbitrary code while deserialising;
    # only use this with a weight file from a trusted source.
    with open('sample_weight.pkl', 'rb') as weight_file:
        return pickle.load(weight_file)

def predict(network, X):
    """Run X through the three-layer network and return softmax outputs.

    The two hidden layers apply ``sigmoid``; the output layer applies
    ``softmax``.

    Args:
        network: Mapping holding weights 'W1'-'W3' and biases 'b1'-'b3'.
        X: Input compatible with ``np.dot(X, network['W1'])``.

    Returns:
        The value returned by ``softmax`` for the output layer.
    """
    weights = [network[key] for key in ('W1', 'W2', 'W3')]
    biases = [network[key] for key in ('b1', 'b2', 'b3')]

    signal = X
    # Hidden layers: affine transform followed by sigmoid.
    for W, b in zip(weights[:2], biases[:2]):
        signal = sigmoid(np.dot(signal, W) + b)

    # Output layer: affine transform turned into probabilities by softmax.
    return softmax(np.dot(signal, weights[2]) + biases[2])


# Load the MNIST test split and the pickled weights, then run the whole test
# set through the network.
x, t = get_data()
network = init_network()
# predict() must be used here: the loaded network stores its biases under
# 'b1'..'b3', while forward() looks up 'B1'..'B3' and would raise KeyError.
y = predict(network, x)


# Draw the first test sample as an image; reshape(28, -1) gives 28 rows and
# lets NumPy infer the number of columns from the flattened length.
plt.imshow(x[0].reshape(28, -1), cmap='binary')

<matplotlib.image.AxesImage at 0x1d839c44eb0>


# Print the shape of every parameter array, in sorted key order.
keys = sorted(network)
for name in keys:
    print("{} : {}".format(name, network[name].shape))

W1 : (784, 50)
W2 : (50, 100)
W3 : (100, 10)
b1 : (50,)
b2 : (100,)
b3 : (10,)


# Show the image file "fig 3-26.png" at width 400.
Image("fig 3-26.png", width=400)


# Classify the test samples one at a time and count how many predicted
# classes (index of the largest output) match the label.
accuracy_cnt = 0

for sample, label in zip(x, t):
    scores = predict(network, sample)
    if np.argmax(scores) == label:
        accuracy_cnt += 1
print("Accuracy : ", accuracy_cnt / len(x))

Accuracy :  0.9352


# Show the image file "fig 3-27.png" at width 400.
Image("fig 3-27.png", width=400)


# Same accuracy measurement, but feeding batch_size samples to predict() per
# call and taking the argmax of each row of the batched output.
accuracy_cnt = 0
batch_size = 100

for start in range(0, len(x), batch_size):
    stop = start + batch_size
    predicted = np.argmax(predict(network, x[start:stop]), axis=1)
    accuracy_cnt += np.sum(predicted == t[start:stop])
print("Accuracy : ", accuracy_cnt / len(x))

Accuracy :  0.9352

Deep Learning(0903_day1)

퍼셉트론(간단한 논리회로)

신경망

활성화 함수

신경망에서의 행렬곱

3층 신경망 구현

출력층(소프트맥스 함수)

손글씨 숫자(MNIST)

배치처리