from IPython.display import Image 
# Load the activation-function diagram from the local Pictures directory.
# NOTE(review): as a bare expression this is presumably only rendered when it
# is the last statement of a notebook cell - confirm if run as a script.
Image("Pictures/activation.png")


import numpy as np
import matplotlib.pyplot as plt


# Compare every element against zero to obtain a boolean mask, then show the
# same mask converted to 0/1 integers.
x = np.array([-1.0, 1.0, 2.0])
y = np.greater(x, 0)
print(y)  # boolean dtype
print(y.astype(np.int32))  # same mask converted to an integer dtype

[False  True  True]
[0 1 1]


def step_function(x):
    """Return 1 where ``x`` is strictly greater than zero and 0 elsewhere.

    Args:
        x: A NumPy array or scalar that supports ``x > 0``.

    Returns:
        A NumPy array of dtype ``int32`` holding the 0/1 step values.
    """
    is_positive = x > 0
    return np.array(is_positive, dtype=np.int32)


# Plot the step function over [-5, 5), sampled every 0.1.
x = np.arange(-5.0, 5.0, 0.1)
y = step_function(x)
plt.plot(x, y)
plt.ylim(-0.1, 1.1)  # y-axis range, padded slightly beyond the 0..1 outputs
plt.title('Step function Graph')
plt.show()


def sigmoid(x):
    """Return the logistic sigmoid ``1 / (1 + exp(-x))`` of ``x``.

    Args:
        x: A NumPy array or scalar; the function is applied element-wise.

    Returns:
        The sigmoid of ``x``, with the same shape as the input.
    """
    denominator = 1 + np.exp(-x)
    return 1 / denominator


# Evaluate the sigmoid on a small sample array. The bare expression on the
# last line only shows its value in an interactive session or notebook cell.
x = np.array([-1.0, 1.0, 2.0])
sigmoid(x)

array([0.26894142, 0.73105858, 0.88079708])


# Plot the sigmoid curve over [-5, 5), sampled every 0.1.
x = np.arange(-5.0, 5.0, 0.1)
y = sigmoid(x)
plt.plot(x, y)
plt.ylim(-0.1, 1.1)  # y-axis range
plt.title('Sigmoid Function Graph')
plt.show()


def relu(x):
    """Return the rectified linear unit of ``x``: the element-wise max of 0 and ``x``.

    Args:
        x: A NumPy array or scalar.

    Returns:
        ``x`` with every value below zero replaced by zero.
    """
    lower_bound = 0
    return np.maximum(lower_bound, x)


# Plot the ReLU curve over [-5, 5), sampled every 0.1.
x = np.arange(-5.0, 5.0, 0.1)
y = relu(x)
plt.plot(x, y)
plt.ylim(-0.2, 5.0)  # y-axis range
plt.title('Relu Function Graph')
plt.show()


def identity_function(x):
    """Identity function: hand the input back unchanged.

    Args:
        x: Any value.

    Returns:
        The very same object that was passed in.
    """
    result = x
    return result


def init_network():
    """Create the fixed weights and biases of the example network.

    Returns:
        dict: A new dictionary mapping ``'W1'``, ``'b1'``, ``'W2'``, ``'b2'``,
        ``'W3'`` and ``'b3'`` to NumPy arrays. The weight matrices have
        shapes (2, 3), (3, 2) and (2, 2); the bias vectors have lengths
        3, 2 and 2.
    """
    return {
        'W1': np.array([[0.1, 0.3, 0.5], [0.2, 0.4, 0.6]]),
        'b1': np.array([0.1, 0.2, 0.3]),
        'W2': np.array([[0.1, 0.4], [0.2, 0.5], [0.3, 0.6]]),
        'b2': np.array([0.1, 0.2]),
        'W3': np.array([[0.1, 0.3], [0.2, 0.4]]),
        'b3': np.array([0.1, 0.2]),
    }

def forward(network, x):
    """Forward propagation: turn the input ``x`` into the network output.

    The first two layers apply ``sigmoid`` to their affine result; the third
    layer passes its affine result through ``identity_function``.

    Args:
        network: Dictionary holding the entries ``'W1'``..``'W3'`` and
            ``'b1'``..``'b3'``.
        x: Input array that is multiplied with ``network['W1']``.

    Returns:
        The output of the third layer.
    """
    weights = [network[key] for key in ('W1', 'W2', 'W3')]
    biases = [network[key] for key in ('b1', 'b2', 'b3')]
    *hidden_layers, (out_weight, out_bias) = zip(weights, biases)

    signal = x
    for weight, bias in hidden_layers:
        signal = sigmoid(np.dot(signal, weight) + bias)

    return identity_function(np.dot(signal, out_weight) + out_bias)

# Run one forward pass of the example network on a two-element input.
network = init_network()
x = np.array([1.0, 0.5])
y = forward(network, x)
y  # bare expression: shows the result in an interactive session

array([0.31682708, 0.69627909])


def softmax(a):
    """Return the softmax of ``a`` using the direct textbook formula.

    Every value is exponentiated and divided by the sum of all exponentials.
    No shift is applied first, so ``np.exp`` can overflow for large inputs.

    Args:
        a: Array of scores; all elements are normalized together.

    Returns:
        The exponentials of ``a`` divided by their total.
    """
    exponentials = np.exp(a)
    return exponentials / np.sum(exponentials)


# Demonstrate the shift trick: subtracting the maximum before exponentiating
# makes every exponent zero or negative, as the printed a-c shows.
a = np.array([1010, 1000, 990])
# np.exp(a)/np.sum(np.exp(a)) # does not compute properly.
c = np.max(a)
print(a-c)
np.exp(a-c)/np.sum(np.exp(a-c))

[  0 -10 -20]

array([9.99954600e-01, 4.53978686e-05, 2.06106005e-09])


def softmax(a):
    """Return the softmax of ``a``, computed in an overflow-safe way.

    The maximum of ``a`` is subtracted before exponentiating. Softmax does
    not change when the same constant is added to every input, so the result
    equals the direct formula, but the largest exponent becomes 0 and
    ``np.exp`` cannot overflow.

    Args:
        a: Array of scores; all elements are normalized together.

    Returns:
        Array with the same shape as ``a`` whose entries sum to 1.
    """
    # Shift by this call's own maximum, never by a module-level value.
    shift = np.max(a)
    exp_a = np.exp(a - shift)  # overflow countermeasure
    sum_exp_a = np.sum(exp_a)
    return exp_a / sum_exp_a

티스토리

[Deep Learning from Scratch] chapter 3. Neural Network

[Deep Learning from Scratch] chapter 3. Neural Network

Neural Network¶

활성화 함수¶

계단함수¶

Sigmoid함수¶

ReLU함수(Rectified Linear Unit)¶

다층 신경망 구현¶

출력계층 설계¶

출력층 뉴런수¶