In [19]:
import numpy as np
from aifunc import *

In [20]:
class MulLayer:
    """Multiplication node of a computational graph.

    The forward pass stores both operands because the gradient of a
    product with respect to one operand is the other operand.
    """

    def __init__(self):
        # Operands of the most recent forward pass (None until forward runs).
        self.x = self.y = None

    def forward(self, x, y):
        """Remember both operands and return their product ``x * y``."""
        self.x, self.y = x, y
        return x * y

    def backward(self, dout):
        """Return ``(dx, dy)`` for the upstream gradient ``dout``.

        The operands are swapped: d(x*y)/dx = y and d(x*y)/dy = x.
        """
        return dout * self.y, dout * self.x


class AddLayer:
    """Addition node of a computational graph (stateless)."""

    def __init__(self):
        """Nothing to store: the backward pass does not need the operands."""

    def forward(self, x, y):
        """Return the sum ``x + y``."""
        return x + y

    def backward(self, dout):
        """Pass the upstream gradient through unchanged to both inputs.

        d(x+y)/dx = d(x+y)/dy = 1, so each input receives ``dout * 1``.
        """
        return dout * 1, dout * 1

In [21]:
# Inputs of the example graph: unit price of an apple, number of apples
# bought, and the tax multiplier applied to the subtotal.
apple, apple_num, tax = 100, 2, 1.1

In [22]:
# One multiplication node per product in the graph:
# (apple * apple_num) and (apple_price * tax).
mul_apple_layer, mul_tax_layer = MulLayer(), MulLayer()

In [23]:
# Forward pass: evaluate the graph from the inputs to the final price.
# apple_price is the subtotal (unit price * quantity); price applies the tax
# multiplier to that subtotal.
apple_price = mul_apple_layer.forward(apple, apple_num)
price = mul_tax_layer.forward(apple_price, tax)

In [24]:
# Backward pass: visit the layers in the reverse order of the forward pass.
# dprice = 1 seeds the chain rule (d price / d price).
dprice = 1
# Gradient of price w.r.t. the subtotal and w.r.t. the tax multiplier.
dapple_price, dtax = mul_tax_layer.backward(dprice)
# Gradient of price w.r.t. the unit price and w.r.t. the quantity.
dapple, dapple_num = mul_apple_layer.backward(dapple_price)

In [25]:
# Report the forward result and the gradients. price and dapple_num are
# products involving the float tax multiplier, so int() drops the fractional
# part before printing.
print("price:", int(price))
print("dApple:", dapple)
print("dApple_num:", int(dapple_num))
print("dTax:", dtax)

price: 220
dApple: 2.2
dApple_num: 110
dTax: 200


In [26]:
class Relu():
    """ReLU activation layer: passes positive inputs, zeroes the rest.

    The methods are named ``forward`` / ``backward`` like every other layer
    in this file. The earlier misspelled names ``forwaord`` / ``backwoard``
    are kept as aliases so existing callers keep working.
    """

    def __init__(self):
        # Boolean mask of the positions that were <= 0 in the last forward
        # pass (None until forward runs).
        self.mask = None

    def forward(self, x):
        """Return a copy of ``x`` with every element <= 0 replaced by 0.

        ``x`` must support ``.copy()`` and boolean-mask assignment (e.g. a
        NumPy array). The input itself is not modified.
        """
        # Remember which positions were clipped; backward needs them.
        self.mask = (x <= 0)
        out = x.copy()
        out[self.mask] = 0
        return out

    def backward(self, dout):
        """Return a copy of ``dout`` with the gradient zeroed at every
        position that was clipped in the forward pass.
        """
        dx = dout.copy()
        dx[self.mask] = 0
        return dx

    # Backward-compatible aliases for the original (misspelled) method names.
    forwaord = forward
    backwoard = backward

In [27]:
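# Backpropagation formula for the sigmoid layer:
#   dL/dx = dL/dy * y^2 * exp(-x)
# where x is the input received by forward, y is the output of forward, and
# dL/dy is the partial derivative of the final result L with respect to y.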
class Sigmoid():
    """Sigmoid activation layer.

    ``forward`` delegates to a ``sigmoid`` function that is not defined in
    this file (presumably provided by the ``aifunc`` wildcard import --
    confirm).
    """

    def __init__(self):
        # Input and output of the most recent forward pass. Both start as
        # None so they can be read safely before forward has run.
        self.x = None
        self.out = None

    def forward(self, x):
        """Store ``x``, compute ``sigmoid(x)``, cache it and return it."""
        self.x = x
        self.out = sigmoid(x)
        return self.out

    def backward(self, dout):
        """Return the gradient w.r.t. the input for upstream gradient ``dout``.

        Derivation, with y = sigmoid(x) = 1 / (1 + exp(-x)):
            dy/dx = exp(-x) / (1 + exp(-x))^2
                  = y^2 * exp(-x)
                  = y * (1 - y)          since exp(-x) = (1 - y) / y
        so only the cached output is needed, not the input.
        """
        dx = dout * self.out * (1 - self.out)
        return dx

In [57]:
class Affine():
    """Fully connected layer computing ``np.dot(x, W) + b``."""

    def __init__(self, W, b):
        # Parameters of the layer; stored by reference, not copied.
        self.W = W
        self.b = b
        # Input of the last forward pass and the parameter gradients of the
        # last backward pass (None until those passes run).
        self.x = None
        self.dW = None
        self.db = None

    def forward(self, x):
        """Remember ``x`` and return ``np.dot(x, W) + b``."""
        self.x = x
        return np.dot(x, self.W) + self.b

    def backward(self, dout):
        """Store the parameter gradients and return the input gradient.

        ``dW`` is ``x.T . dout`` and ``db`` sums ``dout`` over axis 0; the
        returned value is ``dout . W.T``.
        Assumes a 2-D ``x`` with samples along axis 0 -- TODO confirm.
        """
        grad_input = np.dot(dout, self.W.T)
        self.dW = np.dot(self.x.T, dout)
        self.db = np.sum(dout, axis=0)
        return grad_input

In [58]:
class SoftmaxWLoss():
    """Softmax activation followed by a cross-entropy loss.

    ``forward`` relies on ``softmax`` and ``cross_entropy_error``, which are
    not defined in this file (presumably provided by the ``aifunc`` wildcard
    import -- confirm).
    """

    def __init__(self, W=None):
        """Create the layer.

        ``W`` is accepted only for backward compatibility with existing
        callers; it is not used, so it is now optional.
        """
        # Loss value, softmax output and targets of the last forward pass.
        self.loss = None
        self.y, self.t = None, None

    def forward(self, x, t):
        """Cache ``t`` and ``softmax(x)``, then return the loss between them."""
        self.t = t
        self.y = softmax(x)
        self.loss = cross_entropy_error(self.y, self.t)

        return self.loss

    def backward(self, dout=1):
        """Return the gradient of the loss w.r.t. the input of ``forward``.

        The result is ``(y - t) * dout / batch_size`` where the batch size is
        ``t.shape[0]``. ``dout`` is the upstream gradient; with the default of
        1 the result equals ``(y - t) / batch_size``.
        Assumes ``t`` is one-hot with the same shape as ``y`` and samples
        along axis 0 -- TODO confirm against cross_entropy_error.
        """
        batch_size = self.t.shape[0]
        # Apply the chain rule instead of silently dropping the upstream
        # gradient.
        dx = (self.y - self.t) * dout / batch_size
        return dx