In [1]:
import numpy as np

# Sigmoid (logistic) activation function
def sigmoid(x):
    """Return the logistic function 1 / (1 + exp(-x)), applied element-wise.

    ``x`` may be a scalar or a NumPy array; the result has the shape that
    ``np.exp(-x)`` produces for that input.
    """
    denominator = 1 + np.exp(-x)
    return 1 / denominator

# Numerical differentiation (central difference)
def numerical_derivative(f, x):
    """Approximate the gradient of ``f`` with respect to every element of ``x``.

    Each element is perturbed by +/- ``delta_x`` in turn and the central
    difference ``(f(x + delta_x) - f(x - delta_x)) / (2 * delta_x)`` is stored
    at the same index of the result.

    Parameters
    ----------
    f : callable
        Called as ``f(x)`` and expected to return a scalar.
    x : numpy.ndarray
        Point at which to differentiate. A floating-point array is perturbed
        *in place* (and restored element by element), so an ``f`` that ignores
        its argument and reads the same array through a closure still sees
        the perturbation. Integer, boolean or non-array input cannot hold
        ``x +/- delta_x`` without truncation, so it is differentiated on a
        float copy instead; in that case ``f`` must use the argument it is
        given, and the caller's object is left untouched.

    Returns
    -------
    numpy.ndarray
        Floating-point array with the same shape as ``x``.
    """
    delta_x = 1e-4 # 0.0001

    # Storing x + 1e-4 into an integer array truncates the perturbation and
    # np.zeros_like would give an integer gradient; work on a float copy.
    if not (isinstance(x, np.ndarray) and np.issubdtype(x.dtype, np.floating)):
        x = np.array(x, dtype=float)

    grad = np.zeros_like(x)

    it = np.nditer(x, flags=['multi_index'], op_flags=['readwrite'])

    while not it.finished:
        idx = it.multi_index
        tmp_val = x[idx]  # remember the original value so it can be restored

        x[idx] = float(tmp_val) + delta_x
        fx1 = f(x) # f(x+delta_x)

        x[idx] = tmp_val - delta_x
        fx2 = f(x) # f(x-delta_x)
        grad[idx] = (fx1 - fx2) / (2*delta_x)

        x[idx] = tmp_val  # undo the perturbation before moving on
        it.iternext()

    return grad

In [3]:
# LogicGate Class

class LogicGate:
    """Single-layer logistic model of a two-input logic gate.

    The model computes ``sigmoid(x . W + b)`` with a 2x1 weight matrix ``W``
    and a one-element bias ``b``, and is fitted by gradient descent on the
    summed binary cross-entropy, using ``numerical_derivative`` for gradients.
    """

    def __init__(self, gate_name, xdata, tdata, learning_rate=1e-2):  # xdata, tdata => numpy.array(...)
        """Store the truth table and randomly initialise the parameters.

        Parameters
        ----------
        gate_name : str
            Label exposed as ``self.name``.
        xdata : numpy.ndarray
            Gate inputs; reshaped to (4, 2).
        tdata : numpy.ndarray
            Target outputs; reshaped to (4, 1).
        learning_rate : float, optional
            Gradient-descent step size (default 1e-2).
        """
        self.name = gate_name

        # Input data and target data
        self.__xdata = xdata.reshape(4,2)
        self.__tdata = tdata.reshape(4,1)

        # Weight W (2 x 1 matrix) and bias b, drawn with np.random.rand
        self.__W = np.random.rand(2,1)
        self.__b = np.random.rand(1)

        # Learning rate
        self.__learning_rate = learning_rate

    # Loss function
    def __loss_func(self):
        """Return the summed binary cross-entropy over the stored truth table."""
        delta = 1e-7    # keeps log() away from log(0) = -inf

        z = np.dot(self.__xdata, self.__W) + self.__b
        y = sigmoid(z)

        # cross-entropy
        return  -np.sum( self.__tdata*np.log(y + delta) + (1-self.__tdata)*np.log((1 - y)+delta ) )

    # Current loss value
    def error_val(self):
        """Return the current loss; public wrapper around the private loss function."""
        return self.__loss_func()

    # Train with numerical differentiation until the step budget is used up
    def train(self, steps=8001, report_every=400):
        """Run gradient descent on W and b, printing the loss periodically.

        Parameters
        ----------
        steps : int, optional
            Number of update steps (default 8001).
        report_every : int, optional
            Print the loss every this many steps (default 400). A value of
            0 or None disables the periodic report.
        """
        # The argument is ignored on purpose: numerical_derivative perturbs
        # self.__W / self.__b in place, and the loss reads those same arrays.
        f = lambda x : self.__loss_func()

        print("Initial error value = ", self.error_val())

        for step in range(steps):

            self.__W -= self.__learning_rate * numerical_derivative(f, self.__W)

            self.__b -= self.__learning_rate * numerical_derivative(f, self.__b)

            if report_every and step % report_every == 0:
                print("step = ", step, "error value = ", self.error_val())

    # Prediction
    def predict(self, input_data):
        """Classify one input pair.

        Returns ``(y, result)`` where ``y`` is the sigmoid output and
        ``result`` is 1 if ``y > 0.5`` else 0. The comparison is used directly
        in an ``if``, so ``input_data`` is expected to be a single sample.
        """
        z = np.dot(input_data, self.__W) + self.__b
        y = sigmoid(z)

        if y > 0.5:
            result = 1  # True
        else:
            result = 0  # False

        return y, result

In [4]:
# AND gate truth table: one row per input pair, one target per row.
xdata = np.array([[0, 0], [0, 1], [1, 0], [1, 1]])
tdata = np.array([0, 0, 0, 1])

# Build the model and fit it to the truth table.
AND_obj = LogicGate(gate_name="AND_GATE", xdata=xdata, tdata=tdata)
AND_obj.train()

Initial error value =  3.87189614416236
step =  0 error value =  3.8290613456355285
step =  400 error value =  1.5472644381890523
step =  800 error value =  1.1478164614712822
step =  1200 error value =  0.9219666487783601
step =  1600 error value =  0.773170228380784
step =  2000 error value =  0.6663476567778215
step =  2400 error value =  0.585419886895292
step =  2800 error value =  0.5218015984941872
step =  3200 error value =  0.4704116270784027
step =  3600 error value =  0.4280163692671116
step =  4000 error value =  0.3924450589115024
step =  4400 error value =  0.36217960375245506
step =  4800 error value =  0.3361234349012342
step =  5200 error value =  0.3134633321338242
step =  5600 error value =  0.29358283992556594
step =  6000 error value =  0.2760058829626352
step =  6400 error value =  0.2603588540252483
step =  6800 error value =  0.24634442354044006
step =  7200 error value =  0.23372302204483467
step =  7600 error value =  0.2222994810945681
step =  8000 error valu

In [7]:
# AND gate prediction: print the sigmoid output and the thresholded 0/1
# decision for every input pair.
print(AND_obj.name, "\n")

test_data = np.array([[0, 0], [0, 1], [1, 0], [1, 1]])

for input_data in test_data:
    sigmoid_val, logical_val = AND_obj.predict(input_data)
    print(input_data, " = ", sigmoid_val, logical_val, "\n")

AND_GATE 

[0 0]  =  [0.00037347] 0 

[0 1]  =  [0.05993759] 0 

[1 0]  =  [0.05993974] 0 

[1 1]  =  [0.91583433] 1 



In [8]:
# OR gate truth table: one row per input pair, one target per row.
xdata = np.array([[0, 0], [0, 1], [1, 0], [1, 1]])
tdata = np.array([0, 1, 1, 1])

# Build the model and fit it to the truth table.
OR_obj = LogicGate(gate_name="OR_GATE", xdata=xdata, tdata=tdata)
OR_obj.train()

Initial error value =  1.8354987074486349
step =  0 error value =  1.8321271321722086
step =  400 error value =  1.1411611542544624
step =  800 error value =  0.8200178431125235
step =  1200 error value =  0.6339984380140804
step =  1600 error value =  0.513750681724652
step =  2000 error value =  0.4301153677278492
step =  2400 error value =  0.3688594411271438
step =  2800 error value =  0.3222264189260756
step =  3200 error value =  0.2856392131360178
step =  3600 error value =  0.2562299618579968
step =  4000 error value =  0.23211509173502304
step =  4400 error value =  0.21200934091078838
step =  4800 error value =  0.19500745181817397
step =  5200 error value =  0.18045448821164145
step =  5600 error value =  0.16786558804773738
step =  6000 error value =  0.15687455681491813
step =  6400 error value =  0.14719993873845286
step =  6800 error value =  0.13862203317711294
step =  7200 error value =  0.13096696439531788
step =  7600 error value =  0.12409541301152377
step =  8000 e

In [10]:
# OR gate prediction: print the sigmoid output and the thresholded 0/1
# decision for every input pair.
print(OR_obj.name, "\n")

test_data = np.array([[0, 0], [0, 1], [1, 0], [1, 1]])

for input_data in test_data:
    sigmoid_val, logical_val = OR_obj.predict(input_data)
    print(input_data, " = ", sigmoid_val, logical_val, "\n")

OR_GATE 

[0 0]  =  [0.0640742] 0 

[0 1]  =  [0.9744518] 1 

[1 0]  =  [0.97457988] 1 

[1 1]  =  [0.99995319] 1 



In [11]:
# NAND gate truth table: one row per input pair, one target per row.
xdata = np.array([[0, 0], [0, 1], [1, 0], [1, 1]])
tdata = np.array([1, 1, 1, 0])

# Build the model and fit it to the truth table.
NAND_obj = LogicGate(gate_name="NAND_GATE", xdata=xdata, tdata=tdata)
NAND_obj.train()

Initial error value =  3.016369194737334
step =  0 error value =  3.0110004851194656
step =  400 error value =  1.7315791571232308
step =  800 error value =  1.2382415479166153
step =  1200 error value =  0.977102928091718
step =  1600 error value =  0.8109828591839887
step =  2000 error value =  0.6941513898864193
step =  2400 error value =  0.6068199361902182
step =  2800 error value =  0.538816097017133
step =  3200 error value =  0.484274183673449
step =  3600 error value =  0.43953042285108734
step =  4000 error value =  0.40215939591707406
step =  4400 error value =  0.3704832093962748
step =  4800 error value =  0.34330033238511143
step =  5200 error value =  0.31972602968830793
step =  5600 error value =  0.2990936311751099
step =  6000 error value =  0.28089090316304527
step =  6400 error value =  0.2647176365896073
step =  6800 error value =  0.2502565642874539
step =  7200 error value =  0.23725292937996856
step =  7600 error value =  0.22549982721738654
step =  8000 error v

In [14]:
# NAND gate prediction: print the sigmoid output and the thresholded 0/1
# decision for every input pair.
print(NAND_obj.name, "\n")

test_data = np.array([[0, 0], [0, 1], [1, 0], [1, 1]])

for input_data in test_data:
    sigmoid_val, logical_val = NAND_obj.predict(input_data)
    print(input_data, " = ",sigmoid_val,  logical_val, "\n")

NAND_GATE 

[0 0]  =  [0.99961043] 1 

[0 1]  =  [0.93927297] 1 

[1 0]  =  [0.93927078] 1 

[1 1]  =  [0.08528035] 0 



In [15]:
# XOR gate truth table: one row per input pair, one target per row.
xdata = np.array([[0, 0], [0, 1], [1, 0], [1, 1]])
tdata = np.array([0, 1, 1, 0])

XOR_obj = LogicGate(gate_name="XOR_GATE", xdata=xdata, tdata=tdata)

# For the XOR gate the loss stops decreasing once it reaches roughly 2.77
# (see the training log below).
XOR_obj.train()

Initial error value =  2.914734145753466
step =  0 error value =  2.9104795793301967
step =  400 error value =  2.772788519509934
step =  800 error value =  2.772637019698026
step =  1200 error value =  2.7726008069134473
step =  1600 error value =  2.7725914348989513
step =  2000 error value =  2.772588899020577
step =  2400 error value =  2.772588196545225
step =  2800 error value =  2.7725879996417335
step =  3200 error value =  2.772587944131052
step =  3600 error value =  2.7725879284380714
step =  4000 error value =  2.7725879239957294
step =  4400 error value =  2.7725879227374
step =  4800 error value =  2.7725879223808594
step =  5200 error value =  2.772587922279821
step =  5600 error value =  2.772587922251187
step =  6000 error value =  2.772587922243071
step =  6400 error value =  2.7725879222407714
step =  6800 error value =  2.7725879222401195
step =  7200 error value =  2.7725879222399348
step =  7600 error value =  2.772587922239882
step =  8000 error value =  2.772587

In [16]:
# XOR gate prediction => the single-gate model fails: every sigmoid output
# sits at about 0.5, so the thresholded decisions do not match XOR.
print(XOR_obj.name, "\n")

test_data = np.array([[0, 0], [0, 1], [1, 0], [1, 1]])

for input_data in test_data:
    sigmoid_val, logical_val = XOR_obj.predict(input_data)
    print(input_data, " = ", sigmoid_val,logical_val, "\n")

XOR_GATE 

[0 0]  =  [0.49999996] 0 

[0 1]  =  [0.49999999] 0 

[1 0]  =  [0.49999999] 0 

[1 1]  =  [0.50000003] 1 



In [17]:
# Compute XOR by combining the trained gates: the NAND and OR outputs are
# fed into the AND gate.
input_data = np.array([[0, 0], [0, 1], [1, 0], [1, 1]])

final_output = []    # AND outputs, i.e. the XOR results

for sample in input_data:
    s1 = NAND_obj.predict(sample)    # (sigmoid value, 0/1 decision) from NAND
    s2 = OR_obj.predict(sample)      # (sigmoid value, 0/1 decision) from OR

    # Only the 0/1 decisions (last tuple element) are passed on to AND.
    new_input_data = [s1[-1], s2[-1]]

    sigmoid_val, logical_val = AND_obj.predict(np.array(new_input_data))
    final_output.append(logical_val)


for sample, xor_bit in zip(input_data, final_output):
    print(sample, " = ", xor_bit, end='')
    print("\n")

[0 0]  =  0

[0 1]  =  1

[1 0]  =  1

[1 1]  =  0

