import numpy as np

# Affine transform of a single input row: h = x . W1 + b1
W1 = np.random.randn(2, 4)  # weights, shape (2, 4)
b1 = np.random.randn(4)     # bias, shape (4,)
x = np.random.randn(1, 2)   # input, shape (1, 2)

# (1, 2) @ (2, 4) -> (1, 4); b1 is broadcast across the single row.
h = x @ W1 + b1

# Bare expression: shows the value when run as a notebook cell.
h

array([[ 0.48247096, -1.2644639 ,  2.33997006,  3.01376622]])

# Example value vector `y` and a 0/1 vector `t` with a single 1 at index 1,
# kept here as plain Python lists.
y = [0.2,0.7,0.1]
t = [0,1,0]

import numpy as np
# The same example values as NumPy arrays, so element-wise arithmetic such as
# `y1 - t` works. Note that `t` is rebound here to an ndarray.
y1 = np.array([0.2,0.7,0.1])
t = np.array([0,1,0])

def mean_squared_error(y, t):
    """Return half the sum of squared element-wise differences of ``y`` and ``t``.

    Despite the name, no division by the number of elements takes place: the
    result is ``0.5 * sum((y - t) ** 2)``.

    Args:
        y: NumPy array of values to compare.
        t: NumPy array of reference values, broadcastable against ``y``.

    Returns:
        The scalar ``0.5 * sum((y - t) ** 2)``.
    """
    residual = y - t
    return 0.5 * np.sum(np.square(residual))

# Evaluate the error for the example arrays; as a bare expression the result is
# only displayed (notebook style), not stored.
mean_squared_error(y1,t)

0.07000000000000002

# A second example value vector.
y2 = np.array([0.5,0.3,0.2])

def cross_entropy_error(y, t):
    """Return the cross-entropy error ``-sum(t * log(y + 1e-7))``.

    Args:
        y: NumPy array of values passed to the logarithm.
        t: NumPy array of weights for each log term, broadcastable against ``y``.

    Returns:
        The scalar sum over all elements, negated.
    """
    # Small offset so that log() never receives exactly 0 when y contains 0.
    eps = 1e-7
    log_terms = np.log(y + eps)
    return -np.sum(t * log_terms)

import numpy as np
def cross_entropy_error(y,t):
    """Return the cross-entropy error summed over all elements and divided by ``y.shape[0]``.

    Args:
        y: NumPy array of values passed to the logarithm. The divisor is the
            length of its first axis, so a layout with one sample per row is
            assumed -- TODO confirm against callers.
        t: NumPy array of weights for each log term, broadcastable against ``y``.

    Returns:
        The scalar ``-sum(t * log(y)) / y.shape[0]``.
    """
    cee = - np.sum(t * np.log(y))/y.shape[0]
    # Hand the value back to the caller; without this the function yields None.
    return cee

# Two-row example: each row of `y` holds three values, and each row of `t` has
# its single 1 in column 0.
y = np.array([[0.1,0.2,0.7],[0.5,0.2,0.3]])
t = np.array([[1,0,0],[1,0,0]])

# Cross-entropy error
def cross_entropy_error(y,t):
    """Return the cross-entropy error averaged over the samples in ``y``.

    A 1-D ``y`` is treated as a single sample (a batch of one), so the sum is
    divided by 1 rather than by the number of entries in the vector. For 2-D
    input the sum is divided by the number of rows.

    Args:
        y: Array-like of predicted values, either one vector or one vector
            per row.
        t: Array-like of weights for each log term, with the same layout as
            ``y``.

    Returns:
        The scalar ``-sum(t * log(y + 1e-7)) / batch_size``.
    """
    y = np.asarray(y)
    t = np.asarray(t)

    # Promote a single sample to a batch of one so shape[0] is the batch size.
    if y.ndim == 1:
        y = y.reshape(1, y.size)
        t = t.reshape(1, t.size)

    batch_size = y.shape[0]
    # Small offset keeps log() finite when y contains exact zeros.
    delta = 1e-7
    cee = - np.sum(t * np.log(y + delta))/batch_size
    return cee

# Softmax function
def softmax(a):
    """Return the softmax of ``a`` computed along its last axis.

    A 1-D input yields one distribution. For inputs with more dimensions each
    vector along the last axis is normalised independently, so every row of a
    2-D batch sums to 1.

    Args:
        a: Array-like of scores (scalar, vector, or batch of vectors).

    Returns:
        Array of the same shape as ``a`` holding ``exp(a) / sum(exp(a))``
        per vector.
    """
    a = np.asarray(a)
    # A 0-d input has no last axis; reduce over everything in that case.
    axis = -1 if a.ndim > 0 else None

    # Subtracting the maximum leaves the result unchanged mathematically but
    # keeps exp() from overflowing on large scores.
    c = np.max(a, axis=axis, keepdims=True)
    exp_a = np.exp(a - c)
    sum_a = np.sum(exp_a, axis=axis, keepdims=True)
    y = exp_a / sum_a

    return y

import numpy as np

class simpleNet:
    """Single weight-matrix network: ``x . W`` followed by softmax and cross-entropy.

    Relies on the module-level ``softmax`` and ``cross_entropy_error`` functions.
    """

    def __init__(self):
        # Weight matrix of shape (2, 3), drawn from a standard normal distribution.
        self.W = np.random.randn(2,3)

    def predict(self,x):
        """Return the raw scores ``np.dot(x, self.W)`` for input ``x``."""
        return np.dot(x,self.W)

    def loss(self,x,t):
        """Return the cross-entropy error of the softmax of the scores for ``x``.

        Args:
            x: Input passed to ``predict``.
            t: Target passed to ``cross_entropy_error`` alongside the softmax output.

        Returns:
            The value returned by ``cross_entropy_error``.
        """
        z = self.predict(x)
        y = softmax(z)
        # Correct spelling of the helper; the misspelled name raised NameError.
        loss = cross_entropy_error(y,t)

        return loss

# Create an instance
sn = simpleNet()

# Creating the instance fills the weights with random values (initialization). They can be inspected as follows.
sn.W

array([[ 1.72265811,  0.68672941,  1.10772301],
       [ 0.60344169,  0.60322389, -0.3536039 ]])

# Multiplication (inference)
x = np.array([2.0,3.0])
sn.predict(x)

array([5.25564131, 3.1831305 , 1.15463432])

# Ground-truth label
t = np.array([0,0,1])

# Compute the loss
sn.loss(x,t)

1.4113868299245542

def numerical_gradient(f, x):
    """Estimate the gradient of ``f`` at ``x`` with central differences.

    Every element of ``x`` is shifted in place by ``+h`` and then ``-h``
    (``h = 1e-4``), ``f(x)`` is evaluated for each shift, and the element is
    put back before moving on to the next one.

    Args:
        f: Callable invoked as ``f(x)``; its result is used as a scalar.
        x: NumPy array to differentiate with respect to. It is modified
            temporarily during the call and holds its original values again
            on return.

    Returns:
        Array created with ``np.zeros_like(x)`` containing
        ``(f(x + h) - f(x - h)) / (2 * h)`` for each element.
    """
    step = 1e-4  # 0.0001
    gradient = np.zeros_like(x)

    walker = np.nditer(x, flags=['multi_index'], op_flags=['readwrite'])
    for _ in walker:
        pos = walker.multi_index
        original = x[pos]

        x[pos] = float(original) + step
        f_plus = f(x)  # f(x+h)

        x[pos] = original - step
        f_minus = f(x)  # f(x-h)

        gradient[pos] = (f_plus - f_minus) / (2*step)

        x[pos] = original  # restore the original value

    return gradient

def f(W):
    """Return the loss of the module-level ``sn`` for the module-level ``x`` and ``t``.

    ``W`` is accepted only so the function can be called as ``f(array)``; it
    is never read. The loss changes between calls only when ``sn.W`` itself
    has been modified in place.
    """
    current_loss = sn.loss(x, t)
    return current_loss

# Numerical gradient of the loss with respect to sn.W. The weight array itself
# is passed, so the in-place shifts made by numerical_gradient are seen by
# sn.loss. As a bare expression the result is only displayed, not stored.
numerical_gradient(f,sn.W)

array([[ 0.58355381,  0.07345154, -0.65700535],
       [ 0.87533072,  0.11017731, -0.98550803]])

学習者言語の分析（応用）1（第4回）

4.2 ニューラルネットワーク

4.2.1 ニューラルネットワークの推論

4.2.2 機械学習のモデルとしてのニューラルネットワーク

4.2.3 損失関数

4.2.4 ニューラルネットワークにおける勾配