import lib needed¶

from PIL import Image  import numpy as np  import matplotlib.pyplot as plt  import re  from glob import glob

begin, load data¶

def load_data(train_path='train/',test_path='test/'):      train_list=glob(r'train/*.png')      pattern = re.compile(r'num(d).png')      train_id = np.array([float(pattern.search(img_name).groups()[0]) for img_name in train_list])      train_data=np.concatenate([np.array(Image.open(img_name)).reshape(1,784) for img_name in train_list],axis=0).astype(np.float)      test_list=glob(r'test/*.png')      test_id=np.array([float(pattern.search(img_name).groups()[0]) for img_name in test_list])      test_data=np.concatenate([np.array(Image.open(img_name)).reshape(1,784) for img_name in test_list],axis=0).astype(np.float)      return train_id,train_data,test_id,test_data

load data, print the shape of data¶

train_id,train_data,test_id,test_data=load_data()  train_id.shape,train_data.shape,test_id.shape,test_data.shape

((60000,), (60000, 784), (10000,), (10000, 784))

convert the shape of id/label¶

e.g. data_id “3” can be converted to [0,0,0,1,0,0,0,0,0,0]¶

train_val=np.zeros((train_id.shape[0],10))  for i in range(train_id.shape[0]):      train_val[i,train_id[i].astype('int')]=1

split data into minibatches¶

mini_batch_num=100  mini_batch_size=600

define function need, such as softmax, propagation,back_propagation¶

def softmax(x):      x=x-np.max(x) #using softmax(x)=softmax(x+c)      exp_x=np.exp(x)      softmax_x=exp_x/sum(np.exp(x))      return softmax_x

use cross entrophy to compute loss, this is part of propagation¶

def propa(train_x,train_y,W,b): #propagation      yt=softmax(np.dot(train_x,W)+b)      loss=-np.sum(train_y.T.dot(np.log(yt))) #cross entrophy      dy=(yt-train_y).T      return dy,loss

update W¶

def back_propa(train_data,train_id,W,b,alpha,data_size):      for i in range(data_size):          dy,loss=propa(train_data[i,:],train_id[i,:],W,b)          dy=dy.reshape(1,10)          p=train_data[i,:]          p=p.reshape(784,1)          dW=alpha*np.dot(p,dy)          W-=dW      return W,loss

initialize W and b¶

W=np.zeros((784,10))  b=1

loop and update, also print accurancy of our traindataset¶

for i in range(mini_batch_num):      for iteration in range(20):          lb=(mini_batch_size*i)          ub=(mini_batch_size*(i+1))          mini_batch_data=train_data[lb:ub,:]          mini_batch_id=train_val[lb:ub,:]          W,loss=back_propa(mini_batch_data,mini_batch_id,W,b,0.01,600)          count=0          for j in range(600):              if np.argmax(softmax(train_data[j,:].dot(W)))==train_id[j].astype('int'):                  count+=1          acc=count/600      if i%10==0:          print('batch={},acc={}'.format(i+1,acc))

e:Anaconda3libsite-packagesipykernel_launcher.py:3: RuntimeWarning: divide by zero encountered in log    This is separate from the ipykernel package so we can avoid doing imports until

batch=1,acc=1.0  batch=11,acc=0.8833333333333333  batch=21,acc=0.865  batch=31,acc=0.8983333333333333  batch=41,acc=0.8766666666666667  batch=51,acc=0.8883333333333333  batch=61,acc=0.8733333333333333  batch=71,acc=0.845  batch=81,acc=0.89  batch=91,acc=0.8766666666666667

predict in the test dataset¶

for j in range(test_id.shape[0]):      if np.argmax(softmax(test_data[j,:].dot(W)))==test_id[j].astype('int'):          count+=1  acc=count/test_id.shape[0]  print(acc)

0.9103

One layer SoftMax Classifier, "Handwriting recognition"

import lib needed¶

begin, load data¶

load data, print the shape of data¶

convert the shape of id/label¶

e.g. data_id “3” can be converted to [0,0,0,1,0,0,0,0,0,0]¶

split data into minibatches¶

define function need, such as softmax, propagation,back_propagation¶

use cross entrophy to compute loss, this is part of propagation¶

update W¶

initialize W and b¶

loop and update, also print accurancy of our traindataset¶

predict in the test dataset¶

VirMach 便宜 VPS

QNews

One layer SoftMax Classifier, "Handwriting recognition"

import lib needed¶

begin, load data¶

load data, print the shape of data¶

convert the shape of id/label¶

e.g. data_id “3” can be converted to [0,0,0,1,0,0,0,0,0,0]¶

split data into minibatches¶

define function need, such as softmax, propagation,back_propagation¶

use cross entrophy to compute loss, this is part of propagation¶

update W¶

initialize W and b¶

loop and update, also print accurancy of our traindataset¶

predict in the test dataset¶

分享此文：

Related Posts

vue+echarts可視化大屏,全國地圖下鑽,頁面自適應

【死磕Java並發】—–記憶體模型之happens-before

Kotlin基本語法和使用技巧

Python的urllib庫

VirMach 便宜 VPS

QNews

熱門搜尋