# -*- coding: utf-8 -*-
import numpy

def sigmoid(x):
    return 1.0/(1.0 + numpy.exp(-x))
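
# Note: the logistic sigmoid satisfies s'(x) = s(x)*(1 - s(x)), which is why
# backward() below can compute the gradient from the stored activations alone
# (the a*(1-a) factor) without ever keeping the pre-activations z around.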
class NeuralNet:

    def __init__(self, numUnitsPerLayer):
        """
        Constructor
        @param numUnitsPerLayer number of units per layer, excluding bias
        """
        numLayers = len(numUnitsPerLayer)
        if numLayers < 2:
            raise RuntimeError('ERROR: number of layers must be >= 2! (Got %d)' % numLayers)
        # total number of layers, incl. input and output
        self.numLayers = numLayers
        # activations; index 0 of each layer holds the bias unit
        self.activations = [numpy.zeros((numUnitsPerLayer[i] + 1,), numpy.float64)
                            for i in range(numLayers)]
        # set the biases
        for el in range(numLayers):
            self.activations[el][0] = 1.0
        # weights[el] maps layer el (incl. bias) to layer el+1
        self.weights = []
        self.bigDeltas = []        # accumulated gradients dJ/dTheta
        self.approxGradients = []  # storage for finite-difference gradient checks
        for el in range(numLayers - 1):
            shp = (numUnitsPerLayer[el + 1], numUnitsPerLayer[el] + 1)
            self.weights.append(numpy.zeros(shp, numpy.float64))
            self.bigDeltas.append(numpy.zeros(shp, numpy.float64))
            self.approxGradients.append(numpy.zeros(shp, numpy.float64))
        # back-propagated errors (excl. bias); no error for layer 0
        self.deltas = [numpy.zeros((len(a) - 1,), numpy.float64) for a in self.activations]
        self.deltas[0][:] = 0.0  # by definition
    def randomlyInitializeWeights(self, magnitude=0.1):
        """
        Randomly initialize the weights to values between -magnitude/2 ... +magnitude/2
        @param magnitude scale of the initial weights
        """
        numpy.random.seed(1234)  # fixed seed for reproducibility
        for w in self.weights:
            w[:] = magnitude*(numpy.random.rand(w.shape[0], w.shape[1]) - 0.5)
    def forward(self, inputData):
        """
        Compute the activations by propagating the input forward
        @param inputData input (excl. bias)
        """
        self.activations[0][1:] = inputData  # copy input data
        for el in range(1, self.numLayers):
            z = numpy.dot(self.weights[el - 1], self.activations[el - 1])
            self.activations[el][1:] = sigmoid(z)
            self.activations[el][0] = 1.0  # restore the bias unit
        return self.getOutput()
    def backward(self, targetOutputData):
        """
        Propagate the error backward (forward must have been called first)
        @param targetOutputData target output data
        """
        weightsTranspose = [numpy.transpose(w) for w in self.weights]
        # output-layer error: delta = a - y (cross-entropy cost with sigmoid output)
        self.deltas[-1][:] = self.activations[-1][1:] - targetOutputData
        for el in range(self.numLayers - 2, 0, -1):
            a = self.activations[el]
            gprime = a*(1.0 - a)  # sigmoid derivative in terms of the activation
            d = numpy.dot(weightsTranspose[el], self.deltas[el + 1])*gprime
            self.deltas[el][:] = d[1:]  # drop the bias component
    def getOutput(self):
        """
        Get the network output (excl. bias)
        @return array
        """
        return self.activations[-1][1:]

    def getInput(self):
        """
        Get the network input (excl. bias)
        @return array
        """
        return self.activations[0][1:]
    def getCost(self, inputOutputList, lam=0.0):
        """
        Compute the cross-entropy cost of the training data:
        J = -(1/m) sum_i [y_i*log(h_i) + (1-y_i)*log(1-h_i)] + (lam/(2m))*sum(weights**2)
        where m is the number of samples and bias weights are not regularized.
        @param inputOutputList list of [(input, output), ...] values
        @param lam >= 0 regularization parameter (lam=0 means no regularization)
        """
        res = 0.0
        # cross-entropy term
        for x, y in inputOutputList:
            # output from inputs and weights
            out = self.forward(x)
            # error
            res -= numpy.sum(y*numpy.log(out) + (1.0 - y)*numpy.log(1.0 - out))
        # regularization term (skip the bias column)
        for w in self.weights:
            res += (lam/2.0)*numpy.sum(w[:, 1:]**2)
        res /= float(len(inputOutputList))
        return res
    def train(self, inputOutputList, lam=0.0, alpha=1.0):
        """
        Update the weights with one batch gradient-descent step
        @param inputOutputList list of [(input, output), ...] values
        @param lam >= 0 regularization parameter (lam=0 means no regularization)
        @param alpha > 0 gradient descent step size
        @return cost before the step, cost after the step
        """
        numTraining = len(inputOutputList)
        # reset the gradient accumulators, otherwise gradients from
        # previous calls to train would leak into this step
        for el in range(self.numLayers - 1):
            self.bigDeltas[el][:, :] = 0.0
        # accumulate the error
        for x, y in inputOutputList:
            # compute the activations at each layer
            self.forward(x)
            # compute the errors at each layer
            self.backward(y)
            for el in range(self.numLayers - 1):
                # dJ/dTheta contribution from this sample
                self.bigDeltas[el] += numpy.outer(self.deltas[el + 1], self.activations[el])
        cost = self.getCost(inputOutputList, lam)
        # update the weights across all layers
        for el in range(self.numLayers - 1):
            self.weights[el][:, :] -= alpha*self.bigDeltas[el][:, :]/numTraining
            # regularization term (divided by numTraining to match getCost)
            self.weights[el][:, 1:] -= alpha*lam*self.weights[el][:, 1:]/numTraining
        newCost = self.getCost(inputOutputList, lam)
        return cost, newCost
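
# The class allocates self.approxGradients but never fills it in. A minimal
# finite-difference gradient check is sketched below so the back-propagated
# gradients can be verified; the function name numericalGradients and the eps
# value are illustrative assumptions, not part of the original code.
def numericalGradients(net, inputOutputList, lam=0.0, eps=1.e-4):
    """
    Fill net.approxGradients with central-difference approximations of
    dJ/dTheta at the current weights; for lam=0 these can be compared
    against bigDeltas/m accumulated from the same weights.
    """
    for el in range(net.numLayers - 1):
        w = net.weights[el]
        for i in range(w.shape[0]):
            for j in range(w.shape[1]):
                orig = w[i, j]
                w[i, j] = orig + eps
                costPlus = net.getCost(inputOutputList, lam)
                w[i, j] = orig - eps
                costMinus = net.getCost(inputOutputList, lam)
                w[i, j] = orig  # restore the weight
                net.approxGradients[el][i, j] = (costPlus - costMinus)/(2.0*eps)
    return net.approxGradients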

n = NeuralNet([2, 1])  # 2 inputs, 1 output, no hidden layer
n.randomlyInitializeWeights(0.1)
maxNumIter = 200
tol = 0.001
cost = float('inf')
alpha = 1.0  # step size for gradient descent
lam = 0.0    # regularization term, not needed here
count = 0
# truth table of logical AND
trainingSet = [([0., 0.], 0.), ([0., 1.], 0.), ([1., 0.], 0.), ([1., 1.], 1.)]
while cost > tol and count < maxNumIter and alpha > 1.e-4:
    oldCost, newCost = n.train(trainingSet, lam=lam, alpha=alpha)
    print('%d old cost=%f new cost=%f alpha=%f' % (count, oldCost, newCost, alpha))
    # simple adaptive step size
    if newCost < oldCost:
        alpha *= 1.2  # increase step
    else:
        alpha /= 2.0  # decrease step
    cost = newCost
    count += 1
# check the trained network on all four inputs
n.forward([0., 0.])
print('0,0 ->', n.getOutput())
n.forward([0., 1.])
print('0,1 ->', n.getOutput())
n.forward([1., 0.])
print('1,0 ->', n.getOutput())
n.forward([1., 1.])
print('1,1 ->', n.getOutput())
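
# The [2,1] net above is a single logistic unit, which suffices for AND
# because AND is linearly separable. A function like XOR is not, so it needs
# a hidden layer. A minimal sketch follows; the layer sizes, weight magnitude
# and iteration budget are illustrative assumptions, not tuned values.
xorNet = NeuralNet([2, 2, 1])  # 2 inputs, 2 hidden units, 1 output
xorNet.randomlyInitializeWeights(0.5)
xorSet = [([0., 0.], 0.), ([0., 1.], 1.), ([1., 0.], 1.), ([1., 1.], 0.)]
xorAlpha = 1.0
for it in range(5000):
    oldCost, newCost = xorNet.train(xorSet, lam=0.0, alpha=xorAlpha)
    xorAlpha = xorAlpha*1.2 if newCost < oldCost else xorAlpha/2.0
    if xorAlpha < 1.e-6:
        break  # the fixed seed may land in a poor basin; re-initialize if so
for x, y in xorSet:
    xorNet.forward(x)
    print(x, '->', xorNet.getOutput(), '(target %g)' % y)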