@@ -42,7 +42,7 @@ def feedforward(self, a):
        return a

    def SGD(self, training_data, epochs, mini_batch_size, eta,
-            lmbda, test_data=None):
+            test_data=None):
        """Train the neural network using mini-batch stochastic
        gradient descent. The ``training_data`` is a list of tuples
        ``(x, y)`` representing the training inputs and the desired
@@ -59,14 +59,14 @@ def SGD(self, training_data, epochs, mini_batch_size, eta,
                training_data[k:k+mini_batch_size]
                for k in xrange(0, n, mini_batch_size)]
            for mini_batch in mini_batches:
-                self.backprop(mini_batch, n, eta, lmbda)
+                self.backprop(mini_batch, n, eta)
            if test_data:
                print "Epoch {}: {} / {}".format(
                    j, self.evaluate(test_data), n_test)
            else:
                print "Epoch %s complete" % j

-    def backprop(self, training_data, n, eta, lmbda):
+    def backprop(self, training_data, n, eta):
        """Update the network's weights and biases by applying a
        single iteration of gradient descent using backpropagation.
        The ``training_data`` is a list of tuples ``(x, y)``. It need
@@ -77,7 +77,6 @@ def backprop(self, training_data, n, eta, lmbda):
        self-explanatory."""
        nabla_b = [np.zeros(b.shape) for b in self.biases]
        nabla_w = [np.zeros(w.shape) for w in self.weights]
-        B = len(training_data)
        for x, y in training_data:
            # feedforward
            activation = x
@@ -105,8 +104,6 @@ def backprop(self, training_data, n, eta, lmbda):
                delta = np.dot(self.weights[-l+1].transpose(), delta) * spv
                nabla_b[-l] += delta
                nabla_w[-l] += np.dot(delta, activations[-l-1].transpose())
-        # Add the regularization terms to the gradient for the weights
-        nabla_w = [nw+(lmbda*B/n)*w for nw, w in zip(nabla_w, self.weights)]
        self.weights = [w-eta*nw for w, nw in zip(self.weights, nabla_w)]
        self.biases = [b-eta*nb for b, nb in zip(self.biases, nabla_b)]

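The two removed lines above were the only place ``lmbda`` was used: they added the L2 term (lmbda * B / n) * w to the accumulated weight gradient before the update. A minimal sketch (not part of the commit) contrasting the plain update kept here with the update the removed lines produced; the array values and the eta, lmbda, B, n numbers are illustrative assumptions only:

import numpy as np

w = np.array([[0.5, -1.0], [2.0, 0.1]])    # a toy weight matrix
nw = np.array([[0.1, 0.2], [-0.3, 0.0]])   # its accumulated gradient nabla_w
eta, lmbda, B, n = 3.0, 0.1, 10, 50000     # made-up hyperparameters

# Update kept by this commit: plain gradient descent.
plain = w - eta * nw
# Update the removed lines produced: the same step plus weight decay.
regularized = w - eta * (nw + (lmbda * B / n) * w)
print(plain)
print(regularized)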
@@ -121,15 +118,12 @@ def evaluate(self, test_data):

    def cost(self, x, y):
        """Return the quadratic cost associated to the network, with
-        input ``x`` and desired output ``y``. Note that there is no
-        regularization."""
+        input ``x`` and desired output ``y``."""
        return np.sum((self.feedforward(x)-y)**2)/2.0

    def cost_derivative(self, output_activations, y):
        """Return the vector of partial derivatives \partial C_x /
-        \partial a for the output activations, ``a``. For the
-        unregularized quadratic cost this is just the difference
-        between the output activations and the desired output, ``y``."""
+        \partial a for the output activations, ``a``."""
        return (output_activations-y)

#### Miscellaneous functions
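With ``lmbda`` gone, callers of ``SGD`` simply drop that argument. A hedged usage sketch, assuming the class in this file is exposed as ``network.Network`` (Python 2, per the ``print`` statements and ``xrange`` above); the layer sizes and the tiny random dataset in the ``(x, y)`` tuple format the docstring describes are placeholders, not taken from the commit:

import numpy as np
import network  # the module this diff modifies (assumed name)

net = network.Network([784, 30, 10])
# Twenty fake (input, desired output) pairs, just to exercise the call.
training_data = [(np.random.randn(784, 1), np.random.randn(10, 1))
                 for _ in range(20)]
# New signature: no lmbda between eta and test_data.
net.SGD(training_data, epochs=1, mini_batch_size=10, eta=3.0)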