Particle Swarm Optimization

masscollaborationlabs · Oct 6, 2017 · c5256ff · c5256ff
1 parent 3794bde
commit c5256ff
Show file tree

Hide file tree

Showing 2 changed files with 21 additions and 16 deletions.
diff --git a/mlfromscratch/examples/particle_swarm_optimization.py b/mlfromscratch/examples/particle_swarm_optimization.py
@@ -55,12 +55,15 @@ def model_builder(n_inputs, n_outputs):
                         inertia_weight=inertia_weight,
                         cognitive_weight=cognitive_weight,
                         social_weight=social_weight,
+                        max_velocity=5,
                         model_builder=model_builder)
 
     model = model.evolve(X_train, y_train, n_generations=n_generations)
 
     loss, accuracy = model.test_on_batch(X_test, y_test)
 
+    print ("Accuracy: %.1f%%" % float(100*accuracy))
+
     # Reduce dimension to 2D using PCA and plot the results
     y_pred = np.argmax(model.predict(X_test), axis=1)
     Plot().plot_in_2d(X_test, y_pred, title="Particle Swarm Optimized Neural Network", accuracy=accuracy, legend_labels=range(y.shape[1]))

diff --git a/mlfromscratch/supervised_learning/particle_swarm_optimization.py b/mlfromscratch/supervised_learning/particle_swarm_optimization.py
@@ -9,24 +9,28 @@ class ParticleSwarmOptimizedNN():
     -----------
     n_individuals: int
         The number of neural networks that are allowed in the population at a time.
+    model_builder: method
+        A method which returns a user specified NeuralNetwork instance.
     inertia_weight:     float [0,1)
     cognitive_weight:   float [0,1)
     social_weight:      float [0,1)
-    model_builder: method
-        A method which returns a user specified NeuralNetwork instance.
+    max_velocity: float
+        The maximum allowed magnitude of the velocity; each velocity component is clipped to [-max_velocity, max_velocity].
 
     Reference:
         Neural Network Training Using Particle Swarm Optimization
         https://visualstudiomagazine.com/articles/2013/12/01/neural-network-training-using-particle-swarm-optimization.aspx 
     """
-    def __init__(self, population_size, inertia_weight, cognitive_weight, social_weight, model_builder):
+    def __init__(self, population_size, model_builder, inertia_weight=0.8, cognitive_weight=2, social_weight=2, max_velocity=10):
         self.population_size = population_size
         self.model_builder = model_builder
         self.best_individual = None
         # Parameters used to update velocity
         self.cognitive_w = cognitive_weight
         self.inertia_w = inertia_weight
         self.social_w = social_weight
+        self.min_v = -max_velocity
+        self.max_v = max_velocity
 
     def _build_model(self, id):
         """ Returns a new individual """
@@ -35,19 +39,17 @@ def _build_model(self, id):
         model.fitness = 0
         model.highest_fitness = 0
         model.accuracy = 0
+        # Set initial best as the current initialization
+        model.best_layers = copy.copy(model.layers)
 
-        # Set initial velocity
+        # Set initial velocity to zero
         model.velocity = []
         for layer in model.layers:
+            velocity = {"W": 0, "w0": 0}
             if hasattr(layer, 'W'):
                 velocity = {"W": np.zeros_like(layer.W), "w0": np.zeros_like(layer.w0)}
-            else:
-                velocity = {"W": 0, "w0": 0}
             model.velocity.append(velocity)
 
-        # Set intial best as the current initialization
-        model.best_layers = copy.copy(model.layers)
-
         return model
 
     def _initialize_population(self):
@@ -64,18 +66,19 @@ def _update_weights(self, individual):
         r2 = np.random.uniform()
         for i, layer in enumerate(individual.layers):
             if hasattr(layer, 'W'):
-
                 # Layer weights velocity
                 first_term_W = self.inertia_w * individual.velocity[i]["W"]
                 second_term_W = self.cognitive_w * r1 * (individual.best_layers[i].W - layer.W)
                 third_term_W = self.social_w * r2 * (self.best_individual.layers[i].W - layer.W)
-                individual.velocity[i]["W"] = first_term_W + second_term_W + third_term_W
+                new_velocity = first_term_W + second_term_W + third_term_W
+                individual.velocity[i]["W"] = np.clip(new_velocity, self.min_v, self.max_v)
 
                 # Bias weight velocity
                 first_term_w0 = self.inertia_w * individual.velocity[i]["w0"]
                 second_term_w0 = self.cognitive_w * r1 * (individual.best_layers[i].w0 - layer.w0)
                 third_term_w0 = self.social_w * r2 * (self.best_individual.layers[i].w0 - layer.w0)
-                individual.velocity[i]["w0"] = first_term_w0 + second_term_w0 + third_term_w0
+                new_velocity = first_term_w0 + second_term_w0 + third_term_w0
+                individual.velocity[i]["w0"] = np.clip(new_velocity, self.min_v, self.max_v)
 
                 # Update layer weights with velocity
                 individual.layers[i].W += individual.velocity[i]["W"]
@@ -93,17 +96,17 @@ def evolve(self, X, y, n_generations):
 
         self._initialize_population()
 
-        # The best individual of the population is initialized to the first individual
+        # The best individual of the population is initialized as the population's first individual
         self.best_individual = copy.copy(self.population[0])
 
         for epoch in range(n_generations):
             for individual in self.population:
-                # Update the NN weights by calculating new velocity
+                # Calculate new velocity and update the NN weights
                 self._update_weights(individual)
                 # Calculate the fitness of the updated individual
                 self._calculate_fitness(individual)
 
-                # If the current fitness is higher than the previous highest
+                # If the current fitness is higher than the individual's previous highest
                 # => update the individual's best layer setup
                 if individual.fitness > individual.highest_fitness:
                     individual.best_layers = copy.copy(individual.layers)
@@ -117,6 +120,5 @@ def evolve(self, X, y, n_generations):
                                                                             self.best_individual.id,
                                                                             self.best_individual.fitness,
                                                                             100*float(self.best_individual.accuracy)))
-
         return self.best_individual