journal_robustness.py redone, now is sensitive to seeds and plots

2021-05-23 13:46:21 +02:00 · 2021-05-23 13:46:21 +02:00 · 55bdd706b6
commit 55bdd706b6
parent 74d618774a
4 changed files with 70 additions and 34 deletions
--- a/README.md
+++ b/README.md
@ -19,6 +19,15 @@
 - [ ] Adjust Self Training so that it favors second order fixpoints-> Second order test implementation (?)
 - [ ] Barplot over clones -> how many become a fixpoint cs how many diverge per noise level
 - [ ] Box-Plot of Avg. Distance of clones from parent
 # Future Todos:
 - [ ] Find a statistik over weight space that provides a better init function
 - [ ] Test this init function on a mnist classifier - just for the lolz
 - [ ] 
 ---
 ## Notes: 
--- a/journal_basins.py
+++ b/journal_basins.py
@ -28,7 +28,7 @@ def mean_invariate_manhattan_distance(x, y):
    # distances of ascending values, ie. sum (abs(min1_X-min1_Y), abs(min2_X-min2Y) ...) / mean.  
    # Idea was to find weight sets that have same values but just in different positions, that would
    # make this distance 0.
-    return np.mean(list(map(l1, zip(sorted(x), sorted(y)))))
+    return np.mean(list(map(l1, zip(sorted(x.numpy()), sorted(y.numpy())))))
 def distance_matrix(nets, distance="MIM", print_it=True):
@ -212,19 +212,19 @@ if __name__ == "__main__":
    # Define number of runs & name:
    ST_runs = 1
    ST_runs_name = "test-27"
-    ST_steps = 1700
+    ST_steps = 2500
    ST_epochs = 2
    ST_log_step_size = 10
    # Define number of networks & their architecture
-    nr_clones = 5
+    nr_clones = 10
-    ST_population_size = 1
+    ST_population_size = 3
    ST_net_hidden_size = 2
    ST_net_learning_rate = 0.04
    ST_name_hash = random.getrandbits(32)
    print(f"Running the Spawn experiment:")
-    for noise_factor in range(2,3):
+    for noise_factor in [1]:
        SpawnExperiment(
            population_size=ST_population_size,
            log_step_size=ST_log_step_size,
--- a/journal_robustness.py
+++ b/journal_robustness.py
@ -1,7 +1,10 @@
 import pickle
 import pandas as pd
 import torch
 import random
 import copy
 import numpy as np
 from pathlib import Path
 from tqdm import tqdm
@ -14,6 +17,8 @@ from functionalities_test import is_identity_function, is_zero_fixpoint, test_fo
 from network import Net
 from torch.nn import functional as F
 from visualization import plot_loss, bar_chart_fixpoints
 import seaborn as sns
 from matplotlib import pyplot as plt
 def prng():
@ -31,7 +36,6 @@ class RobustnessComparisonExperiment:
    @staticmethod
    def apply_noise(network, noise: int):
        """ Changing the weights of a network to values + noise """
        for layer_id, layer_name in enumerate(network.state_dict()):
            for line_id, line_values in enumerate(network.state_dict()[layer_name]):
                for weight_id, weight_value in enumerate(network.state_dict()[layer_name][line_id]):
@ -77,41 +81,48 @@ class RobustnessComparisonExperiment:
    def populate_environment(self):
        loop_population_size = tqdm(range(self.population_size))
        nets = []
        if self.synthetic:
            ''' Either use perfect / hand-constructed fixpoint ... '''
            net_name = f"net_{str(0)}_synthetic"
            net = Net(self.net_input_size, self.net_hidden_size, self.net_out_size, net_name)
            net.apply_weights(generate_perfekt_synthetic_fixpoint_weights())
            nets.append(net)
        else:
            for i in loop_population_size:
                loop_population_size.set_description("Populating experiment %s" % i)
            if self.synthetic:
                ''' Either use perfect / hand-constructed fixpoint ... '''
                net_name = f"net_{str(i)}_synthetic"
                net = Net(self.net_input_size, self.net_hidden_size, self.net_out_size, net_name)
                net.apply_weights(generate_perfekt_synthetic_fixpoint_weights())
            else:
                ''' .. or use natural approach to train fixpoints from random initialisation. '''
                net_name = f"net_{str(i)}"
                net = Net(self.net_input_size, self.net_hidden_size, self.net_out_size, net_name)
                for _ in range(self.epochs):
                    net.self_train(self.ST_steps, self.log_step_size, self.net_learning_rate)
                nets.append(net)
        return nets
-    def test_robustness(self, print_it=True):
+    def test_robustness(self, print_it=True, noise_levels=10, seeds=10):
-        avg_time_to_vergence = [[0 for _ in range(10)] for _ in range(len(self.id_functions))]
+        assert (len(self.id_functions) == 1 and seeds > 1) or (len(self.id_functions) > 1 and seeds == 1)
-        avg_time_as_fixpoint = [[0 for _ in range(10)] for _ in range(len(self.id_functions))]
+        is_synthetic = True if len(self.id_functions) > 1 and seeds == 1 else False
-        avg_loss_per_application = [[0 for _ in range(10)] for _ in range(len(self.id_functions))]
+        avg_time_to_vergence = [[0 for _ in range(noise_levels)] for _ in
-        noise_range = range(10)
+                                range(seeds if is_synthetic else len(self.id_functions))]
        avg_time_as_fixpoint = [[0 for _ in range(noise_levels)] for _ in
                                range(seeds if is_synthetic else len(self.id_functions))]
        row_headers = []
        data_pos = 0
        # This checks wether to use synthetic setting with multiple seeds
        #   or multi network settings with a singlee seed
-        for i, fixpoint in enumerate(self.id_functions):
+        df = pd.DataFrame(columns=['seed', 'noise_level', 'application_step', 'absolute_loss'])
        for i, fixpoint in enumerate(self.id_functions): #1 / n
            row_headers.append(fixpoint.name)
-            loss_per_application = [[0 for _ in range(10)] for _ in range(len(self.id_functions))]
+            for seed in range(seeds): #n / 1
-            for seed in range(10):
+                for noise_level in range(noise_levels):
-                for noise_level in noise_range:
+                    self_application_steps = 1
                    clone = Net(fixpoint.input_size, fixpoint.hidden_size, fixpoint.out_size,
                                f"{fixpoint.name}_clone_noise10e-{noise_level}")
                    clone.load_state_dict(copy.deepcopy(fixpoint.state_dict()))
-                    rand_noise = prng() * pow(10, -noise_level)
+                    rand_noise = prng() * pow(10, -noise_level) #n / 1
                    clone = self.apply_noise(clone, rand_noise)
                    while not is_zero_fixpoint(clone) and not is_divergent(clone):
@ -128,12 +139,24 @@ class RobustnessComparisonExperiment:
                        clone_weight_post_application = clone.input_weight_matrix()
                        target_data_post_application = clone.create_target_weights(clone_weight_post_application)
-                        loss_per_application[seed][noise_level] = (F.l1_loss(target_data_pre_application,
+                        absolute_loss = F.l1_loss(target_data_pre_application, target_data_post_application).item()
                                                                             target_data_post_application))
                        setting = i if is_synthetic else seed
                        df.loc[data_pos] = [setting, noise_level, self_application_steps, absolute_loss]
                        data_pos += 1
                        self_application_steps += 1
        # calculate the average:
        df = df.replace([np.inf, -np.inf], np.nan)
        df = df.dropna()
        # sns.set(rc={'figure.figsize': (10, 50)})
        bx = sns.catplot(data=df[df['absolute_loss'] < 1], y='absolute_loss', x='application_step', kind='box',
                         col='noise_level', col_wrap=3, showfliers=False)
        plt.show()
        if print_it:
-            col_headers = [str(f"10e-{d}") for d in noise_range]
+            col_headers = [str(f"10e-{d}") for d in range(noise_levels)]
            print(f"\nAppplications steps until divergence / zero: ")
            print(tabulate(avg_time_to_vergence, showindex=row_headers, headers=col_headers, tablefmt='orgtbl'))
--- a/requirements.txt
+++ b/requirements.txt
@ -1,7 +1,11 @@
-torch
+torch~=1.8.1+cpu
-tqdm
+tqdm~=4.60.0
-numpy==1.19.0
+numpy~=1.20.3
-matplotlib
+matplotlib~=3.4.2
 sklearn
 scipy
-tabulate
+tabulate~=0.8.9
 scikit-learn~=0.24.2
 pandas~=1.2.4
 seaborn~=0.11.1