README.md Update

Steffen Illium
2022-02-10 16:53:49 +01:00
parent 594bbaa3dd
commit 14768ffc0a
8 changed files with 134 additions and 18 deletions


@@ -1,6 +1,9 @@
# Bureaucratic Cohort Swarms
### (The Meta-Task Experience) | Deadline: 28.02.22
## Experiments
Data Exchange: [Google Drive Folder](***REMOVED***)
### Fixpoint Tests:
- [ ] Dropout Test
@@ -30,19 +33,29 @@
---
### Tasks for Steffen:
- [x] Sanity check:
- [x] Training with smaller GNs
  - Accuracy suffers considerably (_0.56_)
    ![image info](./figures/lesser_neurons_training_lineplot.png)
  - More SRNNs emerge
  - The dropout effect becomes stronger (diff without SRNN = _0.0_)
    ![image info](./figures/lesser_neurons_dropout_stacked_barplot.png)
- [x] Continue training -> 500 epochs?
- [ ] Adjust the loss weighting
- [x] Can neurons learn to multiply an input value by x?
| SRNN x*n 3 Neurons Identity_Func | SRNN x*n 4 Neurons Identity_Func |
|---------------------------------------------------|----------------------------------------------------|
| ![](./figures/sanity/sanity_3hidden_xtimesn.png) | ![](./figures/sanity/sanity_4hidden_xtimesn.png) |
| SRNN x*n 6 Neurons Other_Func | SRNN x*n 10 Neurons Other_Func |
| ![](./figures/sanity/sanity_6hidden_xtimesn.png) | ![](./figures/sanity/sanity_10hidden_xtimesn.png) |
- [ ] Training with smaller GNs
- [ ] Continue training -> 500 epochs?
- [x] Training without residual skip connections
  - Performs poorly:
    ![image info](./figures/no_res_training_lineplot.png)
    ![image info](./figures/no_res_dropout_stacked_barplot.png)
  - Behaves differently:
    Self-training is prioritized at first; the actual task then slowly comes through (see the sketch after this list):
| No residual skip connections, 8 neurons in SRNN, Alpha=100 | Residual skip connections, 8 neurons in SRNN, Alpha=100 |
|------------------------------------------------------------------------------------------|----------------------------------------------------------------------------------------------|
| ![LinePlot](./figures/res_no_res/mn_st_200_8_alpha_100_no_res_training_particle_type_lp.png) | ![image info](./figures/res_no_res/mn_st_200_8_alpha_100_training_particle_type_lp.png) |
| ![image info](./figures/res_no_res/mn_st_200_8_alpha_100_no_res_training_lineplot.png) | ![image info](./figures/res_no_res/mn_st_200_8_alpha_100_training_lineplot.png) |
- [ ] Test against a baseline dense network
  - [ ] with a comparable neuron count
  - [ ] with a comparable total weight count
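
For reference, a minimal sketch of what the `residual_skip` flag of `MetaNet` plausibly does in the forward pass. The actual implementation lives in the repository's network code, so the layer spacing and shapes here are assumptions for illustration only:

```python
import torch
from torch import nn

def forward_with_skips(x: torch.Tensor, layers: nn.ModuleList, residual_skip: bool = True):
    # Hypothetical sketch: re-add the running input every second layer
    # when residual skips are enabled.
    residual = x
    for i, layer in enumerate(layers):
        x = layer(x)
        if residual_skip and i % 2 == 1:
            x = x + residual
            residual = x
    return x
```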
@@ -56,4 +69,3 @@
- (Joking aside, this would be important for faster research)
<https://pytorch.org/docs/stable/sparse.html>
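
For a first impression of the linked API, a small self-contained example using standard `torch.sparse` calls (unrelated to this repository's code):

```python
import torch

# Build a mostly-zero matrix densely, then convert it to sparse COO format.
dense = torch.zeros(4, 4)
dense[0, 1] = 0.5
dense[3, 2] = -1.2
sparse = dense.to_sparse()  # stores only the two non-zero entries

# Sparse-dense matrix multiplication.
x = torch.randn(4, 1)
print(torch.sparse.mm(sparse, x))
```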
---


@@ -198,12 +198,13 @@ if __name__ == '__main__':
plotting = True
particle_analysis = True
as_sparse_network_test = True
- self_train_alpha = 100
+ self_train_alpha = 1
batch_train_beta = 1
data_path = Path('data')
data_path.mkdir(exist_ok=True, parents=True)
- run_path = Path('output') / 'mn_st_200_8_alpha_100'
+ run_path = Path('output') / 'mn_st_400_2_no_res'
model_path = run_path / '0000_trained_model.zip'
df_store_path = run_path / 'train_store.csv'
weight_store_path = run_path / 'weight_store.csv'
@@ -217,7 +218,7 @@ if __name__ == '__main__':
d = DataLoader(dataset, batch_size=BATCHSIZE, shuffle=True, drop_last=True, num_workers=WORKER)
interface = np.prod(dataset[0][0].shape)
- metanet = MetaNet(interface, depth=5, width=6, out=10, residual_skip=True).to(DEVICE)
+ metanet = MetaNet(interface, depth=5, width=6, out=10, residual_skip=False).to(DEVICE)
meta_weight_count = sum(p.numel() for p in next(metanet.particles).parameters())
loss_fn = nn.CrossEntropyLoss()
@@ -249,7 +250,7 @@ if __name__ == '__main__':
batch_x, batch_y = batch_x.to(DEVICE), batch_y.to(DEVICE)
y = metanet(batch_x)
# loss = loss_fn(y, batch_y.unsqueeze(-1).to(torch.float32))
- loss = loss_fn(y, batch_y.to(torch.long))
+ loss = loss_fn(y, batch_y.to(torch.long)) * batch_train_beta
loss.backward()
# Adjust learning weights
@@ -312,7 +313,7 @@ if __name__ == '__main__':
plot_training_result(df_store_path)
if particle_analysis:
plot_training_particle_types(df_store_path)
+ exit()
if particle_analysis:
model_path = next(run_path.glob(f'*e{EPOCH}.tp'))
latest_model = torch.load(model_path, map_location=DEVICE).eval()
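
Reading this hunk together with the first one: `batch_train_beta` visibly scales the task loss, and by symmetry `self_train_alpha` presumably scales the self-train objective elsewhere in the script. A hedged sketch of that reading with dummy tensors (the alpha application is an assumption and is not shown in this diff):

```python
import torch
from torch import nn

# Sketch only; variable names follow the diff above.
batch_train_beta = 1.0
self_train_alpha = 1.0  # presumed to scale the self-train loss elsewhere

loss_fn = nn.CrossEntropyLoss()
y = torch.randn(8, 10, requires_grad=True)   # stand-in network output
batch_y = torch.randint(0, 10, (8,))         # stand-in labels

loss = loss_fn(y, batch_y.to(torch.long)) * batch_train_beta
loss.backward()  # gradients are scaled by beta as well
```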


@@ -0,0 +1,103 @@
import sys
from collections import defaultdict
from pathlib import Path
import platform

import pandas as pd
import torch.optim
from matplotlib import pyplot as plt
from torch import nn
from torch.utils.data import Dataset, DataLoader
import numpy as np
import seaborn as sns
from tqdm import trange
from tqdm.contrib import tenumerate

if platform.node() == 'CarbonX':
    debug = True
    print("@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@")
    print("@ Warning, Debugging Config !!!!!! @")
    print("@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@")
else:
    debug = False

try:
    # noinspection PyUnboundLocalVariable
    if __package__ is None:
        DIR = Path(__file__).resolve().parent
        sys.path.insert(0, str(DIR.parent))
        __package__ = DIR.name
    else:
        DIR = None
except NameError:
    DIR = None

import functionalities_test
from network import Net


class MultiplyByXTaskDataset(Dataset):
    """Synthetic regression task: map a scalar drawn from N(0, 1) to input * x."""

    def __init__(self, x=0.23, length=int(5e5)):
        super().__init__()
        self.length = length
        self.x = x
        self.prng = np.random.default_rng()

    def __len__(self):
        return self.length

    def __getitem__(self, _):
        ab = self.prng.normal(size=(1,)).astype(np.float32)
        return ab, ab * self.x


if __name__ == '__main__':
    net = Net(5, 1, 1)
    multiplication_target = 0.03
    loss_fn = nn.MSELoss()
    optimizer = torch.optim.SGD(net.parameters(), lr=0.008, momentum=0.9)

    train_frame = pd.DataFrame(columns=['Epoch', 'Batch', 'Metric', 'Score'])

    dataset = MultiplyByXTaskDataset(x=multiplication_target, length=1000000)
    dataloader = DataLoader(dataset=dataset, batch_size=8000)
    for epoch in trange(30):
        mean_batch_loss = []
        mean_self_train_loss = []
        for batch, (batch_x, batch_y) in tenumerate(dataloader):
            # Let the network replicate itself before every task batch.
            self_train_loss, _ = net.self_train(10, save_history=False)

            # Embed the scalar input into the last slot of the 5-wide
            # weight interface expected by Net.
            batch_x_emb = torch.zeros(batch_x.shape[0], 5)
            batch_x_emb[:, -1] = batch_x.squeeze()

            optimizer.zero_grad()  # clear any gradients accumulated so far
            y = net(batch_x_emb)
            loss = loss_fn(y, batch_y)
            loss.backward()
            optimizer.step()

            mean_batch_loss.append(loss.detach())
            mean_self_train_loss.append(self_train_loss.detach())

        train_frame.loc[train_frame.shape[0]] = dict(
            Epoch=epoch, Batch=batch,
            Metric='Self Train Loss', Score=np.average(mean_self_train_loss))
        train_frame.loc[train_frame.shape[0]] = dict(
            Epoch=epoch, Batch=batch,
            Metric='Batch Loss', Score=np.average(mean_batch_loss))

    counter = defaultdict(lambda: 0)
    functionalities_test.test_for_fixpoints(counter, nets=[net])
    print(dict(counter))

    # Probe the learned multiplier: the one-hot input places a 1 in the data
    # slot, so the output should approximate 1 * multiplication_target.
    sanity = net(torch.Tensor([0, 0, 0, 0, 1])).detach()
    print(sanity)
    print(abs(sanity - multiplication_target))

    sns.lineplot(data=train_frame, x='Epoch', y='Score', hue='Metric')
    outpath = Path('output') / 'sanity' / 'test.png'
    outpath.parent.mkdir(exist_ok=True, parents=True)
    plt.savefig(outpath)
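
A quick standalone check of the dataset contract above. This snippet is illustrative and not part of the commit; it assumes the `MultiplyByXTaskDataset` class defined above is importable:

```python
import numpy as np

# Each sample must satisfy target == input * x.
ds = MultiplyByXTaskDataset(x=0.03, length=4)
sample_x, sample_y = ds[0]
assert np.allclose(sample_y, sample_x * 0.03)
print(sample_x, sample_y)
```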

(4 binary figure files deleted, previews not shown; sizes: 117 KiB, 172 KiB, 90 KiB, 187 KiB)


@@ -296,7 +296,7 @@ class MetaCell(nn.Module):
self.name = name
self.interface = interface
self.weight_interface = 5
- self.net_hidden_size = 8
+ self.net_hidden_size = 2
self.net_ouput_size = 1
self.meta_weight_list = nn.ModuleList()
self.meta_weight_list.extend(
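
To get a feel for what shrinking `net_hidden_size` from 8 to 2 means per particle, a rough count under the assumption that each meta weight is a small `interface -> hidden -> 1` MLP (the real `Net` in the repository may have more layers, so treat the numbers as illustrative scaling only):

```python
from torch import nn

def particle_param_count(interface=5, hidden=8, out=1):
    # Assumed two-layer shape; only meant to illustrate the scaling.
    mlp = nn.Sequential(nn.Linear(interface, hidden), nn.Linear(hidden, out))
    return sum(p.numel() for p in mlp.parameters())

print(particle_param_count(hidden=8))  # 57 parameters per particle
print(particle_param_count(hidden=2))  # 15 parameters per particle
```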