From bbebf17c1d782a6a5d88bfe83a6421161e3215a9 Mon Sep 17 00:00:00 2001
From: Peter Sharpe
Date: Thu, 7 Mar 2024 15:06:58 -0500
Subject: [PATCH] sync at point of supercloud run

---
 neuralfoil/gen2_architecture/main.py          |  46 ++++-
 ...pute_kulfan_parameter_covariance_matrix.py |  36 ++++
 .../train_blind_neural_network.py             | 165 ++++++++++--------
 .../training_data/generate_xfoil_data.py      |   4 +-
 .../generate_xfoil_data_multiprocessing.py    | 164 +++++++++++++++++
 .../training_data/load_data.py                |  10 +-
 .../training_data/supercloud_generate_data.sh |   2 +-
 7 files changed, 340 insertions(+), 87 deletions(-)
 create mode 100644 training/gen2_architecture/optimal_sensor_placement/compute_kulfan_parameter_covariance_matrix.py
 create mode 100644 training/gen2_architecture/training_data/generate_xfoil_data_multiprocessing.py

diff --git a/neuralfoil/gen2_architecture/main.py b/neuralfoil/gen2_architecture/main.py
index 39fb852..78d90d1 100644
--- a/neuralfoil/gen2_architecture/main.py
+++ b/neuralfoil/gen2_architecture/main.py
@@ -124,15 +124,43 @@ def net(x: np.ndarray):
     y_unflipped[:, 3] *= -1  # CM
     y_unflipped[:, 4] = y_flipped[:, 5]  # switch Top_Xtr with Bot_Xtr
     y_unflipped[:, 5] = y_flipped[:, 4]  # switch Bot_Xtr with Top_Xtr
-    y_unflipped[:, 6:6 + 72] = y_flipped[:, 6 + 72: 6 + 2 * 72]  # switch upper_bl_theta with lower_bl_theta
-    y_unflipped[:, 6 + 72: 6 + 2 * 72] = y_flipped[:, 6:6 + 72]  # switch lower_bl_theta with upper_bl_theta
+
+    # switch upper and lower Ret, H
+    y_unflipped[:, 6:6 + 32 * 2] = y_flipped[:, 6 + 32 * 3: 6 + 32 * 5]
+    y_unflipped[:, 6 + 32 * 3: 6 + 32 * 5] = y_flipped[:, 6:6 + 32 * 2]
+
+    # switch upper_bl_ue/vinf with lower_bl_ue/vinf
+    y_unflipped[:, 6 + 32 * 2: 6 + 32 * 3] = -1 * y_flipped[:, 6 + 32 * 5: 6 + 32 * 6]
+    y_unflipped[:, 6 + 32 * 5: 6 + 32 * 6] = -1 * y_flipped[:, 6 + 32 * 2: 6 + 32 * 3]
 
     ### Then, average the two outputs to get the "symmetric" result
     y_fused = (y + y_unflipped) / 2
     y_fused[:, 0] = _sigmoid(y_fused[:, 0])  # Analysis confidence, a binary variable
 
     # Unpack the neural network outputs
-    sqrt_Rex_approx = [((Data.bl_x_points[i] + 1e-2) / Re) ** 0.5 for i in range(Data.N)]
+    # sqrt_Rex_approx = [((Data.bl_x_points[i] + 1e-2) / Re) ** 0.5 for i in range(Data.N)]
+    # TODO
+
+    analysis_confidence = y_fused[:, 0]
+    CL = y_fused[:, 1] / 2
+    CD = np.exp((y_fused[:, 2] - 2) * 2)
+    CM = y_fused[:, 3] / 20
+    Top_Xtr = y_fused[:, 4]
+    Bot_Xtr = y_fused[:, 5]
+
+    upper_bl_ue_over_vinf = y_fused[:, 6 + Data.N * 2:6 + Data.N * 3]
+    lower_bl_ue_over_vinf = y_fused[:, 6 + Data.N * 5:6 + Data.N * 6]
+
+    upper_theta = (
+        (10 ** y_fused[:, 6: 6 + Data.N]) - 0.1
+    ) / (np.abs(upper_bl_ue_over_vinf) * Re)
+    upper_H = 2.6 * np.exp(y_fused[:, 6 + Data.N: 6 + Data.N * 2])
+
+    lower_theta = (
+        (10 ** y_fused[:, 6 + Data.N * 3: 6 + Data.N * 4]) - 0.1
+    ) / (np.abs(lower_bl_ue_over_vinf) * Re)
+    lower_H = 2.6 * np.exp(y_fused[:, 6 + Data.N * 4: 6 + Data.N * 5])
 
     results = {
         "analysis_confidence": y_fused[:, 0],
@@ -142,27 +170,27 @@ def net(x: np.ndarray):
         "Top_Xtr" : y_fused[:, 4],
         "Bot_Xtr" : y_fused[:, 5],
         **{
-            f"upper_bl_theta_{i}": np.exp(y_fused[:, 6 + i]) * sqrt_Rex_approx[i]
+            f"upper_bl_theta_{i}": upper_theta[:, i]
             for i in range(Data.N)
         },
         **{
-            f"upper_bl_H_{i}": np.exp(y_fused[:, 6 + Data.N + i]) * 2.6
+            f"upper_bl_H_{i}": upper_H[:, i]
             for i in range(Data.N)
         },
         **{
-            f"upper_bl_Cp_{i}": 1 - (1 + y_fused[:, 6 + 2 * Data.N + i]) ** 2
+            f"upper_bl_ue/vinf_{i}": upper_bl_ue_over_vinf[:, i]
             for i in range(Data.N)
         },
         **{
-            f"lower_bl_theta_{i}": np.exp(y_fused[:, 6 + 3 * Data.N + i]) * sqrt_Rex_approx[i]
+            f"lower_bl_theta_{i}": lower_theta[:, i]
             for i in range(Data.N)
         },
         **{
-            f"lower_bl_H_{i}": np.exp(y_fused[:, 6 + 4 * Data.N + i]) * 2.6
+            f"lower_bl_H_{i}": lower_H[:, i]
             for i in range(Data.N)
         },
         **{
-            f"lower_bl_Cp_{i}": 1 - (1 + y_fused[:, 6 + 5 * Data.N + i]) ** 2
+            f"lower_bl_ue/vinf_{i}": lower_bl_ue_over_vinf[:, i]
             for i in range(Data.N)
         },
     }
diff --git a/training/gen2_architecture/optimal_sensor_placement/compute_kulfan_parameter_covariance_matrix.py b/training/gen2_architecture/optimal_sensor_placement/compute_kulfan_parameter_covariance_matrix.py
new file mode 100644
index 0000000..a8b0f1a
--- /dev/null
+++ b/training/gen2_architecture/optimal_sensor_placement/compute_kulfan_parameter_covariance_matrix.py
@@ -0,0 +1,36 @@
+from load_data import df, Data
+import aerosandbox as asb
+import numpy as np
+
+kulfans_data = np.stack([
+    df[f"kulfan_{side}_{i}"]
+    for side in [
+        "upper",
+        "lower"
+    ]
+    for i in range(8)
+] + [
+    df["kulfan_LE_weight"],
+    df["kulfan_TE_thickness"]
+], axis=1)
+
+cov_data = np.cov(kulfans_data, rowvar=False)
+
+airfoil_database_path = asb._asb_root / "geometry" / "airfoil" / "airfoil_database"
+
+airfoil_database = [
+    asb.Airfoil(name=filename.stem).normalize().to_kulfan_airfoil()
+    for filename in airfoil_database_path.glob("*.dat")
+]
+
+kulfans_database = np.stack([
+    np.concatenate([
+        airfoil.upper_weights,
+        airfoil.lower_weights,
+        np.atleast_1d(airfoil.leading_edge_weight),
+        np.atleast_1d(airfoil.TE_thickness)
+    ])
+    for airfoil in airfoil_database
+], axis=0)
+
+cov_database = np.cov(kulfans_database, rowvar=False)
\ No newline at end of file
diff --git a/training/gen2_architecture/train_blind_neural_network.py b/training/gen2_architecture/train_blind_neural_network.py
index 90572cf..699a504 100644
--- a/training/gen2_architecture/train_blind_neural_network.py
+++ b/training/gen2_architecture/train_blind_neural_network.py
@@ -1,5 +1,4 @@
-import aerosandbox as asb
-import aerosandbox.numpy as np
+import numpy as np
 from pathlib import Path
 
 import sys, os
@@ -19,25 +18,29 @@
 N_inputs = len(df_train_inputs_scaled.columns)
 N_outputs = len(df_train_outputs_scaled.columns)
 
-cache_file = Path(__file__).parent / "nn-large.pth"
-
+cache_file = Path(__file__).parent / "nn-xxxlarge.pth"
+print("Cache file: ", cache_file)
 
 # Define the model
 class Net(torch.nn.Module):
     def __init__(self):
         super().__init__()
 
-        width = 256
+        width = 512
 
         self.net = torch.nn.Sequential(
             torch.nn.Linear(N_inputs, width),
             torch.nn.Tanh(),
+
+            torch.nn.Linear(width, width),
+            torch.nn.Tanh(),
             torch.nn.Linear(width, width),
             torch.nn.Tanh(),
             torch.nn.Linear(width, width),
             torch.nn.Tanh(),
             torch.nn.Linear(width, width),
             torch.nn.Tanh(),
+
             torch.nn.Linear(width, N_outputs),
         )
 
@@ -64,8 +67,14 @@ def forward(self, x: torch.Tensor):
         y_unflipped[:, 3] *= -1  # CM
         y_unflipped[:, 4] = y_flipped[:, 5]  # switch Top_Xtr with Bot_Xtr
         y_unflipped[:, 5] = y_flipped[:, 4]  # switch Bot_Xtr with Top_Xtr
-        y_unflipped[:, 6:6 + 72] = y_flipped[:, 6 + 72: 6 + 2 * 72]  # switch upper_bl_theta with lower_bl_theta
-        y_unflipped[:, 6 + 72: 6 + 2 * 72] = y_flipped[:, 6:6 + 72]  # switch lower_bl_theta with upper_bl_theta
+
+        # switch upper and lower Ret, H
+        y_unflipped[:, 6:6 + 32 * 2] = y_flipped[:, 6 + 32 * 3: 6 + 32 * 5]
+        y_unflipped[:, 6 + 32 * 3: 6 + 32 * 5] = y_flipped[:, 6:6 + 32 * 2]
+
+        # switch upper_bl_ue/vinf with lower_bl_ue/vinf
+        y_unflipped[:, 6 + 32 * 2: 6 + 32 * 3] = -1 * y_flipped[:, 6 + 32 * 5: 6 + 32 * 6]
+        y_unflipped[:, 6 + 32 * 5: 6 + 32 * 6] = -1 * y_flipped[:, 6 + 32 * 2: 6 + 32 * 3]
 
         ### Then, average the two outputs to get the "symmetric" result
         y_fused = (y + y_unflipped) / 2
@@ -74,7 +83,6 @@ def forward(self, x: torch.Tensor):
 
         return y_fused
 
-
 if __name__ == '__main__':
     device = torch.device('cuda') if torch.cuda.is_available() else torch.device('cpu')
     print(device)
@@ -93,15 +101,15 @@ def forward(self, x: torch.Tensor):
     scheduler = torch.optim.lr_scheduler.ReduceLROnPlateau(
         optimizer,
         factor=0.5,
-        patience=20,
+        patience=10,
         verbose=True,
-        min_lr=1e-6,
+        min_lr=0,
     )
 
     # Define the data loader
     print(f"Preparing data...")
 
-    batch_size = 1024
+    batch_size = 128
     train_inputs = torch.tensor(
         df_train_inputs_scaled.to_numpy(),
         dtype=torch.float32,
@@ -131,6 +139,53 @@ def forward(self, x: torch.Tensor):
         # num_workers=4,
     )
 
+    # Prepare the loss function
+    loss_weights = torch.ones(N_outputs, dtype=torch.float32).to(device)
+    loss_weights[0] *= 0.05  # Analysis confidence
+    loss_weights[1] *= 1  # CL
+    loss_weights[2] *= 2  # ln(CD)
+    loss_weights[3] *= 0.5  # CM
+    loss_weights[4] *= 0.25  # Top Xtr
+    loss_weights[5] *= 0.25  # Bot Xtr
+    loss_weights[6:] *= 1 / (32 * 6)  # Lower the weight on all boundary layer outputs
+
+
+    def loss_function(y_pred, y_data, return_individual_loss_components=False):
+        # For data with NaN, overwrite the data with the prediction. This essentially makes the model ignore NaN data,
+        # since the gradient of the loss with respect to parameters is zero when the data is NaN.
+        y_data = torch.where(
+            torch.isnan(y_data),
+            y_pred,
+            y_data
+        )
+
+        analysis_confidence_loss = torch.nn.functional.binary_cross_entropy(y_pred[:, 0], y_data[:, 0])
+        # other_loss_components = torch.mean(
+        #     (y_pred[:, 1:] - y_data[:, 1:]) ** 2,
+        #     dim=0
+        # )
+        other_loss_components = torch.mean(
+            torch.nn.functional.huber_loss(
+                y_pred[:, 1:], y_data[:, 1:],
+                reduction='none',
+                delta=1
+            ),
+            dim=0
+        )
+
+        unweighted_loss_components = torch.stack([
+            analysis_confidence_loss,
+            *other_loss_components
+        ], dim=0)
+        weighted_loss_components = unweighted_loss_components * loss_weights
+        loss = torch.sum(weighted_loss_components)
+
+        if return_individual_loss_components:
+            return weighted_loss_components
+        else:
+            return loss
+
+    # raise Exception
+
     print(f"Training...")
 
     unweighted_epoch_loss_components = torch.ones(N_outputs, dtype=torch.float32).to(device)
@@ -142,83 +197,53 @@ def forward(self, x: torch.Tensor):
         # Put the model in training mode
         net.train()
 
-        # Choose model weights for this epoch
-        loss_weights = torch.ones(N_outputs, dtype=torch.float32).to(device)
-        loss_weights[0] *= 0.05  # Analysis confidence
-        loss_weights[1] *= 1  # CL
-        loss_weights[2] *= 3  # ln(CD)
-        loss_weights[3] *= 0.5  # CM
-        loss_weights[4] *= 0.25  # Top Xtr
-        loss_weights[5] *= 0.25  # Bot Xtr
-        loss_weights[6:] *= 0.05  # Lower the weight on the boundary layer outputs
-
-        list_unweighted_batch_loss_components = []
+        loss_from_each_training_batch = []
 
-        for i, (x, y) in enumerate(tqdm(train_loader)):
+        for x, y_data in tqdm(train_loader):
             x = x.to(device)
-            y = y.to(device)
-
-            y_pred = net(x)
+            y_data = y_data.to(device)
 
-            y = torch.where(
-                torch.isnan(y),
-                y_pred,
-                y
+            loss = loss_function(
+                y_pred=net(x),
+                y_data=y_data
             )
 
-            unweighted_batch_loss_components = torch.mean(  # 1 per output
-                (y_pred - y) ** 2,
-                dim=0,
-            )
-            list_unweighted_batch_loss_components.append(unweighted_batch_loss_components)
-
-            batch_loss = torch.sum(loss_weights * unweighted_batch_loss_components)
-            reweighted_batch_loss = torch.sum(loss_weights * unweighted_batch_loss_components / unweighted_epoch_loss_components)
-
             optimizer.zero_grad()
-            # batch_loss.backward()
-            reweighted_batch_loss.backward()
+            loss.backward()
             optimizer.step()
 
-        unweighted_epoch_loss_components = torch.mean(torch.stack(list_unweighted_batch_loss_components, dim=0), dim=0).detach()
-        unweighted_epoch_loss = torch.sum(unweighted_epoch_loss_components, dim=0)
-        epoch_loss = torch.sum(loss_weights * unweighted_epoch_loss_components)
+            loss_from_each_training_batch.append(loss.detach())
 
-        # Evaluate the model
+        train_loss = torch.mean(torch.stack(loss_from_each_training_batch, dim=0), dim=0)
+
+        # Put the model in evaluation mode
         net.eval()
 
-        batch_losses = []
-        batch_residual_mae = []  # Residual mean absolute error (MAE, L1 norm) of each test batch
+        loss_components_from_each_test_batch = []
+        mae_from_each_test_batch = []
 
-        for i, (x, y) in enumerate(test_loader):
+        for i, (x, y_data) in enumerate(test_loader):
             with torch.no_grad():
                 x = x.to(device)
-                y = y.to(device)
+                y_data = y_data.to(device)
 
                 y_pred = net(x)
 
-                y_nonan = torch.where(
-                    torch.isnan(y),
-                    y_pred,
-                    y
+                loss_components = loss_function(
+                    y_pred=y_pred,
+                    y_data=y_data,
+                    return_individual_loss_components=True
                 )
 
-                loss = torch.mean(
-                    torch.sum(
-                        loss_weights *
-                        (y_pred - y_nonan) ** 2,
-                        dim=1
-                    ),
-                    dim=0
-                )
-                batch_losses.append(loss.item())
-                batch_residual_mae.append(
-                    torch.nanmean(torch.abs(y_pred - y_nonan), dim=0).cpu().detach().numpy()
+                loss_components_from_each_test_batch.append(loss_components)
+                mae_from_each_test_batch.append(
                    torch.nanmean(torch.abs(y_pred - y_data), dim=0)
                 )
 
-        test_loss = np.mean(batch_losses)
-        test_residual_mae = np.nanmean(np.stack(batch_residual_mae, axis=0), axis=0)
+        test_loss_components = torch.mean(torch.stack(loss_components_from_each_test_batch, dim=0), dim=0)
+        test_loss = torch.sum(test_loss_components)
+        test_residual_mae = torch.nanmean(torch.stack(mae_from_each_test_batch, dim=0), dim=0)
 
         labeled_maes = {
             "analysis_confidence": test_residual_mae[0],
@@ -229,7 +254,7 @@ def forward(self, x: torch.Tensor):
             "Bot_Xtr" : test_residual_mae[5],
         }
         print(
-            f"Epoch: {epoch} | Train Loss: {epoch_loss.item():.6g} | Test Loss: {test_loss.item():.6g} | "
+            f"Epoch: {epoch} | Train Loss: {train_loss.item():.6g} | Test Loss: {test_loss.item():.6g} | "
             + " | ".join(
                 [
                     f"{k}: {v:.6g}"
@@ -237,11 +262,11 @@ def forward(self, x: torch.Tensor):
                 ]
             )
         )
-        loss_argsort = torch.argsort(unweighted_epoch_loss_components, descending=True)
+        loss_argsort = torch.argsort(test_loss_components, descending=True)
         print(f"Loss contributors: ")
         for i in loss_argsort[:10]:
-            print(f"\t{df_train_outputs_scaled.columns[i]:25}: {unweighted_epoch_loss_components[i].item():.6g}")
+            print(f"\t{df_train_outputs_scaled.columns[i]:25}: {test_loss_components[i].item():.6g}")
 
-        scheduler.step(epoch_loss)
+        scheduler.step(train_loss)
 
         torch.save(net.state_dict(), cache_file)
diff --git a/training/gen2_architecture/training_data/generate_xfoil_data.py b/training/gen2_architecture/training_data/generate_xfoil_data.py
index 4780454..aea9c5e 100644
--- a/training/gen2_architecture/training_data/generate_xfoil_data.py
+++ b/training/gen2_architecture/training_data/generate_xfoil_data.py
@@ -88,7 +88,7 @@ def worker(csv_actor):
             slices,
             [1]
         ])
-        weights = np.diff(slices) # result is N random numbers in [0, 1] that sum to 1
+        weights = np.diff(slices)  # result is N random numbers in [0, 1] that sum to 1
 
         parent_airfoils = np.random.choice(airfoil_database, size=n_airfoils_to_combine, replace=True)
 
@@ -119,7 +119,7 @@ def worker(csv_actor):
         af = af.scale(1, np.random.lognormal(0, 0.25))
 
         deviations = np.random.multivariate_normal(
-            np.zeros_like(mean_database), # Not including, since we already have a linear combo of 3 airfoils
+            np.zeros_like(mean_database),  # Not including, since we already have a linear combo of 3 airfoils
             cov_database,
         )
 
diff --git a/training/gen2_architecture/training_data/generate_xfoil_data_multiprocessing.py b/training/gen2_architecture/training_data/generate_xfoil_data_multiprocessing.py
new file mode 100644
index 0000000..bce6a9f
--- /dev/null
+++ b/training/gen2_architecture/training_data/generate_xfoil_data_multiprocessing.py
@@ -0,0 +1,164 @@
+import multiprocessing as mp
+import csv
+import aerosandbox as asb
+import aerosandbox.numpy as np
+from typing import List
+import time
+import os
+from neuralfoil.gen2_architecture._basic_data_type import Data
+
+datafile = "data_xfoil_comp1-mp.csv"
+
+airfoil_database_path = asb._asb_root / "geometry" / "airfoil" / "airfoil_database"
+
+airfoil_database = [
+    asb.Airfoil(name=filename.stem).normalize().to_kulfan_airfoil()
+    for filename in airfoil_database_path.glob("*.dat")
+]
+
+### Compute the covariance matrix of airfoil shape parameters, for better data generation later
+kulfans_database = np.stack([
+    np.concatenate([
+        airfoil.upper_weights,
+        airfoil.lower_weights,
+        np.atleast_1d(airfoil.leading_edge_weight),
+        np.atleast_1d(airfoil.TE_thickness)
+    ])
+    for airfoil in airfoil_database
+], axis=0)
+mean_database = np.mean(kulfans_database, axis=0)
+cov_database = np.cov(kulfans_database, rowvar=False)
+
+
+class CSVActor:
+    def __init__(self, filename):
+        self.filename = filename
+
+    @staticmethod
+    def float_to_str(f: float) -> str:
+        if np.isnan(f):
+            return ""  # Polars will read this as a null value
+
+        s = f"{f:.8g}"
+
+        if len(s) > 2 and s[:2] == "0.":
+            s = s[1:]
+
+        if "." in s:
+            s = s.rstrip("0")
+
+        if s[-1] == ".":
+            s = s[:-1]
+
+        if s == "." or s == "" or s == "-0":
+            s = "0"
+
+        return s
+
+    def append_row(self, row: List[float]):
+
+        row = [self.float_to_str(item) for item in row]
+
+        with open(self.filename, 'a', newline='') as file:
+            writer = csv.writer(file)
+            writer.writerow(row)
+
+
+def worker(csv_actor):
+    print("Worker started.")
+    while True:
+
+        n_airfoils_to_combine = 3
+
+        slices = np.random.rand(n_airfoils_to_combine - 1)
+        slices = np.sort(slices)
+        slices = np.concatenate([
+            [0],
+            slices,
+            [1]
+        ])
+        weights = np.diff(slices)  # result is N random numbers in [0, 1] that sum to 1
+
+        parent_airfoils = np.random.choice(airfoil_database, size=n_airfoils_to_combine, replace=True)
+
+        af = asb.KulfanAirfoil(
+            name="Reconstructed Airfoil",
+            upper_weights=np.dot(
+                weights,
+                [parent_airfoil.upper_weights for parent_airfoil in parent_airfoils],
+                manual=True
+            ),
+            lower_weights=np.dot(
+                weights,
+                [parent_airfoil.lower_weights for parent_airfoil in parent_airfoils],
+                manual=True
+            ),
+            leading_edge_weight=np.dot(
+                weights,
+                [parent_airfoil.leading_edge_weight for parent_airfoil in parent_airfoils],
+                manual=True
+            ),
+            TE_thickness=np.dot(
+                weights,
+                [parent_airfoil.TE_thickness for parent_airfoil in parent_airfoils],
+                manual=True
+            )
+        )
+
+        af = af.scale(1, np.random.lognormal(0, 0.25))
+
+        deviations = np.random.multivariate_normal(
+            np.zeros_like(mean_database),  # Not including, since we already have a linear combo of 3 airfoils
+            cov_database,
+        )
+
+        # deviance = np.random.exponential(0.05)
+        af.upper_weights += deviations[:8]
+        af.lower_weights += deviations[8:16]
+        af.leading_edge_weight += deviations[16]
+        af.TE_thickness += deviations[17]
+
+        # if not af.as_shapely_polygon().is_valid:
+        #     continue
+
+        alphas = np.linspace(-15, 15, 7) + np.random.uniform(-2.5, 2.5) + 2.5 * np.random.randn()
+        Re = float(10 ** (5.5 + 1.5 * np.random.randn()))
+
+        n_crit = np.random.uniform(0, 18)
+        if np.random.rand() < 0.8:
+            xtr_upper = 1
+        else:
+            xtr_upper = np.random.uniform(0, 1)
+        if np.random.rand() < 0.8:
+            xtr_lower = 1
+        else:
+            xtr_lower = np.random.uniform(0, 1)
+
+        datas = Data.from_xfoil(
+            airfoil=af,
+            alphas=alphas,
+            Re=Re,
+            mach=0,
+            n_crit=n_crit,
+            xtr_upper=xtr_upper,
+            xtr_lower=xtr_lower,
+            timeout=30,
+            max_iter=200,
+            xfoil_command="/home/gridsan/pds/NeuralFoil/training/gen2_architecture/training_data/xfoil_supercloud"
+        )
+
+        for data in datas:
+            csv_actor.append_row(data.to_vector())
+
+
+if __name__ == '__main__':
+    pool = mp.Pool(mp.cpu_count())
+    n_procs = mp.cpu_count()
+    print(f"Running on {n_procs} processes.")
+
+    # csv_actor = CSVActor(filename=datafile)
+    #
+    # worker(csv_actor)
+
+    pool.map(worker, [CSVActor(filename=datafile)] * n_procs)
\ No newline at end of file
diff --git a/training/gen2_architecture/training_data/load_data.py b/training/gen2_architecture/training_data/load_data.py
index 6946581..b9af2b1 100644
--- a/training/gen2_architecture/training_data/load_data.py
+++ b/training/gen2_architecture/training_data/load_data.py
@@ -34,7 +34,7 @@
 c = pl.col("CD") <= 0
 
 print(
-    f"Eliminating {int(df.select(c).sum().to_numpy()[0, 0])} rows with CD <= 0..."
+    f"Nullifying {int(df.select(c).sum().to_numpy()[0, 0])} rows with CD <= 0..."
 )
 df = df.with_columns(
     [
@@ -53,7 +53,7 @@
     for i in range(Data.N)
 ])
 print(
-    f"Eliminating {int(df.select(c).sum().to_numpy()[0, 0])} rows with nonpositive boundary layer thetas..."
+    f"Nullifying {int(df.select(c).sum().to_numpy()[0, 0])} rows with nonpositive boundary layer thetas..."
 )
 df = df.with_columns(
     [
@@ -72,7 +72,7 @@
     for i in range(Data.N)
 ])
 print(
-    f"Eliminating {int(df.select(c).sum().to_numpy()[0, 0])} rows with H < 1 (non-physical BL)..."
+    f"Nullifying {int(df.select(c).sum().to_numpy()[0, 0])} rows with H < 1 (non-physical BL)..."
 )
 df = df.with_columns(
     [
@@ -94,7 +94,7 @@
     ], start=[])
 )
 print(
-    f"Eliminating {int(df.select(c).sum().to_numpy()[0, 0])} rows with non-physical edge velocities..."
+    f"Nullifying {int(df.select(c).sum().to_numpy()[0, 0])} rows with non-physical edge velocities..."
 )
 df = df.with_columns(
     [
@@ -110,7 +110,7 @@
 print("Dataset statistics:")
 print(df.describe())
 
-### Shuffle the training set
+### Shuffle the training set (deterministically)
 df = df.sample(
     fraction=1,
     with_replacement=False,
diff --git a/training/gen2_architecture/training_data/supercloud_generate_data.sh b/training/gen2_architecture/training_data/supercloud_generate_data.sh
index 2903d46..5af34ab 100644
--- a/training/gen2_architecture/training_data/supercloud_generate_data.sh
+++ b/training/gen2_architecture/training_data/supercloud_generate_data.sh
@@ -11,4 +11,4 @@ module unload anaconda
 module load anaconda/2023a
 
 # Run the script
-python -u ./generate_xfoil_data.py
\ No newline at end of file
+python -u ./generate_xfoil_data_multiprocessing.py
\ No newline at end of file
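
A note on the flip-and-average blocks in main.py and train_blind_neural_network.py: the model is evaluated once on the airfoil as given and once flipped upside-down; the flipped prediction's output channels are then mapped back into the original frame (CL and CM change sign, Top_Xtr/Bot_Xtr and the upper/lower boundary-layer blocks swap, and ue/vinf swaps with a sign change), and the two predictions are averaged so the surrogate is exactly symmetric under flipping. The numpy sketch below restates that index bookkeeping; it is an illustration, not code from the patch, and flip_inputs is a hypothetical stand-in for the input-side flip, which this diff does not show.

import numpy as np

N = 32  # boundary-layer points per surface (Data.N in the patch)
B = 6   # index of the first boundary-layer output channel

def flip_outputs(y: np.ndarray) -> np.ndarray:
    # Map outputs for the flipped airfoil back into the original frame.
    # Channels 0 (analysis confidence) and 2 (ln CD) are flip-symmetric and stay put.
    out = y.copy()
    out[:, 1] *= -1      # CL changes sign
    out[:, 3] *= -1      # CM changes sign
    out[:, 4] = y[:, 5]  # Top_Xtr <- Bot_Xtr
    out[:, 5] = y[:, 4]  # Bot_Xtr <- Top_Xtr
    # Swap the upper and lower (theta, H) blocks...
    out[:, B:B + 2 * N] = y[:, B + 3 * N:B + 5 * N]
    out[:, B + 3 * N:B + 5 * N] = y[:, B:B + 2 * N]
    # ...and swap the ue/vinf blocks with a sign flip, since the flow is mirrored.
    out[:, B + 2 * N:B + 3 * N] = -y[:, B + 5 * N:B + 6 * N]
    out[:, B + 5 * N:B + 6 * N] = -y[:, B + 2 * N:B + 3 * N]
    return out

def symmetric_net(net, x, flip_inputs):
    # Average the direct prediction with the mapped-back prediction on the flipped input.
    return 0.5 * (net(x) + flip_outputs(net(flip_inputs(x))))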
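
A note on the new output transforms in main.py: each raw network output is decoded with a fixed invertible map, so the implied target encodings (what the training targets must be transformed with) follow by inverting those maps algebraically. For instance, CD = exp((y - 2) * 2) means the network is trained on ln(CD) / 2 + 2, and the theta decode implies a target of log10(theta * |ue/vinf| * Re + 0.1). A sketch of both directions with a round-trip check; this is an illustration derived from the patch, not code in it.

import numpy as np

def decode_CD(y):  # as in the patch
    return np.exp((y - 2) * 2)

def encode_CD(CD):  # algebraic inverse: the implied training target
    return np.log(CD) / 2 + 2

def decode_theta(y, ue_over_vinf, Re):  # as in the patch
    return (10.0 ** y - 0.1) / (np.abs(ue_over_vinf) * Re)

def encode_theta(theta, ue_over_vinf, Re):  # algebraic inverse
    return np.log10(theta * np.abs(ue_over_vinf) * Re + 0.1)

assert np.isclose(decode_CD(encode_CD(0.01)), 0.01)
assert np.isclose(decode_theta(encode_theta(2e-4, 1.3, 1e6), 1.3, 1e6), 2e-4)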
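
A note on loss_function in train_blind_neural_network.py: substituting the prediction for NaN targets makes the masked entries contribute zero gradient through the Huber terms, since the Huber derivative vanishes at zero residual. One subtlety: the substituted prediction is not detached, so the binary-cross-entropy term may still pass gradient through its target argument for masked rows, which amounts to minimizing the entropy of those confidence predictions (nudging them toward 0 or 1); detaching the substitution sidesteps this and makes the masking exact for every term. A minimal sketch of that variant, with illustrative names and loss_weights built as in the patch:

import torch
import torch.nn.functional as F

def masked_loss(y_pred: torch.Tensor, y_data: torch.Tensor,
                loss_weights: torch.Tensor) -> torch.Tensor:
    # Substitute a detached copy of the prediction for missing targets:
    # masked entries then contribute exactly zero gradient in every term.
    y_data = torch.where(torch.isnan(y_data), y_pred.detach(), y_data)

    bce = F.binary_cross_entropy(y_pred[:, 0], y_data[:, 0])  # analysis confidence
    huber = F.huber_loss(
        y_pred[:, 1:], y_data[:, 1:], reduction='none', delta=1.0
    ).mean(dim=0)  # one component per remaining output

    components = torch.cat([bce.unsqueeze(0), huber])
    return torch.sum(components * loss_weights)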
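
A note on the airfoil sampling scheme in worker() (in both XFoil data generators): differencing sorted cut points of [0, 1] yields weights distributed uniformly on the simplex, so the parent airfoils are blended by a uniformly random convex combination; shape deviations are then drawn from a zero-mean multivariate normal with the covariance estimated from the airfoil database, so perturbations respect the observed correlations between Kulfan parameters. A plain-numpy restatement with illustrative function names (the 18 columns are 8 upper + 8 lower weights, the LE weight, and the TE thickness):

import numpy as np

rng = np.random.default_rng()

def sample_simplex_weights(n: int) -> np.ndarray:
    # n - 1 sorted uniforms cut [0, 1] into n pieces -> uniform on the n-simplex
    cuts = np.concatenate([[0.0], np.sort(rng.random(n - 1)), [1.0]])
    return np.diff(cuts)

def sample_airfoil_params(param_matrix: np.ndarray,
                          cov: np.ndarray,
                          n_parents: int = 3) -> np.ndarray:
    # param_matrix: (n_airfoils, 18) array of Kulfan parameter vectors,
    # like kulfans_database in the patch. Returns one randomized 18-vector.
    w = sample_simplex_weights(n_parents)
    parents = param_matrix[rng.choice(len(param_matrix), size=n_parents, replace=True)]
    base = w @ parents  # convex combination of the parent airfoils
    deviation = rng.multivariate_normal(np.zeros(param_matrix.shape[1]), cov)
    return base + deviation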