Data augmentation #7

Open. Wants to merge 10 commits into base: main
4 changes: 2 additions & 2 deletions benchmark_utils/dataset.py
@@ -126,10 +126,10 @@ def split_windows_train_test(data_subject_test, data_subject_train):
"""
# Converting the windows dataset into numpy arrays
X_test = SliceDataset(data_subject_test, idx=0)
y_test = array(list(SliceDataset(data_subject_test, idx=1)))
y_test = array(list(SliceDataset(data_subject_test, idx=1)))-1

X_train = SliceDataset(data_subject_train, idx=0)
y_train = array(list(SliceDataset(data_subject_train, idx=1)))
y_train = array(list(SliceDataset(data_subject_train, idx=1)))-1

return {
"X_train": X_train,
Expand Down
59 changes: 35 additions & 24 deletions benchmark_utils/transformation.py
@@ -6,15 +6,21 @@
 # - getting requirements info when all dependencies are not installed.
 with safe_import_context() as import_ctx:
     import numpy as np
-    from numpy import concatenate
     from torch import as_tensor
     from skorch.helper import to_numpy
     from braindecode.augmentation import ChannelsDropout, SmoothTimeMask


+def gen_seed():
+    # Generator yielding successive integer seeds, for reproducibility
+    seed = 0
+    while True:
+        yield seed
+        seed += 1


 def channels_dropout(
-    X, y, n_augmentation, seed=0, probability=0.5, p_drop=0.2
+    X, y, n_augmentation, probability=0.5, p_drop=0.2
Member commented:

Suggested change:
-    X, y, n_augmentation, probability=0.5, p_drop=0.2
+    X, y, n_augmentation, probability=0.5, p_drop=0.2, seed=None
):
"""
Function to apply channels dropout to X raw data
@@ -27,8 +33,6 @@ def channels_dropout(
         The labels.
     n_augmentation : int
         Number of augmentations to apply, increasing the size of the dataset.
-    seed : int
-        Random seed.
     probability : float
         Probability of applying the transformation.
     p_drop : float
@@ -43,51 +47,58 @@
         The labels.

     """
-    transform = ChannelsDropout(probability=probability, random_state=seed)
+    seed = gen_seed()
Member commented:

Suggested change:
-    seed = gen_seed()
+    rng = np.random.RandomState(seed)

For a reproducible sequence of random numbers, the best approach is to use a random number generator: it samples a different number on each draw, but in a reproducible order.
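Note: the convention the reviewer is pointing at is scikit-learn's seed=None pattern. A minimal sketch of the difference it makes (check_random_state is sklearn's helper; the augment function and the Gaussian noise are illustrative stand-ins for the braindecode transforms):

    import numpy as np
    from sklearn.utils import check_random_state

    def augment(X, n_augmentation, seed=None):
        # One RNG for the whole call: every draw differs, but the full
        # sequence is reproducible when the same seed is passed again.
        rng = check_random_state(seed)  # None -> fresh RNG, int -> seeded RNG
        return [X + rng.randn(*X.shape) for _ in range(n_augmentation)]

    X = np.zeros((2, 3))
    run1 = augment(X, 3, seed=0)
    run2 = augment(X, 3, seed=0)
    assert all((a == b).all() for a, b in zip(run1, run2))  # reproducible
    assert not (run1[0] == run1[1]).all()                   # draws still differ

Re-seeding a fresh transform at every iteration, as gen_seed() does, also works, but it ties the draws to the counter values rather than to a single seeded stream.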

     X_augm = to_numpy(X)
     y_augm = y
-    for i in range(n_augmentation):
+    for _ in range(n_augmentation):
+        transform = ChannelsDropout(
+            probability=probability,
+            random_state=next(seed)
+        )
Member commented on lines +55 to +58:

Suggested change:
-        transform = ChannelsDropout(
-            probability=probability,
-            random_state=next(seed)
-        )
+        transform = ChannelsDropout(
+            probability=probability,
+            random_state=rng
+        )

         X_tr, _ = transform.operation(
             as_tensor(X).float(), None, p_drop=p_drop
         )

         X_tr = X_tr.numpy()
-        X_augm = concatenate((X_augm, X_tr))
-        y_augm = concatenate((y_augm, y))
+        X_augm = np.concatenate((X_augm, X_tr))
+        y_augm = np.concatenate((y_augm, y))

     return X_augm, y_augm
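Note: as a sanity check of what this hunk computes, each loop iteration appends one transformed copy of X, so the output holds (n_augmentation + 1) times the original trials. A hedged sketch, assuming channels_dropout accepts a plain array here (shapes illustrative):

    import numpy as np
    from benchmark_utils.transformation import channels_dropout

    X = np.random.randn(10, 4, 128)   # 10 trials, 4 channels, 128 samples
    y = np.zeros(10, dtype=int)       # dummy labels

    X_augm, y_augm = channels_dropout(X, y, n_augmentation=2)
    assert X_augm.shape == (30, 4, 128)  # original + 2 augmented copies
    assert y_augm.shape == (30,)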


 def smooth_timemask(
-    X, y, n_augmentation, sfreq, seed=0, probability=0.5, second=0.1
+    X, y, n_augmentation, sfreq, probability=0.8, second=0.2
Member commented:

Suggested change:
-    X, y, n_augmentation, sfreq, probability=0.8, second=0.2
+    X, y, n_augmentation, sfreq, probability=0.8, second=0.2, seed=None
):
"""
Function to apply smooth time mask to X raw data
and concatenate it to the original data.
"""

-    transform = SmoothTimeMask(
-        probability=probability,
-        mask_len_samples=int(sfreq * second),
-        random_state=seed,
-    )
+    seed_generator = gen_seed()
Member commented:

Suggested change:
-    seed_generator = gen_seed()
+    rng = np.random.RandomState(seed)

     X_torch = as_tensor(np.array(X)).float()
     y_torch = as_tensor(y).float()
-    param_augm = transform.get_augmentation_params(X_torch, y_torch)
-    mls = param_augm["mask_len_samples"]
-    msps = param_augm["mask_start_per_sample"]

     X_augm = to_numpy(X)
     y_augm = y

-    for i in range(n_augmentation):
+    mls = int(sfreq * second)
+    for _ in range(n_augmentation):
+        seed = next(seed_generator)
Member commented:

Suggested change:
-        seed = next(seed_generator)
+        transform = SmoothTimeMask(
+            probability=probability,
+            mask_len_samples=mls,
+            random_state=rng
+        )

+        param_augm = transform.get_augmentation_params(X_torch, y_torch)
+        mls = param_augm["mask_len_samples"]
+        msps = param_augm["mask_start_per_sample"]

         X_tr, _ = transform.operation(
             X_torch, None, mask_len_samples=mls, mask_start_per_sample=msps
         )

         X_tr = X_tr.numpy()
-        X_augm = concatenate((X_augm, X_tr))
-        y_augm = concatenate((y_augm, y))
+        X_augm = np.concatenate((X_augm, X_tr))
+        y_augm = np.concatenate((y_augm, y))

     return X_augm, y_augm
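Note: for intuition on the mask length, mls = int(sfreq * second), so the new default second=0.2 at, say, a 250 Hz sampling rate (illustrative) masks 50 time samples per trial:

    sfreq, second = 250.0, 0.2   # illustrative sampling rate, new default length
    mls = int(sfreq * second)    # mask_len_samples handed to SmoothTimeMask
    assert mls == 50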
32 changes: 23 additions & 9 deletions objective.py
@@ -2,14 +2,14 @@


 with safe_import_context() as import_ctx:
-    from numpy import array
+    import numpy as np
     from sklearn.dummy import DummyClassifier
     from sklearn.pipeline import make_pipeline
     from sklearn.pipeline import FunctionTransformer

     from sklearn.model_selection import train_test_split
     from sklearn.metrics import balanced_accuracy_score as BAS
+    from sklearn.metrics import accuracy_score

     from skorch.helper import SliceDataset, to_numpy
     from benchmark_utils.dataset import split_windows_train_test
@@ -31,6 +31,7 @@ class Objective(BaseObjective):
     parameters = {
         'evaluation_process, subject, subject_test, session_test': [
             ('intra_subject', 1, None, None),
+            ('inter_subject', None, 3, None),
         ],
     }

@@ -55,7 +56,9 @@ def set_data(self, dataset, sfreq):

         dataset = data_split_subject[str(self.subject)]
         X = SliceDataset(dataset, idx=0)
-        y = array(list(SliceDataset(dataset, idx=1)))
+        y = np.array(list(SliceDataset(dataset, idx=1)))-1
+        # we have to subtract 1 from the labels for compatibility reasons
+        # with the deep learning solvers (their classes must start at 0)
Member commented on lines +59 to +61:

By convention, we put comments before the code, not after.

Suggested change:
-        y = np.array(list(SliceDataset(dataset, idx=1)))-1
-        # we have to subtract 1 from the labels for compatibility reasons
-        # with the deep learning solvers (their classes must start at 0)
+        # we have to subtract 1 from the labels for compatibility reasons
+        # with the deep learning solvers (their classes must start at 0)
+        y = np.array(list(SliceDataset(dataset, idx=1)))-1


         # maybe we need a different process here for each subject

@@ -64,6 +67,8 @@ def set_data(self, dataset, sfreq):
             self.X_test, self.y_test = X_test, y_test

         elif self.evaluation_process == 'inter_subject':
+            # the evaluation process here is to leave one subject out:
+            # test on it and train on the rest of the subjects

             sujet_test = self.subject_test
             data_subject_test = data_split_subject[str(sujet_test)]
@@ -82,6 +87,8 @@ def set_data(self, dataset, sfreq):
             self.y_test = splitted_data['y_test']

         elif self.evaluation_process == 'inter_session':
+            # the evaluation process here is to leave one session out:
+            # test on it and train on the rest of the sessions

             data_subject = data_split_subject[str(self.subject)]
             data_split_session = data_subject.split('session')
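Note: a schematic of the leave-one-out logic these comments describe, with hypothetical subject keys (the real splits come from the MOABB/braindecode dataset objects):

    # Hypothetical mapping standing in for data_split_subject.
    data_split_subject = {"1": "windows_s1", "2": "windows_s2", "3": "windows_s3"}
    subject_test = "3"  # matches the ('inter_subject', None, 3, None) row above

    data_subject_test = data_split_subject[subject_test]
    data_subject_train = [
        data for subj, data in data_split_subject.items() if subj != subject_test
    ]
    # train on subjects 1 and 2, evaluate on the held-out subject 3

The inter_session branch is the same idea, with the sessions of a single subject in place of subjects.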
@@ -103,9 +110,9 @@ def set_data(self, dataset, sfreq):
         self.sfreq = sfreq

         return dict(
-            X_train=X_train, y_train=y_train,
-            X_test=X_test, y_test=y_test,
-            sfreq=sfreq,
+            X_train=self.X_train, y_train=self.y_train,
+            X_test=self.X_test, y_test=self.y_test,
+            sfreq=self.sfreq,
Member commented on lines 112 to +115:

set_data is not supposed to return anything, so this can be removed.
         )

     def evaluate_result(self, model):
@@ -125,9 +132,14 @@ def evaluate_result(self, model):
             value: error on the testing set.
         """

-        score_train = model.score(self.X_train, self.y_train)
-        score_test = model.score(self.X_test, self.y_test)
-        bl_acc = BAS(self.y_test, model.predict(self.X_test))
+        # compute the predictions once here, so that they are not
+        # recomputed for each score
+        y_pred_train = model.predict(self.X_train)
+        y_pred_test = model.predict(self.X_test)
+
+        score_train = accuracy_score(self.y_train, y_pred_train)
+        score_test = accuracy_score(self.y_test, y_pred_test)
+        bl_acc = BAS(self.y_test, y_pred_test)

         return dict(
             score_test=score_test,
@@ -161,6 +173,8 @@ def get_objective(self):
         sfreq: sampling frequency to allow filtering the data.
         """

+        X_train, X_test, y_train, y_test = self.get_split(self.X, self.y)
Member commented:

Does this work? I don't see how you can get the split here, but maybe I am missing something?

Collaborator (author) commented:

Sorry, I think I mixed up the branch named CV and this one, where I was beginning to add our work on cross-validation.

         return dict(
             X=self.X_train,
             y=self.y_train,
15 changes: 15 additions & 0 deletions solvers/CSPlda.py
@@ -15,8 +15,23 @@


class Solver(AugmentedBCISolver):
+    '''
+    You can choose an augmentation parameter from the following list:
+    - IdentityTransform
+    - ChannelsDropout
+    - SmoothTimeMask
+
+    Running the benchmark with -n set to n_augmentation, you will get
+    a curve of the solver's score with respect to the number of
+    augmentations, which corresponds to how many times the dataset
+    has been multiplied.
+    '''
name = "CSPLDA"
parameters = {
"augmentation": [
"SmoothTimeMask",
"ChannelsDropout",
],
Member commented on lines +31 to +34:

All the augmentations are passed through **AugmentedBCISolver.parameters.

Suggested change:
-        "augmentation": [
-            "SmoothTimeMask",
-            "ChannelsDropout",
-        ],

"n_components": [8],
**AugmentedBCISolver.parameters
}
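Note: benchopt expands a solver's parameters dict as a cross-product of its value lists, one run per combination (here merged with **AugmentedBCISolver.parameters, which is what the review above relies on). A rough sketch of the expansion:

    from itertools import product

    # Roughly how benchopt turns a solver's ``parameters`` dict into runs:
    parameters = {
        "augmentation": ["SmoothTimeMask", "ChannelsDropout"],
        "n_components": [8],
    }
    grid = [dict(zip(parameters, combo)) for combo in product(*parameters.values())]
    # [{'augmentation': 'SmoothTimeMask', 'n_components': 8},
    #  {'augmentation': 'ChannelsDropout', 'n_components': 8}]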
13 changes: 1 addition & 12 deletions solvers/MOABB.py
@@ -13,20 +13,9 @@
 class Solver(AugmentedBCISolver):
     name = "MOABBPipelines"
     parameters = {
+        # you can choose here any pipeline from Moabb
         "pipeline": [
             "AUGTangSVMGrid",
             "MDM",
             "MDMAug",
             "TangentSpaceSVMGrid",
             "COVCSPLDA",
             "FgMDM",
             "LogVarianceLDA",
             "DLCSPautoshLDA",
             "LogVarianceSVMgrid",
             "COVCSPSVMGrid",
             "TSElasticNetGrid",
             "TangentSpaceLR",
             "TRCSPLDA",
             "DUMMY",
         ],
         **AugmentedBCISolver.parameters
12 changes: 6 additions & 6 deletions solvers/ShallowFBCSPNet_augm_channeldrop.py
@@ -13,7 +13,7 @@
         SmoothTimeMask,
     )
     from braindecode.models import ShallowFBCSPNet
-    from numpy import linspace, pi
+    from numpy import linspace
Member commented:

Suggested change:
-    from numpy import linspace
+    import numpy as np
     from skorch.callbacks import LRScheduler


@@ -33,7 +33,7 @@ class Solver(BaseSolver):
"lr": [0.0625 * 0.01],
"weight_decay": [0],
"batch_size": [64],
"n_epochs": [4],
"n_epochs": [1],
"proba": [0.5],

}
@@ -96,25 +96,25 @@ def set_objective(self, X, y, sfreq):
                     mask_len_samples=int(sfreq * second),
                     random_state=seed,
                 )
-                for second in linspace(0.1, 2, 10)
+                for second in linspace(0.1, 2, 3)
Member commented:

Suggested change:
-                for second in linspace(0.1, 2, 3)
+                for second in np.linspace(0.1, 2, 3)

Member commented:

Why did you decrease the number of samples?

Collaborator (author) commented:

It was only to have faster results.
             ]

         elif self.augmentation == "ChannelDropout":
             transforms = [
                 ChannelsDropout(
                     probability=self.proba, p_drop=prob, random_state=seed
                 )
-                for prob in linspace(0, 1, 10)
+                for prob in linspace(0, 1, 3)
Member commented:

Suggested change:
-                for prob in linspace(0, 1, 3)
+                for prob in np.linspace(0, 1, 3)
             ]

         elif self.augmentation == "FTSurrogate":
             transforms = [
                 FTSurrogate(
                     probability=self.proba,
-                    phase_noise_magnitude=prob,
+                    phase_noise_magnitude=phase_freq,
                     random_state=seed,
                 )
-                for prob in linspace(0, 2 * pi, 10)
+                for phase_freq in linspace(0, 1, 3)
Member commented:

Suggested change:
-                for phase_freq in linspace(0, 1, 3)
+                for phase_freq in np.linspace(0, 1, 3)
             ]
         else:
             transforms = [IdentityTransform()]
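Note: for context on what this transforms list feeds into, braindecode can also apply such transforms batch-wise at training time instead of materialising augmented copies. A hedged sketch, assuming braindecode's AugmentedDataLoader and a stand-in tensor dataset:

    import torch
    from torch.utils.data import TensorDataset
    from braindecode.augmentation import AugmentedDataLoader, IdentityTransform

    # Stand-in dataset: 10 trials, 4 channels, 128 time samples.
    train_set = TensorDataset(
        torch.randn(10, 4, 128), torch.zeros(10, dtype=torch.long)
    )

    # Each batch is passed through the transforms on the fly, so the
    # dataset is never duplicated (unlike the concatenation approach in
    # benchmark_utils/transformation.py).
    transforms = [IdentityTransform()]
    loader = AugmentedDataLoader(train_set, transforms=transforms, batch_size=4)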
3 changes: 3 additions & 0 deletions solvers/TGSPSVM.py
@@ -19,6 +19,9 @@ class Solver(AugmentedBCISolver):

name = "TGSPSVM"
parameters = {
"augmentation": [
"SmoothTimeMask",
],
"covariances_estimator": ["oas"],
Member commented on lines +22 to 25:

Suggested change:
-        "augmentation": [
-            "SmoothTimeMask",
-        ],
         "covariances_estimator": ["oas"],
"tangentspace_metric": ["riemann"],
"svm_kernel": ["linear"],
Expand Down