NeuroTechX
diff --git a/‎.pre-commit-config.yaml
+1-1 b/‎.pre-commit-config.yaml
+1-1
diff --git a/‎docs/source/api/datasets.rst
+4 b/‎docs/source/api/datasets.rst
+4
diff --git a/‎docs/source/images/Dreyer_clf_scores_vs_subj_info/4_selected_subjects.png
70.6 KB b/‎docs/source/images/Dreyer_clf_scores_vs_subj_info/4_selected_subjects.png
70.6 KB
diff --git a/‎docs/source/images/Dreyer_clf_scores_vs_subj_info/all_subjects.png
104 KB b/‎docs/source/images/Dreyer_clf_scores_vs_subj_info/all_subjects.png
104 KB
diff --git a/‎docs/source/whats_new.rst
+2-1 b/‎docs/source/whats_new.rst
+2-1
diff --git a/‎examples/advanced_examples/plot_dreyer_clf_scores_vs_subj_info.py
+164 b/‎examples/advanced_examples/plot_dreyer_clf_scores_vs_subj_info.py
+164
diff --git a/‎moabb/datasets/__init__.py
+1 b/‎moabb/datasets/__init__.py
+1
diff --git a/‎moabb/datasets/download.py
+47 b/‎moabb/datasets/download.py
+47
@@ -79,7 +79,7 @@ repos:
     hooks:
       - id: codespell
         args:
-          - --ignore-words-list=assertIn,additionals,alle,alot,bund,currenty,datas,farenheit,falsy,fo,haa,hass,iif,incomfort,ines,ist,nam,nd,pres,pullrequests,resset,rime,ser,serie,te,technik,ue,unsecure,withing,zar,crate
+          - --ignore-words-list=assertIn,additionals,alle,alot,bund,currenty,datas,farenheit,falsy,fo,haa,hass,iif,incomfort,ines,ist,nam,nd,pres,pullrequests,resset,rime,ser,serie,te,technik,ue,unsecure,withing,zar,crate,Perfomances,Aline
           - --skip="./.*,*.csv,*.json,*.ambr"
           - --quiet-level=2
         exclude_types: [ csv, json, svg, pdf ]
 
@@ -15,6 +15,10 @@ Motor Imagery Datasets
     BNCI2015_001
     BNCI2015_004
     Cho2017
+    Dreyer2023
+    Dreyer2023A
+    Dreyer2023B
+    Dreyer2023C
     Lee2019_MI
     GrosseWentrup2009
     Ofner2017
 
@@ -17,12 +17,14 @@ Develop branch  - 1.2.1
 
 Enhancements
 ~~~~~~~~~~~~
+- Adding new motor imagery dataset, Dreyer2023 (:gh:`404` by `Sara Sedlar`_, `Sylvain Chevallier`_ and `Bruno Aristimunha`_)
 - Reordering the examples in the documentation (:gh:`807` by `Bruno Aristimunha`_)
 - Creating the meta information for the BIDS converted datasets (:gh:`688` by `Bruno Aristimunha`_)
 
 
 Bugs
 ~~~~
+- Fix caching issue with incomplete results (:gh:`715` by `Sylvain Chevallier`_)
 
 API changes
 ~~~~~~~~~~~
@@ -57,7 +59,6 @@ Bugs
 - Fixing the dataset details for bids conversion (:gh:`698` by `Bruno Aristimunha`_)
 - Fixing unit issue and lack of montage with :class:`moabb.datasets.Rodrigues2017`, :class:`moabb.datasets.Rodrigues2017`, :class:`moabb.datasets.BaseCastillos2023`,  :class:`moabb.datasets.BaseCastillos2023`,  :class:`moabb.datasets.Huebner2018`,  :class:`moabb.datasets.Cattan2019_PHMD`, :class:`moabb.datasets.Ofner2017`  (:gh:`700`  `Bruno Aristimunha`_)
 - Fix t-test permutation tests (:gh:`684` and :gh:`709` by `Gregoire Cattan`_, `Anton Andreev`_, `Marco Congedo`_ and `Bruno Aristimunha`_)
-- Fix caching issue with incomplete results (:gh:`715` by `Sylvain Chevallier`_)
 
 
 API changes
 
@@ -0,0 +1,164 @@
+"""
+===============================================
+Example of analysis of the Dreyer2023A dataset.
+===============================================
+
+This example shows how to plot Dreyer2023A Left-Right Imagery ROC AUC scores
+obtained with CSP+LDA pipeline versus demographic information of the examined
+subjects (gender and age) and experimenters (gender).
+
+To reduce computational time, the example is provided for four subjects.
+
+"""
+
+# Authors: Sara Sedlar <[email protected]>
+#          Sylvain Chevallier <[email protected]>
+# License: BSD (3-clause)
+
+import matplotlib.patches as mpatches
+import matplotlib.pyplot as plt
+import seaborn as sb
+from pyriemann.estimation import Covariances
+from pyriemann.spatialfilters import CSP
+from sklearn.discriminant_analysis import LinearDiscriminantAnalysis as LDA
+from sklearn.pipeline import make_pipeline
+
+from moabb.datasets import Dreyer2023A
+from moabb.evaluations import WithinSessionEvaluation
+from moabb.paradigms import MotorImagery
+
+
+########################################################################################
+# 1. Defining dataset, selecting subject for analysis and getting data
+dreyer2023 = Dreyer2023A()
+dreyer2023.subject_list = [1, 5, 7, 35]
+dreyer2023.get_data()
+########################################################################################
+# 2. Defining MotorImagery paradigm and CSP+LDA pipeline
+paradigm = MotorImagery()
+pipelines = {}
+pipelines["CSP+LDA"] = make_pipeline(
+    Covariances(estimator="oas"), CSP(nfilter=6), LDA(solver="lsqr", shrinkage="auto")
+)
+########################################################################################
+# 3. Within session evaluation of the pipeline
+evaluation = WithinSessionEvaluation(
+    paradigm=paradigm, datasets=[dreyer2023], suffix="examples", overwrite=False
+)
+results = evaluation.process(pipelines)
+
+########################################################################################
+# 4. Loading dataset info and concatenation with the obtained results
+info = dreyer2023.get_subject_info().rename(columns={"score": "score_MR"})
+# Creating a new column with subject's age
+info["Age"] = 2019 - info["Birth_year"]
+# Casting to int for merging
+info["subject"] = info["SUJ_ID"].astype(int)
+results["subject"] = results["subject"].astype(int)
+
+results_info = results.merge(info, on="subject", how="left")
+
+########################################################################################
+########################################################################################
+# 5.1 Plotting subject AUC ROC scores vs subject's gender
+fig, ax = plt.subplots(nrows=2, ncols=2, facecolor="white", figsize=[16, 8], sharey=True)
+fig.subplots_adjust(wspace=0.0, hspace=0.5)
+sb.boxplot(
+    data=results_info, y="score", x="SUJ_gender", ax=ax[0, 0], palette="Set1", width=0.3
+)
+sb.stripplot(
+    data=results_info,
+    y="score",
+    x="SUJ_gender",
+    ax=ax[0, 0],
+    palette="Set1",
+    linewidth=1,
+    edgecolor="k",
+    size=3,
+    alpha=0.3,
+    zorder=1,
+)
+ax[0, 0].set_title("AUC ROC scores vs. subject gender")
+ax[0, 0].set_xticklabels(["Man", "Woman"])
+ax[0, 0].set_ylabel("ROC AUC")
+ax[0, 0].set_xlabel(None)
+ax[0, 0].set_ylim(0.3, 1)
+########################################################################################
+# 5.2 Plotting subject AUC ROC scores vs subjects's age per gender
+sb.regplot(
+    data=results_info[results_info["SUJ_gender"] == 1][["score", "Age"]].astype(
+        "float32"
+    ),
+    y="score",
+    x="Age",
+    ax=ax[0, 1],
+    scatter_kws={"color": "#e41a1c", "alpha": 0.5},
+    line_kws={"color": "#e41a1c"},
+)
+sb.regplot(
+    data=results_info[results_info["SUJ_gender"] == 2][["score", "Age"]].astype(
+        "float32"
+    ),
+    y="score",
+    x="Age",
+    ax=ax[0, 1],
+    scatter_kws={"color": "#377eb8", "alpha": 0.5},
+    line_kws={"color": "#377eb8"},
+)
+ax[0, 1].set_title("AUC ROC scores vs. subject age per gender")
+ax[0, 1].set_ylabel(None)
+ax[0, 1].set_xlabel(None)
+ax[0, 1].legend(
+    handles=[
+        mpatches.Patch(color="#e41a1c", label="Man"),
+        mpatches.Patch(color="#377eb8", label="Woman"),
+    ]
+)
+########################################################################################
+# 5.3 Plotting subject AUC ROC scores vs experimenter's gender
+sb.boxplot(
+    data=results_info, y="score", x="EXP_gender", ax=ax[1, 0], palette="Set1", width=0.3
+)
+sb.stripplot(
+    data=results_info,
+    y="score",
+    x="EXP_gender",
+    ax=ax[1, 0],
+    palette="Set1",
+    linewidth=1,
+    edgecolor="k",
+    size=3,
+    alpha=0.3,
+    zorder=1,
+)
+ax[1, 0].set_title("AUC ROC scores vs. experimenter gender")
+ax[1, 0].set_xticklabels(["Man", "Woman"])
+ax[1, 0].set_ylabel("ROC AUC")
+ax[1, 0].set_xlabel(None)
+ax[1, 0].set_ylim(0.3, 1)
+########################################################################################
+# 5.4 Plotting subject AUC ROC scores vs subject's age
+sb.regplot(
+    data=results_info[["score", "Age"]].astype("float32"),
+    y="score",
+    x="Age",
+    ax=ax[1, 1],
+    scatter_kws={"color": "black", "alpha": 0.5},
+    line_kws={"color": "black"},
+)
+ax[1, 1].set_title("AUC ROC scores vs. subject age")
+ax[1, 1].set_ylabel(None)
+plt.show()
+########################################################################################
+# 5.5 Obtained results for four selected subjects correspond to the following figure.
+#
+# .. image:: ../images/Dreyer_clf_scores_vs_subj_info/4_selected_subjects.png
+#    :align: center
+#    :alt: 4_selected_subjects
+
+########################################################################################
+# Obtained results for all subjects correspond to the following figure.
+#
+# .. image:: ../images/Dreyer_clf_scores_vs_subj_info/all_subjects.png
+#    :align: center
+#    :alt: all_subjects
@@ -55,6 +55,7 @@
     CastillosCVEP40,
     CastillosCVEP100,
 )
+from .dreyer2023 import Dreyer2023, Dreyer2023A, Dreyer2023B, Dreyer2023C
 from .epfl import EPFLP300
 from .erpcore2021 import (
     ErpCore2021_ERN,
 
@@ -9,6 +9,7 @@
 import urllib
 from pathlib import Path
 
+import pandas as pd
 import requests
 from mne import get_config, set_config
 from mne.datasets.utils import _get_path
@@ -297,3 +298,49 @@ def download_if_missing(file_path, url, warn_missing=True):
         if warn_missing:
             warn(f"{file_path} not found. Downloading from {url}")
         urllib.request.urlretrieve(url, file_path)
+
+
+def create_metainfo_osf(osf_code: str) -> pd.DataFrame:
+    """Create a metadata file for a dataset stored on OSF."""
+    # OSF API base URL for the project's OSF storage
+
+    base_url = f"https://api.osf.io/v2/nodes/{osf_code}/files/osfstorage/"
+
+    files = []  # to collect (name, url) tuples
+    stack = [base_url + "?page[size]=100"]  # start with base URL, up to 100 results
+
+    while stack:
+        url = stack.pop()
+        try:
+            response = requests.get(url)
+            data = response.json()
+        except Exception as e:
+            print(f"Failed to fetch {url}: {e}")
+            continue
+
+        # Loop through items in this page
+        for item in data.get("data", []):
+            attrs = item.get("attributes", {})
+            kind = attrs.get("kind")
+            if kind == "folder":
+                # If folder, add its listing URL to stack for later retrieval
+                rel = item.get("relationships", {})
+                files_rel = rel.get("files", {}) if rel else {}
+                folder_url = files_rel.get("links", {}).get("related", {}).get("href")
+                if folder_url:
+                    # Append page[size]=100 to folder URL as well for efficiency
+                    stack.append(folder_url + "?page[size]=100")
+            elif kind == "file":
+                name = attrs.get("name")
+                download_url = item.get("links", {}).get("download")
+                if name and download_url:
+                    files.append((name, download_url))
+
+        # If there's a next page, add it to stack to continue pagination
+        next_url = data.get("links", {}).get("next")
+        if next_url:
+            stack.append(next_url)
+
+    metainfo = pd.DataFrame(files, columns=["filename", "url"])
+
+    return metainfo
Original file line number	Diff line number	Diff line change
`@@ -55,6 +55,7 @@`
`55`	`55`	`CastillosCVEP40,`
`56`	`56`	`CastillosCVEP100,`
`57`	`57`	`)`
	`58`	`+from .dreyer2023 import Dreyer2023, Dreyer2023A, Dreyer2023B, Dreyer2023C`
`58`	`59`	`from .epfl import EPFLP300`
`59`	`60`	`from .erpcore2021 import (`
`60`	`61`	`ErpCore2021_ERN,`