Benchmark function #264

Merged

merged 39 commits into develop from Div12345:benchmark
Jan 2, 2023
Changes from 21 commits
Commits (39)
5852b40
benchmark init commit
Div12345 Feb 9, 2022
1e82974
minor doc string corr
Div12345 Feb 9, 2022
d583119
fixing a missing line in download.py
Div12345 Feb 9, 2022
3051a85
Update benchmark.py
Div12345 Feb 9, 2022
5a1dc44
Update utils.py
Div12345 Feb 9, 2022
aaf6e3b
adding a print statement for visibility in output
Div12345 Feb 9, 2022
abed66d
remove verbose, debug params; add evaluations save folder params
Div12345 Feb 9, 2022
4df5351
update run.py to use benchmark function
Div12345 Feb 9, 2022
d320910
correct analyze statement
Div12345 Feb 9, 2022
db01510
including, excluding datasets functionality
Div12345 Mar 6, 2022
f061c58
some descript edits
Div12345 Mar 6, 2022
3bbb028
Update benchmark.py
Div12345 Mar 6, 2022
faf0925
correct include datasets and return dataframe
Mar 9, 2022
ee835ff
correct n_jobs in run.py
Mar 9, 2022
0a161a7
Apply suggestions from code review
Div12345 Apr 20, 2022
0860dc8
whatsnew and remove MI result combo
Div12345 Nov 14, 2022
4fcd322
Merge branch 'develop' into benchmark
Div12345 Nov 14, 2022
94ee23f
Adding select_paradigms
Div12345 Nov 14, 2022
1c2f134
rectify select_paradigms implementation
Div12345 Nov 14, 2022
d72bdd7
Merge branch 'develop' into benchmark
sylvchev Dec 31, 2022
5415bb5
fix error when select_paradigms is None
Dec 31, 2022
b97c5ab
add benchmark to __init__ for direct call
Dec 31, 2022
c31903e
fix overwriting results for different paradigms, add printing results
Jan 1, 2023
2b060a9
unittest for benchmark
Jan 1, 2023
1de3dc4
fix docstring and error msg, remove unused code
Jan 1, 2023
c9f8dae
remove unwanted print
Jan 1, 2023
556d6f5
fix warning for dataframe
Jan 1, 2023
b59e9ea
abstractproperty is deprecated since 3.3
Jan 1, 2023
0e10c2f
fix doc typo, add is_valid to fake paradigms
Jan 1, 2023
2083c8d
update whatsnew
Jan 1, 2023
304396a
add an example for benchmark
Jan 2, 2023
a4512ce
update readme, correct typos, add link to wiki
Jan 2, 2023
ddd854e
fix typos, introduce example
Jan 2, 2023
e3f43d0
add link to wiki in dataset documentation
Jan 2, 2023
2494618
fix typos, rename force to overwrite, select_paradigms to paradigms
Jan 2, 2023
0ae71e4
fix refactoring typo
Jan 2, 2023
b4bdd46
fix refactoring typo 2
Jan 2, 2023
6611801
fix refactoring typo 3
Jan 2, 2023
9db00e1
fix example typo
Jan 2, 2023
2 changes: 1 addition & 1 deletion docs/source/whats_new.rst
@@ -18,7 +18,7 @@ Develop branch
Enhancements
~~~~~~~~~~~~

- None
- Adding a comprehensive benchmarking function (:gh:`264` by `Divyesh Narayanan`_)

Bugs
~~~~
2 changes: 1 addition & 1 deletion moabb/analysis/__init__.py
@@ -19,7 +19,7 @@ def analyze(results, out_path, name="analysis", plot=False):

    Given a results dataframe, generates a folder with
    results and a dataframe of the exact data used to generate those results,
    aswell as introspection to return information on the computer
    as well as introspection to return information on the computer

    parameters
    ----------
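For context on the `analyze` entry point touched by this one-word fix, a minimal usage sketch follows; the dataset, pipeline, and output folder are illustrative choices, not part of this PR.

```python
# Hedged sketch: run one small evaluation, then pass the resulting dataframe to
# analyze(), which writes the results, the exact data behind them, and platform
# information into out_path. Dataset, pipeline and paths are illustrative.
from pyriemann.estimation import Covariances
from pyriemann.tangentspace import TangentSpace
from sklearn.discriminant_analysis import LinearDiscriminantAnalysis as LDA
from sklearn.pipeline import make_pipeline

from moabb.analysis import analyze
from moabb.datasets import BNCI2014001
from moabb.evaluations import WithinSessionEvaluation
from moabb.paradigms import LeftRightImagery

dataset = BNCI2014001()
dataset.subject_list = dataset.subject_list[:1]  # keep the example run short

pipelines = {"TS+LDA": make_pipeline(Covariances("oas"), TangentSpace(), LDA())}
evaluation = WithinSessionEvaluation(
    paradigm=LeftRightImagery(), datasets=[dataset], overwrite=True
)
results = evaluation.process(pipelines)

analyze(results, out_path="./analysis/", name="analysis", plot=False)
```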
200 changes: 200 additions & 0 deletions moabb/benchmark.py
@@ -0,0 +1,200 @@
import logging

import mne
import pandas as pd
import yaml

from moabb import paradigms as moabb_paradigms
from moabb.analysis import analyze
from moabb.evaluations import (
    CrossSessionEvaluation,
    CrossSubjectEvaluation,
    WithinSessionEvaluation,
)
from moabb.pipelines.utils import generate_paradigms, parse_pipelines_from_directory


log = logging.getLogger(__name__)


def benchmark(
    pipelines="./pipelines/",
    evaluations=None,
    select_paradigms=None,
    results="./results/",
    force=False,
    output="./",
    n_jobs=-1,
    plot=False,
    contexts=None,
    include_datasets=None,
    exclude_datasets=None,
):
    """Run benchmarks for selected pipelines and datasets.

    Pipelines are loaded from the saved pipeline configurations, which also determine
    the associated paradigms. It is possible to include or exclude specific datasets
    and to choose the type of evaluation.

    If particular paradigms are given through select_paradigms, only the pipelines
    corresponding to those paradigms will be run.

    To define include_datasets or exclude_datasets, you could start from the full
    dataset list, using for example the following code:

    > # Choose your paradigm
    > p = moabb.paradigms.SSVEP()
    > # Get the class names
    > print(p.datasets)
    > # Get the dataset code
    > print([d.code for d in p.datasets])

    Parameters
    ----------
    pipelines: str
        Folder containing the pipelines to evaluate
    evaluations: list of str
        Restricts the types of evaluations to be run. By default, all 3 base types
        are run. Can be a list of these elements:
        ["WithinSession", "CrossSession", "CrossSubject"]
    select_paradigms: list of str
        Restricts the paradigms on which evaluations should be run.
        Can be a list of these elements: ['LeftRightImagery', 'MotorImagery',
        'FilterBankSSVEP', 'SSVEP', 'FilterBankMotorImagery']
    results: str
        Folder to store the results
    force: bool
        If True, overwrite cached results and force re-evaluation of the pipelines
    output: str
        Folder to store the analysis results
    n_jobs: int
        Number of jobs to run in parallel
    plot: bool
        Plot results after computing
    contexts: str
        File path to a context.yml file that describes the context parameters.
        If None, all defaults are assumed. Must contain an entry for every
        paradigm described in the pipelines.
    include_datasets: list of str or Dataset objects
        Datasets to include in the benchmark run. By default, all suitable datasets
        are used. Specifying both include_datasets and exclude_datasets raises an
        error.
    exclude_datasets: list of str or Dataset objects
        Datasets to exclude from the benchmark run.

    Returns
    -------
    df_eval: pd.DataFrame
        Dataframe with the combined results of all evaluations and paradigms.
    """
    # set logs
    if evaluations is None:
        evaluations = ["WithinSession", "CrossSession", "CrossSubject"]

    eval_type = {
        "WithinSession": WithinSessionEvaluation,
        "CrossSession": CrossSessionEvaluation,
        "CrossSubject": CrossSubjectEvaluation,
    }

    mne.set_log_level(False)
    # logging.basicConfig(level=logging.WARNING)

    pipeline_configs = parse_pipelines_from_directory(pipelines)

    context_params = {}
    if contexts is not None:
        with open(contexts, "r") as cfile:
            context_params = yaml.load(cfile.read(), Loader=yaml.FullLoader)

    paradigms = generate_paradigms(pipeline_configs, context_params, log)
    print(paradigms)
    if select_paradigms is not None:
        paradigms = {p: paradigms[p] for p in select_paradigms}

    log.debug(f"The paradigms being run are {paradigms}")

    if len(context_params) == 0:
        for paradigm in paradigms:
            context_params[paradigm] = {}

    # Looping over the evaluations to be done
    df_eval = []
    for evaluation in evaluations:
        eval_results = dict()
        for paradigm in paradigms:
            # get the context
            log.debug(f"{paradigm}: {context_params[paradigm]}")
            p = getattr(moabb_paradigms, paradigm)(**context_params[paradigm])
            # List of dataset class instances
            datasets = p.datasets
            d = _inc_exc_datasets(datasets, include_datasets, exclude_datasets)
            log.debug(
                f"Datasets considered for {paradigm} paradigm {[dt.code for dt in d]}"
            )
            print(f"Datasets considered for {paradigm} paradigm {[dt.code for dt in d]}")

            # If len(d) == 0, warn that no suitable datasets were left once the
            # include/exclude arguments were applied
            if len(d) == 0:
                log.debug("No datasets matched the include_datasets or exclude_datasets")
                print("No datasets matched the include_datasets or exclude_datasets")

            context = eval_type[evaluation](
                paradigm=p,
                datasets=d,
                random_state=42,
                hdf5_path=results,
                n_jobs=n_jobs,
                overwrite=force,
            )
            paradigm_results = context.process(pipelines=paradigms[paradigm])
            eval_results[f"{paradigm}"] = paradigm_results
            paradigm_results["paradigm"] = f"{paradigm}"
            paradigm_results["evaluation"] = f"{evaluation}"
            df_eval.append(paradigm_results)

        # Combining the FilterBank and the base paradigm results
        combine_paradigms = ["SSVEP"]
        for p in combine_paradigms:
            if f"FilterBank{p}" in eval_results.keys() and f"{p}" in eval_results.keys():
                eval_results[f"{p}"] = pd.concat(
                    [eval_results[f"{p}"], eval_results[f"FilterBank{p}"]]
                )
                del eval_results[f"FilterBank{p}"]

        for paradigm_result in eval_results.values():
            analyze(paradigm_result, output, plot=plot)

    return pd.concat(df_eval)


def _inc_exc_datasets(datasets, include_datasets, exclude_datasets):
    d = list()
    if include_datasets is not None:
        # Check whether the inputs are dataset codes (strings)
        if isinstance(include_datasets[0], str):
            # Map from dataset codes to class instances
            datasets_codes = [d.code for d in datasets]
            # Get the indices of the matching datasets
            for incdat in include_datasets:
                if incdat in datasets_codes:
                    d.append(datasets[datasets_codes.index(incdat)])
        else:
            # The case where the class instances have been given
            # can be passed on directly
            d = include_datasets
        if exclude_datasets is not None:
            raise AttributeError(
                "You cannot specify both include_datasets and exclude_datasets"
            )

    elif exclude_datasets is not None:
        d = datasets
        # If the inputs are not dataset codes (strings), they are expected to be
        # dataset class instances, so convert them to codes
        if not isinstance(exclude_datasets[0], str):
            exclude_datasets = [e.code for e in exclude_datasets]

        # Map from dataset codes to class instances
        datasets_codes = [d.code for d in datasets]
        for excdat in exclude_datasets:
            del d[datasets_codes.index(excdat)]
    else:
        d = datasets
    return d
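As a rough illustration of the new entry point above, here is a minimal usage sketch based on the signature in this version of the diff. The `./pipelines/` folder and the dataset code are placeholders, and later commits in this PR rename `select_paradigms` to `paradigms` and `force` to `overwrite`.

```python
# Minimal sketch, assuming ./pipelines/ contains at least one valid pipeline .yml
# whose paradigms include LeftRightImagery; the dataset code below is a placeholder
# taken from `[d.code for d in paradigm.datasets]`.
from moabb.benchmark import benchmark

results = benchmark(
    pipelines="./pipelines/",
    evaluations=["WithinSession"],
    select_paradigms=["LeftRightImagery"],
    include_datasets=["001-2014"],
    results="./results/",
    output="./benchmark_output/",
    n_jobs=-1,
    plot=False,
)

# The returned dataframe concatenates the per-paradigm results and carries the
# extra 'paradigm' and 'evaluation' columns added in the loop above.
print(results.head())
```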
1 change: 1 addition & 0 deletions moabb/datasets/download.py
@@ -219,6 +219,7 @@ def fs_get_file_list(article_id, version=None):
        return response
    else:
        url = fsurl + "/articles/{}/versions/{}".format(article_id, version)
        headers = {"Content-Type": "application/json"}
        request = fs_issue_request("GET", url, headers=headers)
        return request["files"]

123 changes: 123 additions & 0 deletions moabb/pipelines/utils.py
@@ -1,10 +1,21 @@
import importlib
import logging
import os
from collections import OrderedDict
from copy import deepcopy
from glob import glob

import numpy as np
import scipy.signal as scp
import yaml
from sklearn.base import BaseEstimator, TransformerMixin
from sklearn.pipeline import make_pipeline

from moabb.analysis.results import get_string_rep


log = logging.getLogger(__name__)


def create_pipeline_from_config(config):
"""Create a pipeline from a config file.
Expand Down Expand Up @@ -39,6 +50,118 @@ def create_pipeline_from_config(config):
return pipeline


def parse_pipelines_from_directory(dir_path):
    """
    Takes in the path to a directory with pipeline configuration files and returns a
    list of pipeline configurations.

    Parameters
    ----------
    dir_path: str
        Path to directory containing pipeline config .yml or .py files

    Returns
    -------
    pipeline_configs: list of dict
        Generated pipeline config dictionaries. Each entry has the structure:
        'name': string
        'pipeline': sklearn.BaseEstimator
        'paradigms': list of class names that are compatible with said pipeline
    """
    assert os.path.isdir(
        os.path.abspath(dir_path)
    ), "Given pipeline path {} is not valid".format(dir_path)

    # get list of config files
    yaml_files = glob(os.path.join(dir_path, "*.yml"))

    pipeline_configs = []
    for yaml_file in yaml_files:
        with open(yaml_file, "r") as _file:
            content = _file.read()

        # load config
        config_dict = yaml.load(content, Loader=yaml.FullLoader)
        ppl = create_pipeline_from_config(config_dict["pipeline"])
        pipeline_configs.append(
            {
                "paradigms": config_dict["paradigms"],
                "pipeline": ppl,
                "name": config_dict["name"],
            }
        )

    # we can do the same for pipelines defined in Python files
    python_files = glob(os.path.join(dir_path, "*.py"))

    for python_file in python_files:
        spec = importlib.util.spec_from_file_location("custom", python_file)
        foo = importlib.util.module_from_spec(spec)
        spec.loader.exec_module(foo)

        pipeline_configs.append(foo.PIPELINE)
    return pipeline_configs


def generate_paradigms(pipeline_configs, context=None, logger=log):
    """
    Takes in a list of pipeline configurations as returned by
    parse_pipelines_from_directory and returns a dictionary of unique paradigms with
    all pipeline configurations compatible with each paradigm.

    Parameters
    ----------
    pipeline_configs:
        list of pipeline configurations
    context: dict
        Context parameters, i.e. a dict mapping paradigm names to the keyword
        arguments read from a context file (empty by default)
    logger:
        logger

    Returns
    -------
    paradigms: dict
        Dictionary of dictionaries with the unique paradigms and the configuration
        of the pipelines compatible with each paradigm
    """
    context = context or {}
    paradigms = OrderedDict()
    for config in pipeline_configs:

        if "paradigms" not in config.keys():
            logger.error("{} must have a 'paradigms' key.".format(config))
            continue

        # iterate over paradigms

        for paradigm in config["paradigms"]:

            # check if it is in the context parameters file
            if len(context) > 0:
                if paradigm not in context.keys():
                    logger.debug(context)
                    logger.warning(
                        "Paradigm {} not in context file {}".format(
                            paradigm, context.keys()
                        )
                    )

            if isinstance(config["pipeline"], BaseEstimator):
                pipeline = deepcopy(config["pipeline"])
            else:
                logger.error(config["pipeline"])
                raise (ValueError("pipeline must be a sklearn estimator"))

            # append the pipeline in the paradigm list
            if paradigm not in paradigms.keys():
                paradigms[paradigm] = {}

            # FIXME: names are not unique
            logger.debug("Pipeline: \n\n {} \n".format(get_string_rep(pipeline)))
            paradigms[paradigm][config["name"]] = pipeline

    return paradigms


class FilterBank(BaseEstimator, TransformerMixin):
    """Apply a given identical pipeline over a bank of filters.

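To make `parse_pipelines_from_directory` and `generate_paradigms` more concrete, here is a self-contained sketch that writes a single illustrative pipeline config to a temporary folder and runs both helpers. The YAML content is an assumption that follows the `name`/`paradigms`/`pipeline` structure documented above, not a file shipped with this PR.

```python
# Hedged sketch: one illustrative .yml config, parsed and then grouped by paradigm.
import tempfile
from pathlib import Path

from moabb.pipelines.utils import generate_paradigms, parse_pipelines_from_directory

PIPELINE_YML = """
name: CSP + LDA
paradigms:
  - LeftRightImagery
pipeline:
  - name: CSP
    from: mne.decoding
    parameters:
      n_components: 8
  - name: LinearDiscriminantAnalysis
    from: sklearn.discriminant_analysis
"""

with tempfile.TemporaryDirectory() as tmpdir:
    (Path(tmpdir) / "csp_lda.yml").write_text(PIPELINE_YML)

    # list of {'name', 'pipeline', 'paradigms'} dicts, one per config file
    configs = parse_pipelines_from_directory(tmpdir)
    # {'LeftRightImagery': {'CSP + LDA': <sklearn Pipeline>}}
    paradigms = generate_paradigms(configs)
    print(paradigms)
```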