From 7fd26adf49e0adcf93d560376a2ce90d6e1b823c Mon Sep 17 00:00:00 2001
From: NicolasGensollen <nicolas.gensollen@gmail.com>
Date: Mon, 25 Sep 2023 12:33:24 +0200
Subject: [PATCH] refactor...

---
 .../pipelines/statistics_surface/__init__.py  |    2 +-
 .../pipelines/statistics_surface/_model.py    | 1099 -----------------
 .../pipelines/statistics_surface/_utils.py    |  322 +++++
 .../{statistics_surface_cli.py => cli.py}     |   46 +-
 ...istics_surface_pipeline.py => pipeline.py} |  137 +-
 .../statistics_surface_utils.py               |  276 -----
 .../statistics_surface/surfstat/__init__.py   |    4 +
 .../_surfstat.py}                             |   63 +-
 .../{_inputs.py => surfstat/_utils.py}        |   25 +-
 .../surfstat/models/__init__.py               |    3 +
 .../surfstat/models/_base.py                  |  234 ++++
 .../surfstat/models/_contrast.py              |   87 ++
 .../surfstat/models/_correlation.py           |   61 +
 .../surfstat/models/_factory.py               |   99 ++
 .../surfstat/models/_group.py                 |  118 ++
 .../surfstat/models/_utils.py                 |  152 +++
 .../surfstat/models/results/__init__.py       |    9 +
 .../surfstat/models/results/_base.py          |   77 ++
 .../surfstat/models/results/_plot.py          |   89 ++
 .../surfstat/models/results/_serialize.py     |  110 ++
 .../surfstat/models/results/_statistics.py    |  187 +++
 .../pipelines/test_run_pipelines_stats.py     |   26 +-
 .../statistics_surface/test_inputs.py         |   18 +-
 .../statistics_surface/test_model.py          |  163 ++-
 24 files changed, 1794 insertions(+), 1613 deletions(-)
 delete mode 100644 clinica/pipelines/statistics_surface/_model.py
 create mode 100644 clinica/pipelines/statistics_surface/_utils.py
 rename clinica/pipelines/statistics_surface/{statistics_surface_cli.py => cli.py} (76%)
 rename clinica/pipelines/statistics_surface/{statistics_surface_pipeline.py => pipeline.py} (66%)
 delete mode 100644 clinica/pipelines/statistics_surface/statistics_surface_utils.py
 create mode 100644 clinica/pipelines/statistics_surface/surfstat/__init__.py
 rename clinica/pipelines/statistics_surface/{clinica_surfstat.py => surfstat/_surfstat.py} (78%)
 rename clinica/pipelines/statistics_surface/{_inputs.py => surfstat/_utils.py} (88%)
 create mode 100644 clinica/pipelines/statistics_surface/surfstat/models/__init__.py
 create mode 100644 clinica/pipelines/statistics_surface/surfstat/models/_base.py
 create mode 100644 clinica/pipelines/statistics_surface/surfstat/models/_contrast.py
 create mode 100644 clinica/pipelines/statistics_surface/surfstat/models/_correlation.py
 create mode 100644 clinica/pipelines/statistics_surface/surfstat/models/_factory.py
 create mode 100644 clinica/pipelines/statistics_surface/surfstat/models/_group.py
 create mode 100644 clinica/pipelines/statistics_surface/surfstat/models/_utils.py
 create mode 100644 clinica/pipelines/statistics_surface/surfstat/models/results/__init__.py
 create mode 100644 clinica/pipelines/statistics_surface/surfstat/models/results/_base.py
 create mode 100644 clinica/pipelines/statistics_surface/surfstat/models/results/_plot.py
 create mode 100644 clinica/pipelines/statistics_surface/surfstat/models/results/_serialize.py
 create mode 100644 clinica/pipelines/statistics_surface/surfstat/models/results/_statistics.py

diff --git a/clinica/pipelines/statistics_surface/__init__.py b/clinica/pipelines/statistics_surface/__init__.py
index 0cdbd511ed..f00831fce2 100644
--- a/clinica/pipelines/statistics_surface/__init__.py
+++ b/clinica/pipelines/statistics_surface/__init__.py
@@ -1 +1 @@
-from . import statistics_surface_cli
+from . import cli
diff --git a/clinica/pipelines/statistics_surface/_model.py b/clinica/pipelines/statistics_surface/_model.py
deleted file mode 100644
index ffa32e07a2..0000000000
--- a/clinica/pipelines/statistics_surface/_model.py
+++ /dev/null
@@ -1,1099 +0,0 @@
-import abc
-import warnings
-from dataclasses import dataclass
-from functools import reduce
-from os import PathLike
-from pathlib import Path
-from string import Template
-from typing import Callable, Dict, List, Optional, Union
-
-import numpy as np
-import pandas as pd
-from brainstat.stats.SLM import SLM
-from brainstat.stats.terms import FixedEffect
-from nilearn.surface import Mesh
-
-from clinica.utils.stream import cprint
-
-MISSING_TERM_ERROR_MSG = Template(
-    "Term ${term} from the design matrix is not in the columns of the "
-    "provided TSV file. Please make sure that there is no typo."
-)
-
-
-def _print_clusters(model: SLM, threshold: float) -> None:
-    """This function prints the results related to total number
-    of clusters, as well as the significative clusters.
-
-    Parameters
-    ----------
-    model : brainstat.stats.SLM
-        Fitted SLM model.
-
-    threshold : float
-        Cluster defining threshold.
-    """
-    cprint("#" * 40)
-    cprint("After correction (Cluster-wise Correction for Multiple Comparisons): ")
-    df = model.P["clus"][0]
-    cprint(df)
-    cprint(f"Clusters found: {len(df)}")
-    cprint(
-        f"Significative clusters (after correction): {len(df[df['P'] <= threshold])}"
-    )
-
-
-def _check_column_in_df(df: pd.DataFrame, column: str) -> None:
-    """Checks if the provided column name is in the provided DataFrame.
-    Raises a ValueError if not.
-
-    Parameters
-    ----------
-    df : pd.DataFrame
-        DataFrame to analyze.
-
-    column : str
-        Name of the column to check.
-    """
-    if column not in df.columns:
-        raise ValueError(MISSING_TERM_ERROR_MSG.safe_substitute(term=column))
-
-
-def _categorical_column(df: pd.DataFrame, column: str) -> bool:
-    """Returns `True` if the column is categorical and `False` otherwise.
-
-    Parameters
-    ----------
-    df : pd.DataFrame
-        The DataFrame to analyze.
-
-    column : str
-        The name of the column to check.
-
-    Returns
-    -------
-    bool :
-        `True` if the column contains categorical values, `False` otherwise.
-    """
-    return not df[column].dtype.name.startswith("float")
-
-
-def _build_model(design_matrix: str, df: pd.DataFrame) -> FixedEffect:
-    """Build a brainstat model from the design matrix in
-    string format.
-
-    This function assumes that the design matrix is formatted
-    in the following way:
-
-        1 + factor_1 + factor_2 + ...
-
-    Or:
-
-        factor_1 + factor_2 + ...
-
-    in the latter case the intercept will be added automatically.
-
-    Parameters
-    ----------
-    design_matrix : str
-        Design matrix specified as a string.
-
-    df : pd.DataFrame
-        Subjects DataFrame.
-
-    Returns
-    -------
-    model : FixedEffect
-        BrainStats model.
-    """
-    if len(design_matrix) == 0:
-        raise ValueError("Design matrix cannot be empty.")
-    if "+" in design_matrix:
-        terms = [_.strip() for _ in design_matrix.split("+")]
-    else:
-        terms = [design_matrix.strip()]
-    model = []
-    for term in terms:
-        # Intercept is automatically included in brainstat
-        if term == "1":
-            continue
-        # Handles the interaction effects
-        if "*" in term:
-            sub_terms = [_.strip() for _ in term.split("*")]
-            model_term = reduce(
-                lambda x, y: x * y, [_build_model_term(_, df) for _ in sub_terms]
-            )
-        else:
-            model_term = _build_model_term(term, df)
-        model.append(model_term)
-    return reduce(lambda x, y: x + y, model)
-
-
-def _build_model_term(
-    term: str,
-    df: pd.DataFrame,
-    add_intercept: Optional[bool] = True,
-) -> FixedEffect:
-    """Builds a BrainStats model term from the subjects
-    DataFrame and a column name.
-
-    Parameters
-    ----------
-    term : str
-        The name of the column of the DataFrame to be used.
-
-    df : pd.DataFrame
-        The subjects DataFrame.
-
-    add_intercept : bool
-        If `True`, adds an intercept term.
-
-    Returns
-    -------
-    FixedEffect :
-        BrainStats model term.
-    """
-    return FixedEffect(df[term], add_intercept=add_intercept)
-
-
-class GLM:
-    """This class implements the functionalities common to all GLM models
-    used in the Clinica SurfaceStatistics pipeline.
-
-    Attributes
-    ----------
-    design : str
-        The design matrix specified in string format.
-        If this contains a "*", it will be interpreted as an interaction effect.
-
-    df : pd.DataFrame
-        The subjects DataFrame.
-
-    feature_label : str
-        The label used for building output filenames.
-
-    contrast : str
-        The contrast specified in string format.
-
-    fwhm : int, optional
-        The smoothing FWHM. This is used in the output file names.
-        Default=20.
-
-    threshold_uncorrected_pvalue : float, optional
-        The threshold to be used with uncorrected P-values. Default=0.001.
-
-    threshold_corrected_pvalue : float, optional
-        The threshold to be used with corrected P-values. Default=0.05.
-
-    cluster_threshold : float, optional
-        The threshold to be used to declare clusters as significant. Default=0.001.
-    """
-
-    def __init__(
-        self,
-        design: str,
-        df: pd.DataFrame,
-        feature_label: str,
-        contrast: str,
-        fwhm: Optional[int] = 20,
-        threshold_uncorrected_pvalue: Optional[float] = 0.001,
-        threshold_corrected_pvalue: Optional[float] = 0.05,
-        cluster_threshold: Optional[float] = 0.001,
-    ):
-        self._two_tailed = False
-        self._correction = ["fdr", "rft"]
-        self.df = df
-        self.feature_label = feature_label
-        self.fwhm = fwhm
-        self.threshold_uncorrected_pvalue = threshold_uncorrected_pvalue
-        self.threshold_corrected_pvalue = threshold_corrected_pvalue
-        self.cluster_threshold = cluster_threshold
-        self.results_ = None
-        self.slm_models_ = None
-        self.contrasts = dict()
-        self.filenames = dict()
-        self.model = _build_model(design, df)
-        self.build_contrasts(contrast)
-
-    @property
-    def contrast_names(self) -> List[str]:
-        if self.contrasts is not None:
-            return list(self.contrasts.keys())
-        return list()
-
-    @property
-    def results(self):
-        if self._is_fitted():
-            return self.results_
-
-    @abc.abstractmethod
-    def build_contrasts(self, contrast: str):
-        """Build the contrasts from the provided contrast in string format.
-
-        .. note::
-            This method needs to be implemented in subclasses.
-
-        Parameters
-        ----------
-        contrast : str
-            Contrast in string format.
-        """
-        pass
-
-    @abc.abstractmethod
-    def filename_root(self, contrast: str):
-        """Returns the output file name root for the provided contrast.
-
-        .. note::
-            This method needs to be implemented in subclasses.
-
-        Parameters
-        ----------
-        contrast : str
-            Contrast for which to get the output filename.
-        """
-        pass
-
-    def _is_fitted(self) -> bool:
-        return self.results_ is not None
-
-    def fit(
-        self, data: np.ndarray, surface: Dict, mask: Optional[np.ndarray] = None
-    ) -> None:
-        """Fit the GLM model instance.
-
-        Parameters
-        ----------
-        data : np.ndarray
-            The data on which to fit the GLM model.
-
-        surface : dict
-            The Brainstat surface on which to fit the GLM model.
-
-        mask : np.ndarray, optional
-            The mask to be used to mask the data. Default=None.
-        """
-        if mask is None:
-            mask = data[0, :] > 0
-        self.results_ = dict()
-        self.slm_models_ = dict()
-        for contrast_name, contrast in self.contrasts.items():
-            slm_model = SLM(
-                self.model,
-                contrast=contrast,
-                surf=surface,
-                mask=mask,
-                two_tailed=self._two_tailed,
-                correction=self._correction,
-                cluster_threshold=self.cluster_threshold,
-            )
-            cprint(
-                msg=f"Fitting the GLM model with contrast {contrast_name}...",
-                lvl="info",
-            )
-            slm_model.fit(data)
-            _print_clusters(slm_model, self.threshold_corrected_pvalue)
-            self.results_[contrast_name] = StatisticsResults.from_slm_model(
-                slm_model,
-                mask,
-                self.threshold_uncorrected_pvalue,
-                self.threshold_corrected_pvalue,
-            )
-            self.slm_models_[contrast_name] = slm_model
-
-    def save_results(self, output_dir: PathLike, method: Union[str, List[str]]) -> None:
-        """Save results to the provided output directory.
-
-        Parameters
-        ----------
-        output_dir : PathLike
-            The output directory in which to write the results.
-
-        method : str or List[str]
-            The method(s) to write the results.
-        """
-        if not self._is_fitted():
-            raise ValueError(
-                "GLM model needs to be fitted before accessing the results."
-            )
-        if isinstance(method, str):
-            method = [method]
-        for contrast, result in self.results_.items():
-            result_serializer = StatisticsResultsSerializer(
-                Path(output_dir) / Path(self.filename_root(contrast))
-            )
-            for meth in method:
-                result_serializer.save(result, meth)
-
-    def plot_results(
-        self,
-        output_dir: PathLike,
-        method: Union[str, List[str]],
-        mesh: Mesh,
-    ) -> None:
-        """Plot results to the provided directory.
-
-        Parameters
-        ----------
-        output_dir : PathLike
-            The output directory in which to write the plot files.
-
-        method : str or List[str]
-            The method(s) to make the plots.
-
-        mesh : nilearn.surface.Mesh
-            The mesh on which to plot the result data.
-        """
-        if not self._is_fitted():
-            raise ValueError(
-                "GLM model needs to be fitted before accessing the results."
-            )
-        if isinstance(method, str):
-            method = [method]
-        for contrast, result in self.results_.items():
-            plotter = StatisticsResultsPlotter(
-                Path(output_dir) / Path(self.filename_root(contrast)), mesh
-            )
-            for meth in method:
-                plotter.plot(result, meth)
-
-
-class CorrelationGLM(GLM):
-    """Class implementing the correlation type GLM model.
-
-    Attributes
-    ----------
-    See documentation for `GLM` class.
-
-    group_label : str, optional
-        The label to use for group GLM models. Default=None.
-    """
-
-    def __init__(
-        self,
-        design: str,
-        df: pd.DataFrame,
-        feature_label: str,
-        contrast: str,
-        group_label: Optional[str],
-        fwhm: Optional[int] = 20,
-        threshold_uncorrected_pvalue: Optional[float] = 0.001,
-        threshold_corrected_pvalue: Optional[float] = 0.05,
-        cluster_threshold: Optional[float] = 0.001,
-    ):
-        self.with_interaction = False
-        self.absolute_contrast_name = None
-        self.contrast_sign = None
-        self.group_label = group_label
-        super().__init__(
-            design,
-            df,
-            feature_label,
-            contrast,
-            fwhm,
-            threshold_uncorrected_pvalue,
-            threshold_corrected_pvalue,
-            cluster_threshold,
-        )
-
-    def build_contrasts(self, contrast: str):
-        """Build the contrast from the string specification.
-
-        Parameters
-        ----------
-        contrast : str
-            The contrast to build.
-        """
-        absolute_contrast_name = contrast
-        contrast_sign = "positive"
-        if contrast.startswith("-"):
-            absolute_contrast_name = contrast[1:].lstrip()
-            contrast_sign = "negative"
-        built_contrast = self.df[absolute_contrast_name]
-        if contrast_sign == "negative":
-            built_contrast *= -1
-        self.contrasts[contrast] = built_contrast
-        self.absolute_contrast_name = absolute_contrast_name
-        self.contrast_sign = contrast_sign
-
-    def filename_root(self, contrast: str):
-        """Build the filename root part from class attributes and provided contrast.
-
-        Parameters
-        ----------
-        contrast : str
-            The contrast to use for building the filename.
-        """
-        if contrast not in self.contrasts:
-            raise ValueError(f"Unknown contrast {contrast}.")
-        return (
-            f"group-{self.group_label}_correlation-{self.absolute_contrast_name}"
-            f"-{self.contrast_sign}_measure-{self.feature_label}_fwhm-{self.fwhm}"
-        )
-
-
-class GroupGLM(GLM):
-    """Class implementing group GLM models.
-
-    Attributes
-    ----------
-    See documentation for `GLM` class.
-
-    group_label : str, optional
-        The Label to use for group GLM models. Default="group".
-    """
-
-    def __init__(
-        self,
-        design: str,
-        df: pd.DataFrame,
-        feature_label: str,
-        contrast: str,
-        group_label: Optional[str] = "group",
-        fwhm: Optional[int] = 20,
-        threshold_uncorrected_pvalue: Optional[float] = 0.001,
-        threshold_corrected_pvalue: Optional[float] = 0.05,
-        cluster_threshold: Optional[float] = 0.001,
-    ):
-        self.with_interaction = False
-        self.group_label = group_label
-        super().__init__(
-            design,
-            df,
-            feature_label,
-            contrast,
-            fwhm,
-            threshold_uncorrected_pvalue,
-            threshold_corrected_pvalue,
-            cluster_threshold,
-        )
-
-    def build_contrasts(self, contrast: str):
-        """Build the contrast from the string specification.
-
-        Parameters
-        ----------
-        contrast : str
-            The contrast to build.
-        """
-        _check_column_in_df(self.df, contrast)
-        if not _categorical_column(self.df, contrast):
-            raise ValueError(
-                "Contrast should refer to a categorical variable for group comparison. "
-                "Please select 'correlation' for 'glm_type' otherwise."
-            )
-        group_values = np.unique(self.df[contrast])
-        for contrast_type, (i, j) in zip(["positive", "negative"], [(0, 1), (1, 0)]):
-            contrast_name = f"{group_values[j]}-lt-{group_values[i]}"
-            self.contrasts[contrast_name] = (
-                self.df[contrast] == group_values[i]
-            ).astype(int) - (self.df[contrast] == group_values[j]).astype(int)
-
-    def filename_root(self, contrast: str):
-        """Build the filename root part from class attributes and provided contrast.
-
-        Parameters
-        ----------
-        contrast : str
-            The contrast to use for building the filename.
-        """
-        if contrast not in self.contrasts:
-            raise ValueError(f"Unknown contrast {contrast}.")
-        return f"group-{self.group_label}_{contrast}_measure-{self.feature_label}_fwhm-{self.fwhm}"
-
-
-class GroupGLMWithInteraction(GroupGLM):
-    """This class implements a GLM model for group comparison with
-    interaction effects.
-
-    Attributes
-    ----------
-    See attributes of parent class `GroupGLM`.
-    """
-
-    def __init__(
-        self,
-        design: str,
-        df: pd.DataFrame,
-        feature_label: str,
-        contrast: str,
-        group_label: Optional[str] = "group",
-        fwhm: Optional[int] = 20,
-        threshold_uncorrected_pvalue: Optional[float] = 0.001,
-        threshold_corrected_pvalue: Optional[float] = 0.05,
-        cluster_threshold: Optional[float] = 0.001,
-    ):
-        super().__init__(
-            design,
-            df,
-            feature_label,
-            contrast,
-            group_label,
-            fwhm,
-            threshold_uncorrected_pvalue,
-            threshold_corrected_pvalue,
-            cluster_threshold,
-        )
-        self.with_interaction = True
-        warnings.warn(
-            "You included interaction as covariate in your model, "
-            "please carefully check the format of your tsv files."
-        )
-
-    def build_contrasts(self, contrast: str):
-        """Build the contrast from the string specification.
-
-        Parameters
-        ----------
-        contrast : str
-            The contrast to build.
-        """
-        contrast_elements = [_.strip() for _ in contrast.split("*")]
-        for contrast_element in contrast_elements:
-            _check_column_in_df(self.df, contrast_element)
-        categorical = [_categorical_column(self.df, _) for _ in contrast_elements]
-        if len(contrast_elements) != 2 or sum(categorical) != 1:
-            raise ValueError(
-                "The contrast must be an interaction between one continuous "
-                "variable and one categorical variable. Your contrast contains "
-                f"the following variables : {contrast_elements}"
-            )
-        idx = 0 if categorical[0] else 1
-        categorical_contrast = contrast_elements[idx]
-        continue_contrast = contrast_elements[(idx + 1) % 2]
-        group_values = np.unique(self.df[categorical_contrast])
-        built_contrast = self.df[continue_contrast].where(
-            self.df[categorical_contrast] == group_values[0], 0
-        ) - self.df[continue_contrast].where(
-            self.df[categorical_contrast] == group_values[1], 0
-        )
-        self.contrasts[contrast] = built_contrast
-
-    def filename_root(self, contrast: str):
-        """Build the filename root part from class attributes and provided contrast.
-
-        Parameters
-        ----------
-        contrast : str
-            The contrast to use for building the filename.
-        """
-        if contrast not in self.contrasts:
-            raise ValueError(f"Unknown contrast {contrast}.")
-        return f"interaction-{contrast}_measure-{self.feature_label}_fwhm-{self.fwhm}"
-
-
-def create_glm_model(
-    glm_type: str,
-    design: str,
-    df: pd.DataFrame,
-    contrast: str,
-    feature_label: str,
-    group_label: Optional[str] = "group",
-    fwhm: Optional[int] = 20,
-    threshold_uncorrected_pvalue: Optional[float] = 0.001,
-    threshold_corrected_pvalue: Optional[float] = 0.05,
-    cluster_threshold: Optional[float] = 0.001,
-) -> GLM:
-    """Factory method for building a GLM model instance corresponding to the
-    provided type and design matrix.
-
-    Parameters
-    ----------
-    glm_type : str
-        The type of GLM to be created. Either "correlation" or "group_comparison".
-
-    design : str
-        The design matrix specified in string format.
-        If this contains a "*", it will be interpreted as an interaction effect.
-
-    df : pd.DataFrame
-        The subjects DataFrame.
-
-    contrast : str
-        The contrast specified in string format.
-
-    feature_label : str
-        The label used for building output filenames.
-
-    group_label : str, optional
-        The label to use for group GLM models. Default="group".
-
-    fwhm : int, optional
-        The smoothing FWHM. This is used in the output file names.
-        Default=20.
-
-    threshold_uncorrected_pvalue : float, optional
-        The threshold to be used with uncorrected P-values. Default=0.001.
-
-    threshold_corrected_pvalue : float, optional
-        The threshold to be used with corrected P-values. Default=0.05.
-
-    cluster_threshold : float, optional
-        The threshold to be used to declare clusters as significant. Default=0.001.
-
-    Returns
-    -------
-    model : GLM
-        An instance of the `GLM` class.
-
-    Raises
-    ------
-    ValueError
-        If the glm_type is not supported.
-    """
-    cprint(
-        msg=f"The GLM model is: {design} and the GLM type is: {glm_type}",
-        lvl="info",
-    )
-    params = {
-        "group_label": group_label,
-        "fwhm": fwhm,
-        "threshold_uncorrected_pvalue": threshold_uncorrected_pvalue,
-        "threshold_corrected_pvalue": threshold_corrected_pvalue,
-        "cluster_threshold": cluster_threshold,
-    }
-    if glm_type == "correlation":
-        return CorrelationGLM(design, df, feature_label, contrast, **params)
-    elif glm_type == "group_comparison":
-        if "*" in design:
-            return GroupGLMWithInteraction(
-                design, df, feature_label, contrast, **params
-            )
-        return GroupGLM(design, df, feature_label, contrast, **params)
-    raise ValueError(
-        f"create_glm_model received an unknown GLM type: {glm_type}."
-        f"Only 'correlation' and 'group_comparison' are supported."
-    )
-
-
-def _convert_arrays_to_lists(data: dict) -> dict:
-    """If the input dictionary contains numpy arrays, this function will
-    cast them to lists and return the same dictionary with the lists instead
-    of the numpy arrays.
-
-    Parameters
-    ----------
-    data : dict
-        The dictionary to clean.
-
-    Returns
-    -------
-    new_data : dict
-        The dictionary with arrays casted to lists.
-    """
-    new_data = dict()
-    for k, v in data.items():
-        if isinstance(v, dict):
-            new_data[k] = _convert_arrays_to_lists(v)
-        elif isinstance(v, np.ndarray):
-            new_data[k] = v.tolist()
-        else:
-            new_data[k] = v
-    return new_data
-
-
-class Results:
-    """Common class for GLM results."""
-
-    def to_dict(self) -> dict:
-        """Returns the `Results` instance in dict format.
-
-        Private attributes and all methods are not returned.
-
-        This function does not perform any casting.
-
-        Returns
-        -------
-        data : dict
-            Resulting dictionary.
-        """
-        import inspect
-
-        data = dict()
-        for attribute in inspect.getmembers(self):
-            name, value = attribute
-            if not name.startswith("_"):
-                if not inspect.ismethod(value):
-                    if hasattr(value, "to_dict"):
-                        data[name] = value.to_dict()
-                    else:
-                        data[name] = value
-        return data
-
-    def to_json(self, indent: Optional[int] = 4) -> str:
-        """Returns the json of the `Results` instance.
-
-        Parameters
-        ----------
-        indent : int, optional
-            Indent to use. Default=4.
-
-        Returns
-        -------
-        str :
-            The JSON dumps of the results.
-        """
-        import json
-
-        return json.dumps(_convert_arrays_to_lists(self.to_dict()), indent=indent)
-
-
-@dataclass
-class PValueResults(Results):
-    """This class implements a container for raw (uncorrected)
-    P-value results obtained with a GLM model.
-
-    Attributes
-    ----------
-    pvalues : np.ndarray
-        Array of uncorrected P-values.
-
-    mask : np.ndarray
-        The binary mask.
-
-    threshold : float
-        The threshold used.
-    """
-
-    pvalues: np.ndarray
-    mask: np.ndarray
-    threshold: float
-
-    @property
-    def thresh(self):
-        """For compatibility with previous Matlab implementation."""
-        return self.threshold
-
-    @property
-    def P(self):
-        """For compatibility with previous Matlab implementation."""
-        return self.pvalues
-
-    @classmethod
-    def from_t_statistics(
-        cls,
-        tstats: np.ndarray,
-        df: pd.DataFrame,
-        mask: np.ndarray,
-        threshold: float,
-    ):
-        """Instantiate the class from an array of T-statistics.
-
-        Parameters
-        ----------
-        tstats : np.ndarray
-            Array of T-statistics.
-
-        df : pd.DataFrame
-            The subjects DataFrame.
-
-        mask : np.ndarray
-            The binary mask.
-
-        threshold : float
-            The threshold to be used.
-        """
-        from scipy.stats import t
-
-        return cls(1 - t.cdf(tstats, df), mask, threshold)
-
-
-@dataclass
-class CorrectedPValueResults(PValueResults):
-    """This class implements a container for corrected P-value
-    results obtained with a GLM model.
-
-    Attributes
-    ----------
-    cluster_pvalues : np.ndarray
-        The cluster P-values.
-    """
-
-    cluster_pvalues: np.ndarray
-
-    @property
-    def C(self):
-        """For compatibility with previous Matlab implementation."""
-        return self.cluster_pvalues
-
-
-@dataclass
-class StatisticsResults(Results):
-    """This class implements a container for results obtained with
-    the GLM model classes. It holds information relative to a GLM
-    run with one specific contrast.
-
-    Attributes
-    ----------
-    coefficients : np.ndarray
-        The beta coefficients of the fitted GLM model.
-
-    tstats : np.ndarray
-        The corresponding T-statistics.
-
-    uncorrected_p_value : PValueResults
-        The corresponding uncorrected p values, stored in a `PValueResults` instance.
-
-    fdr : np.ndarray
-        The corresponding False Discovery Rate.
-
-    corrected_p_value : CorrectedPValueResults
-        The corresponding corrected p values, stored in a `CorrectedPValueResults` instance.
-    """
-
-    coefficients: np.ndarray
-    tstats: np.ndarray
-    uncorrected_p_values: PValueResults
-    fdr: np.ndarray
-    corrected_p_values: CorrectedPValueResults
-
-    @property
-    def TStatistics(self):
-        """Needed for compatibility with previous implementation in Matlab."""
-        return self.tstats
-
-    @property
-    def uncorrectedPValue(self):
-        """Needed for compatibility with previous implementation in Matlab."""
-        return self.uncorrected_p_values
-
-    @property
-    def correctedPValue(self):
-        """Needed for compatibility with previous implementation in Matlab."""
-        return self.corrected_p_values
-
-    @property
-    def FDR(self):
-        """Needed for compatibility with previous implementation in Matlab."""
-        return self.fdr
-
-    @classmethod
-    def from_slm_model(
-        cls,
-        model: SLM,
-        mask: np.ndarray,
-        threshold_uncorrected_p_value: float,
-        threshold_corrected_p_value: float,
-    ):
-        """Instantiate from a SLM model.
-
-        Parameters
-        ----------
-        model : brainstat.stats.SLM
-            SLM model instance to use.
-
-        mask : np.ndarray
-            The binary mask to use.
-
-        threshold_uncorrected_p_value : float
-            The threshold to use with uncorrected P-values.
-
-        threshold_corrected_p_value : float
-            The threshold to use with corrected P-values.
-        """
-        idx = np.argwhere(np.isnan(model.t))
-        corrected_pvals = model.P["pval"]["P"]
-        corrected_pvals[idx] = 1.0
-        tstats = np.nan_to_num(model.t)
-        uncorrected_p_values = PValueResults.from_t_statistics(
-            tstats,
-            model.df,
-            mask,
-            threshold_uncorrected_p_value,
-        )
-        corrected_p_values = CorrectedPValueResults(
-            corrected_pvals,
-            model.P["pval"]["C"],
-            mask,
-            threshold_corrected_p_value,
-        )
-        return cls(
-            np.nan_to_num(model.coef),
-            tstats,
-            uncorrected_p_values,
-            model.Q,
-            corrected_p_values,
-        )
-
-
-class StatisticsResultsPlotter:
-    """Class responsible to plotting results of GLM fit.
-
-    Attributes
-    ----------
-    output_file : PathLike
-        Path to the output file.
-
-    mesh : nilearn.surface.Mesh
-        The mesh to be used for plotting results.
-    """
-
-    def __init__(self, output_file: PathLike, mesh: Mesh):
-        self.output_file = output_file
-        self.mesh = mesh
-        self.plotting_extension = ".png"
-        self.no_plot = {"coefficients"}  # Elements which should not be plotted
-
-    def plot(self, result: StatisticsResults, method: str) -> None:
-        """Plot the results.
-
-        Parameters
-        ----------
-        result : StatisticsResults
-            The results to be plotted.
-
-        method : str
-            The plotting method to use.
-        """
-        plotter = self._get_plotter(method)
-        plotter(result)
-
-    def _get_plotter(self, method: str) -> Callable[[StatisticsResults], None]:
-        """Returns the plotting method from its name.
-
-        Parameters
-        ----------
-        method : str
-            Name of the plotting method to use.
-
-        Returns
-        -------
-        Callable :
-            Plotting method.
-        """
-        if method == "nilearn_plot_surf_stat_map":
-            return self._plot_stat_maps
-        else:
-            raise NotImplementedError(f"Plotting method {method} is not implemented.")
-
-    def _plot_stat_maps(self, result: StatisticsResults) -> None:
-        """Wrapper around the `nilearn.plotting.plot_surf_stat_map` method.
-
-        Parameters
-        ----------
-        result : StatisticsResults
-            The results to plot.
-        """
-        from nilearn.plotting import plot_surf_stat_map
-
-        for name, res in result.to_dict().items():
-            if name not in self.no_plot:
-                texture = res
-                threshold = None
-                plot_filename = (
-                    str(self.output_file) + "_" + name + self.plotting_extension
-                )
-                if isinstance(res, dict):
-                    texture = res["P"]
-                    threshold = res["thresh"]
-                cprint(msg=f"Saving plot to {plot_filename}", lvl="info")
-                plot_surf_stat_map(
-                    self.mesh,
-                    texture,
-                    threshold=threshold,
-                    output_file=plot_filename,
-                    title=name,
-                )
-
-
-class StatisticsResultsSerializer:
-    """This class is responsible for writing instances of `StatisticsResults`
-    to disk through different methods.
-
-    Attributes
-    ----------
-    output_file : PathLike
-        Path and filename root to be used.
-    """
-
-    def __init__(self, output_file: PathLike):
-        self.output_file = output_file
-        self.json_extension = "_results.json"
-        self.json_indent = 4
-        self.mat_extension = ".mat"
-
-    def save(self, result: StatisticsResults, method: str) -> None:
-        """Save provided `StatisticsResults` to disk with provided method.
-
-        Parameters
-        ----------
-        result : StatisticsResults
-            Results to be saved.
-
-        method : str
-            Name of the saving method to use.
-        """
-        writer = self._get_writer(method)
-        writer(result)
-
-    def _get_writer(self, method: str) -> Callable[[StatisticsResults], None]:
-        """Returns a writer method from its name.
-
-        Parameters
-        ----------
-        method : str
-            The name of the writing method to use.
-
-        Returns
-        -------
-        Callable :
-            The writing method.
-        """
-        if method.lower() == "json":
-            return self._write_to_json
-        elif method.lower() == "mat":
-            return self._write_to_mat
-        else:
-            raise NotImplementedError(
-                f"Serializing method {method} is not implemented."
-            )
-
-    def _write_to_json(self, results: StatisticsResults) -> None:
-        """Write the provided `StatisticsResults` to JSON format.
-
-        Parameters
-        ----------
-        results : StatisticsResults
-            The results to write to disk in JSON format.
-        """
-        import json
-        import os
-
-        out_json_file = Path(str(self.output_file) + self.json_extension)
-        if not os.path.exists(out_json_file.parents[0]):
-            os.makedirs(out_json_file.parents[0])
-        cprint(
-            msg=f"Writing results to JSON in {out_json_file}...",
-            lvl="info",
-        )
-        with open(out_json_file, "w") as fp:
-            json.dump(results.to_json(indent=self.json_indent), fp)
-
-    def _write_to_mat(self, results: StatisticsResults) -> None:
-        """Write the provided `StatisticsResults` to MAT format.
-
-        Parameters
-        ----------
-        results : StatisticsResults
-            The results to write to disk in MAT format.
-        """
-        from scipy.io import savemat
-
-        # These labels are used for compatibility with the previous
-        # MATLAB implementation of the Statistics Surface Pipeline
-        # of Clinica.
-        struct_labels = {
-            "coefficients": "coef",
-            "TStatistics": "tvaluewithmask",
-            "uncorrectedPValue": "uncorrectedpvaluesstruct",
-            "correctedPValue": "correctedpvaluesstruct",
-            "FDR": "FDR",
-        }
-        for name, res in results.to_dict().items():
-            if name in struct_labels:
-                mat_filename = str(self.output_file) + "_" + name + self.mat_extension
-                cprint(
-                    msg=f"Writing {name} results to MAT in  {mat_filename}",
-                    lvl="info",
-                )
-                savemat(mat_filename, {struct_labels[name]: res})
diff --git a/clinica/pipelines/statistics_surface/_utils.py b/clinica/pipelines/statistics_surface/_utils.py
new file mode 100644
index 0000000000..3bc627fd6d
--- /dev/null
+++ b/clinica/pipelines/statistics_surface/_utils.py
@@ -0,0 +1,322 @@
+from pathlib import Path
+from typing import Optional
+
+__all__ = [
+    "init_input_node",
+    "run_clinica_surfstat",
+    "save_to_caps",
+    "get_t1_freesurfer_custom_file",
+    "get_pet_surface_custom_file",
+    "create_glm_info_dictionary",
+    "build_design_matrix",
+]
+
+
+def get_t1_freesurfer_custom_file() -> str:
+    import os
+
+    return os.path.join(
+        "%(subject)s",
+        "%(session)s",
+        "t1",
+        "freesurfer_cross_sectional",
+        "%(subject)s_%(session)s",
+        "surf",
+        "%(hemi)s.thickness.fwhm%(fwhm)s.fsaverage.mgh",
+    )
+
+
+def get_pet_surface_custom_file(acq_label: str, suvr_reference_region: str) -> str:
+    import os
+
+    return os.path.join(
+        "%(subject)s",
+        "%(session)s",
+        "pet",
+        "surface",
+        f"%(subject)s_%(session)s_trc-{acq_label}_pet"
+        f"_space-fsaverage_suvr-{suvr_reference_region}_pvc-iy_hemi-%(hemi)s_fwhm-%(fwhm)s_projection.mgh",
+    )
+
+
+def init_input_node(parameters: dict, base_dir, subjects_visits_tsv):
+    """Initialize the pipeline.
+
+    This function will:
+        - Create `surfstat_results_dir` in `base_dir`/<group_id> for SurfStat;
+        - Save pipeline parameters in JSON file;
+        - Copy TSV file with covariates;
+        - Print begin execution message.
+
+    Parameters
+    ----------
+    parameters : dict
+        The pipeline's parameters.
+
+    base_dir : Path
+        The path to the pipeline's base directory.
+        This is a pathlib Path. No type hints because of Nipype.
+
+    subjects_visits_tsv : Path
+        The path to the subjects TSV file.
+        This is a pathlib Path. No type hints because of Nipype.
+
+    Returns
+    -------
+    group_label : str
+        The group label.
+
+    surfstat_results_dir : Path
+        The folder which will contain the results for SurfStat.
+    """
+    import json
+    import shutil
+
+    from clinica.pipelines.statistics_surface._utils import create_glm_info_dictionary
+    from clinica.utils.ux import print_begin_image
+
+    group_id = "group-" + parameters["group_label"]
+    surfstat_results_dir = base_dir / group_id
+    surfstat_results_dir.mkdir(parents=True, exist_ok=True)
+
+    # Save pipeline parameters in JSON file
+    glm_dict = create_glm_info_dictionary(subjects_visits_tsv, parameters)
+    with open(surfstat_results_dir / f"{group_id}_glm.json", "w") as json_file:
+        json.dump(glm_dict, json_file, indent=4)
+
+    # Copy TSV file with covariates
+    tsv_filename = surfstat_results_dir / f"{group_id}_covariates.tsv"
+    shutil.copyfile(subjects_visits_tsv, tsv_filename)
+
+    # Print begin message
+    list_keys = ["AnalysisType", "Covariates", "Contrast", "FWHM", "ClusterThreshold"]
+    list_values = [
+        parameters["glm_type"],
+        parameters["covariates"],
+        parameters["contrast"],
+        str(parameters["full_width_at_half_maximum"]),
+        str(parameters["cluster_threshold"]),
+    ]
+    group_id = "group-" + parameters["group_label"]
+    print_begin_image(group_id, list_keys, list_values)
+
+    return parameters["group_label"], surfstat_results_dir
+
+
+def _get_string_format_from_tsv(tsv_file: Path) -> str:
+    """Determine string format from TSV file.
+
+    If the TSV file is like:
+
+    participant_id  session_id  sex     group   age
+    sub-CLNC0001    ses-M000     Female  CN      71.1
+    sub-CLNC0002    ses-M000     Male    CN      81.3
+    sub-CLNC0003    ses-M000     Male    CN      75.4
+
+    The columns of the TSV file contains consecutively strings, strings,
+    strings, strings and float. The string_format is therefore "%s %s %s %s %f".
+
+    Parameters
+    ----------
+    tsv_file : Path
+        The path to the TSV file.
+
+    Returns
+    -------
+    str :
+        The string formatting of the TSV file (e.g. "%s %s %s %s %f")
+    """
+    import pandas as pd
+
+    demographics_df = pd.read_csv(tsv_file, sep="\t")
+
+    return " ".join(
+        [
+            _convert_dtype_to_str_format(demographics_df[column].dtype)
+            for column in demographics_df.columns
+        ]
+    )
+
+
+def _convert_dtype_to_str_format(dtype) -> str:
+    """Map a pandas dtype (int64/float64/object) to %d/%f/%s; raise ValueError otherwise."""
+    import numpy as np
+
+    if dtype == np.int64:
+        return "%d"
+    if dtype == np.float64:
+        return "%f"
+    if dtype == np.object_:  # the `np.object` alias was removed in NumPy 1.24
+        return "%s"
+    raise ValueError(f"Unknown dtype (given: {dtype})")
+
+
+def build_design_matrix(contrast: str, covariates: Optional[str] = None) -> str:
+    """Generate the design matrix for SurfStat based on the contrast and the optional list of covariates.
+
+    Design matrix "1 + <contrast> + <covariate_1> + ... + <covariate_n>". If the contrast
+    is already listed in the covariates, it is not added a second time.
+
+    `covariates` is a whitespace-separated string, or an iterable of covariate names.
+
+    Example
+    -------
+    >>> from clinica.pipelines.statistics_surface._utils import build_design_matrix
+    >>> build_design_matrix('group', 'age sex group')
+    '1 + age + sex + group'
+    >>> build_design_matrix('group', 'age')
+    '1 + group + age'
+    >>> build_design_matrix('group', None)
+    '1 + group'
+    """
+    if not covariates:
+        return "1 + " + contrast
+    if isinstance(covariates, str):
+        # `list(str)` would yield single characters; split on runs of whitespace instead.
+        list_covariates = covariates.split()
+    else:
+        list_covariates = list(covariates)
+        if "" in list_covariates:
+            list_covariates.remove("")
+    # Put the contrast first unless it is already one of the covariates.
+    if contrast not in list_covariates:
+        list_covariates.insert(0, contrast)
+    return "1 + " + " + ".join(list_covariates)
+
+
+def run_clinica_surfstat(
+    caps_dir,  # Path. no type hint because of Nipype self-contained requirement
+    output_dir,  # Path. no type hint because of Nipype self-contained requirement
+    subjects_visits_tsv,  # Path. no type hint because of Nipype self-contained requirement
+    pipeline_parameters: dict,
+):
+    """Call clinica_surfstat function.
+
+    Parameters
+    ----------
+    caps_dir : Path
+        The path to CAPS directory containing surface-based features.
+
+    output_dir : Path
+        The path to output directory that will contain outputs.
+
+    subjects_visits_tsv : Path
+        The path to TSV file containing the GLM information.
+
+    pipeline_parameters : dict
+        Parameters of StatisticsSurface pipeline.
+
+    Returns
+    -------
+    output_dir : Path
+        The path to the output directory.
+    """
+    from pathlib import Path
+
+    from clinica.pipelines.statistics_surface._utils import build_design_matrix
+    from clinica.pipelines.statistics_surface.surfstat import clinica_surfstat
+    from clinica.utils.check_dependency import check_environment_variable
+
+    freesurfer_home = Path(check_environment_variable("FREESURFER_HOME", "FreeSurfer"))
+
+    clinica_surfstat(
+        caps_dir / "subjects",
+        output_dir,
+        subjects_visits_tsv,
+        build_design_matrix(
+            pipeline_parameters["contrast"], pipeline_parameters["covariates"]
+        ),
+        pipeline_parameters["contrast"],
+        pipeline_parameters["glm_type"],
+        pipeline_parameters["group_label"],
+        freesurfer_home,
+        pipeline_parameters["measure_label"],
+        surface_file=pipeline_parameters["custom_file"],
+        fwhm=pipeline_parameters["full_width_at_half_maximum"],
+        cluster_threshold=pipeline_parameters["cluster_threshold"],
+    )
+    return output_dir
+
+
+def create_glm_info_dictionary(tsv_file: Path, pipeline_parameters: dict) -> dict:
+    """Create dictionary containing the GLM information that will be stored in a JSON file."""
+    glm_info = {
+        # Clinica compulsory arguments
+        "AnalysisType": pipeline_parameters["glm_type"],
+        "DesignMatrix": build_design_matrix(
+            pipeline_parameters["contrast"],
+            pipeline_parameters["covariates"],
+        ),
+        "StringFormatTSV": _get_string_format_from_tsv(tsv_file),
+        "Contrast": pipeline_parameters["contrast"],
+        "GroupLabel": pipeline_parameters["group_label"],
+        # Optional arguments
+        "Covariates": pipeline_parameters["covariates"],
+        "FWHM": pipeline_parameters["full_width_at_half_maximum"],
+        # Optional arguments for custom pipeline
+        "custom_file": pipeline_parameters["custom_file"],
+        "measure_label": pipeline_parameters["measure_label"],
+        # Advanced arguments (i.e. tricky parameters)
+        "ThresholdUncorrectedPvalue": 0.001,
+        "ThresholdCorrectedPvalue": 0.05,
+        "ClusterThreshold": pipeline_parameters["cluster_threshold"],
+    }
+    # Optional arguments for inputs from pet-surface pipeline
+    if (
+        pipeline_parameters["acq_label"]
+        and pipeline_parameters["suvr_reference_region"]
+    ):
+        glm_info["acq_label"] = pipeline_parameters["acq_label"]
+        glm_info["suvr_reference_region"] = pipeline_parameters["suvr_reference_region"]
+
+    return glm_info
+
+
+def save_to_caps(
+    source_dir,  # Path. no type hint because of Nipype self-contained requirement
+    caps_dir,  # Path. no type hint because of Nipype self-contained requirement
+    overwrite_caps: bool,
+    group_label: str,
+    glm_type: str,
+) -> None:
+    """Save `source_dir`/ to CAPS folder.
+
+    This function copies outputs of `source_dir`/ to `caps_dir`/groups/group-<group_label>/
+    statistics/surfstat_<glm_type>/ (surfstat_<glm_type>_analysis/ for correlation models).
+
+    The `source_dir`/ folder should contain the following elements:
+        - group-<group_label>_<group_1_or_2>-lt-<group_1_or_2>_measure-<measure>_fwhm-<label>_suffix.ext
+    or
+        - group-<group_label>_correlation-<label>_contrast-{-|+}_measure-<measure>_fwhm-<label>_suffix.ext
+    and
+        - group-<group_label>_covariates.tsv
+        - group-<group_label>_glm.json
+
+    Raises
+    ------
+    NotImplementedError
+        If overwrite_caps=True.
+    """
+    import shutil
+
+    from clinica.pipelines.statistics_surface.surfstat.models import GLMModelType
+    from clinica.utils.ux import print_end_image
+
+    glm_type = GLMModelType(glm_type)
+    if glm_type == GLMModelType.GROUP_COMPARISON:
+        surfstat_folder = f"surfstat_{glm_type}"
+    if glm_type == GLMModelType.CORRELATION:
+        surfstat_folder = f"surfstat_{glm_type}_analysis"
+
+    destination_dir = (
+        caps_dir.expanduser()
+        / "groups"
+        / f"group-{group_label}"
+        / "statistics"
+        / surfstat_folder
+    )
+
+    if overwrite_caps:
+        raise NotImplementedError("save_to_caps(overwrite_caps=True) not implemented")
+    shutil.copytree(source_dir, destination_dir, symlinks=True)
+    print_end_image(f"group-{group_label}")
diff --git a/clinica/pipelines/statistics_surface/statistics_surface_cli.py b/clinica/pipelines/statistics_surface/cli.py
similarity index 76%
rename from clinica/pipelines/statistics_surface/statistics_surface_cli.py
rename to clinica/pipelines/statistics_surface/cli.py
index 0fdbe91298..307f52d86d 100644
--- a/clinica/pipelines/statistics_surface/statistics_surface_cli.py
+++ b/clinica/pipelines/statistics_surface/cli.py
@@ -97,14 +97,14 @@ def cli(
     working_directory: Optional[str] = None,
     n_procs: Optional[int] = None,
 ) -> None:
-    """Surface-based mass-univariate analysis with SurfStat.
+    """Surface-based mass-univariate analysis with BrainStat.
 
-    GROUP_LABEL is a user-defined identifier to target a specific group of
-    subjects.
+    GROUP_LABEL is a user-defined identifier to target a specific group of subjects.
 
-    The type of surface-based feature can be defined by using the third
-    argument: t1-freesurfer for cortical thickness, pet-surface for projected
-    PET data or custom-pipeline for you own data in CAPS directory.
+    The type of surface-based feature can be defined by using the third argument:
+        - "t1-freesurfer" for cortical thickness
+        - "pet-surface" for projected PET data
+        - "custom-pipeline" for your own data in CAPS directory
 
     The type of analysis of the model is defined by the argument
     'group_comparison' or 'correlation'.
@@ -124,41 +124,9 @@ def cli(
     """
     from networkx import Graph
 
-    from clinica.utils.exceptions import ClinicaException
     from clinica.utils.ux import print_end_pipeline
 
-    from .statistics_surface_pipeline import StatisticsSurface
-    from .statistics_surface_utils import (
-        get_pet_surface_custom_file,
-        get_t1_freesurfer_custom_file,
-    )
-
-    # PET-Surface pipeline
-    if orig_input_data == "pet-surface":
-        if not acq_label:
-            raise ClinicaException(
-                "You selected pet-surface pipeline without setting --acq_label flag. "
-                "Clinica will now exit."
-            )
-        if not suvr_reference_region:
-            raise ClinicaException(
-                "You selected pet-surface pipeline without setting --suvr_reference_region flag. "
-                "Clinica will now exit."
-            )
-
-    # FreeSurfer cortical thickness
-    if orig_input_data == "t1-freesurfer":
-        custom_file = get_t1_freesurfer_custom_file()
-        measure_label = "ct"
-    # PET cortical projection
-    elif orig_input_data == "pet-surface":
-        custom_file = get_pet_surface_custom_file(acq_label, suvr_reference_region)
-        measure_label = acq_label
-    else:
-        if not all([custom_file, measure_label]):
-            raise ClinicaException(
-                "You must set --measure_label and --custom_file flags."
-            )
+    from .pipeline import StatisticsSurface
 
     parameters = {
         # Clinica compulsory arguments
diff --git a/clinica/pipelines/statistics_surface/statistics_surface_pipeline.py b/clinica/pipelines/statistics_surface/pipeline.py
similarity index 66%
rename from clinica/pipelines/statistics_surface/statistics_surface_pipeline.py
rename to clinica/pipelines/statistics_surface/pipeline.py
index 41297f1303..ffe8503099 100644
--- a/clinica/pipelines/statistics_surface/statistics_surface_pipeline.py
+++ b/clinica/pipelines/statistics_surface/pipeline.py
@@ -2,18 +2,16 @@
 
 
 class StatisticsSurface(cpe.Pipeline):
-    """StatisticsSurface - Surface-based mass-univariate analysis with SurfStat.
+    """StatisticsSurface - Surface-based mass-univariate analysis with BrainStat.
 
     See documentation at https://aramislab.paris.inria.fr/clinica/docs/public/latest/Pipelines/Stats_Surface/
 
-    Note:
-        The `tsv_file` attribute is overloaded for this pipeline. It must contain a list of subjects
-        with their sessions and all the covariates and factors needed for the GLM.
+    Notes
+    -----
+    The `tsv_file` attribute is overloaded for this pipeline. It must contain a list of subjects
+    with their sessions and all the covariates and factors needed for the GLM.
 
-        Pipeline parameters are explained in StatisticsSurfaceCLI.define_options()
-
-    Returns:
-        A clinica pipeline object containing the StatisticsSurface pipeline.
+    Pipeline parameters are explained in StatisticsSurfaceCLI.define_options()
     """
 
     def check_pipeline_parameters(self):
@@ -21,44 +19,46 @@ def check_pipeline_parameters(self):
         from clinica.utils.exceptions import ClinicaException
         from clinica.utils.group import check_group_label
 
-        from ._inputs import _get_t1_freesurfer_custom_file_template
+        from ._utils import get_pet_surface_custom_file, get_t1_freesurfer_custom_file
+        from .surfstat import get_t1_freesurfer_custom_file_template
 
-        # Clinica compulsory parameters
         self.parameters.setdefault("group_label", None)
         check_group_label(self.parameters["group_label"])
 
-        if "orig_input_data" not in self.parameters.keys():
-            raise KeyError(
-                "Missing compulsory orig_input_data key in pipeline parameter."
-            )
-
-        self.parameters.setdefault("glm_type", None)
-        if self.parameters["glm_type"] not in ["group_comparison", "correlation"]:
-            raise ClinicaException(
-                f"The glm_type you specified is wrong: it should be group_comparison or "
-                f"correlation (given value: {self.parameters['glm_type']})."
-            )
-
-        if "contrast" not in self.parameters.keys():
-            raise KeyError("Missing compulsory contrast key in pipeline parameter.")
-
-        # Optional parameters
+        for compulsory_parameter_name in ("orig_input_data", "contrast"):
+            if compulsory_parameter_name not in self.parameters:
+                raise KeyError(
+                    f"Missing compulsory parameter {compulsory_parameter_name}."
+                )
         self.parameters.setdefault("covariates", None)
         self.parameters.setdefault("full_width_at_half_maximum", 20)
-
-        # Optional parameters for inputs from pet-surface pipeline
         self.parameters.setdefault("acq_label", None)
         self.parameters.setdefault("suvr_reference_region", None)
-
-        # Optional parameters for custom pipeline
         self.parameters.setdefault(
             "custom_file",
-            _get_t1_freesurfer_custom_file_template(self.caps_directory + "/subjects"),
+            get_t1_freesurfer_custom_file_template(self.caps_directory / "subjects"),
         )
         self.parameters.setdefault("measure_label", "ct")
-
-        # Advanced parameters
         self.parameters.setdefault("cluster_threshold", 0.001)
+        self.parameters.setdefault("glm_type", None)
+
+        if self.parameters["orig_input_data"] == "pet-surface":
+            if not self.parameters["acq_label"]:
+                raise ClinicaException(
+                    "You selected pet-surface pipeline without providing the acq_label "
+                    "(by setting the --acq_label option). Clinica will now exit."
+                )
+            if not self.parameters["suvr_reference_region"]:
+                raise ClinicaException(
+                    "You selected pet-surface pipeline without providing the suvr "
+                    "reference region (by setting the --suvr_reference_region option). "
+                    "Clinica will now exit."
+                )
+        if self.parameters["glm_type"] not in ("group_comparison", "correlation"):
+            raise ClinicaException(
+                f"The glm_type you specified is wrong: it should be group_comparison or "
+                f"correlation (given value: {self.parameters['glm_type']})."
+            )
         if (
             self.parameters["cluster_threshold"] < 0
             or self.parameters["cluster_threshold"] > 1
@@ -67,6 +67,23 @@ def check_pipeline_parameters(self):
                 f"Cluster threshold should be between 0 and 1 "
                 f"(given value: {self.parameters['cluster_threshold']})."
             )
+        if self.parameters["orig_input_data"] == "t1-freesurfer":
+            self.parameters["custom_file"] = get_t1_freesurfer_custom_file()
+            self.parameters["measure_label"] = "ct"
+        elif self.parameters["orig_input_data"] == "pet-surface":
+            self.parameters["custom_file"] = get_pet_surface_custom_file(
+                self.parameters["acq_label"],
+                self.parameters["suvr_reference_region"],
+            )
+            self.parameters["measure_label"] = self.parameters["acq_label"]
+        else:
+            if not all(
+                [self.parameters["custom_file"], self.parameters["measure_label"]]
+            ):
+                raise ClinicaException(
+                    "You must provide measure label (use the --measure_label option) "
+                    "and a custom file (use the --custom_file option)."
+                )
 
     def check_custom_dependencies(self):
         """Check dependencies that can not be listed in the `info.json` file."""
@@ -89,11 +106,8 @@ def get_output_fields(self):
 
     def build_input_node(self):
         """Build and connect an input node to the pipeline."""
-        import os
-
         from clinica.utils.exceptions import ClinicaException
         from clinica.utils.inputs import clinica_file_reader
-        from clinica.utils.stream import cprint
 
         # Check if already present in CAPS
         # ================================
@@ -101,19 +115,17 @@ def build_input_node(self):
         # Note(AR): if the user wants to compare Cortical Thickness measure with PET measure
         # using the group_id, Clinica won't allow it.
         # TODO: Modify this behaviour
-        if os.path.exists(
-            os.path.join(
-                self.caps_directory, "groups", f"group-{self.parameters['group_label']}"
-            )
-        ):
+        group_folder = (
+            self.caps_directory / "groups" / f"group-{self.parameters['group_label']}"
+        )
+        if group_folder.exists():
             raise ClinicaException(
-                f"Group label {self.parameters['group_label']} already exists, "
-                f"please choose another one or delete the existing folder and "
-                f"also the working directory and rerun the pipeline"
+                f"Group label {self.parameters['group_label']} already exists (found in {group_folder}). "
+                "Please choose another one or delete the existing folder and "
+                "also the working directory and rerun the pipeline"
             )
 
-        # Check input files before calling SurfStat with Matlab
-        # =====================================================
+        # Check input files
         all_errors = []
         # clinica_files_reader expects regexp to start at subjects/ so sub-*/ses-*/ is removed here
         fwhm = str(self.parameters["full_width_at_half_maximum"])
@@ -136,35 +148,28 @@ def build_input_node(self):
                 )
             except ClinicaException as e:
                 all_errors.append(e)
-        # Raise all errors if something happened
+
         if len(all_errors) > 0:
             error_message = "Clinica faced errors while trying to read files in your CAPS directory.\n"
             for msg in all_errors:
                 error_message += str(msg)
             raise RuntimeError(error_message)
 
-        # Give pipeline info
-        # ==================
-        cprint(
-            "The pipeline will last a few minutes. Images generated by Matlab will popup during the pipeline."
-        )
-
     def build_output_node(self):
         """Build and connect an output node to the pipeline."""
         import nipype.interfaces.utility as nutil
         import nipype.pipeline.engine as npe
 
-        from .statistics_surface_utils import save_to_caps
+        from ._utils import save_to_caps
 
-        # Writing results into CAPS
-        # =========================
         save_to_caps = npe.Node(
             interface=nutil.Function(
                 input_names=[
                     "source_dir",
                     "caps_dir",
                     "overwrite_caps",
-                    "pipeline_parameters",
+                    "group_label",
+                    "glm_type",
                 ],
                 function=save_to_caps,
             ),
@@ -172,7 +177,8 @@ def build_output_node(self):
         )
         save_to_caps.inputs.caps_dir = self.caps_directory
         save_to_caps.inputs.overwrite_caps = self.overwrite_caps
-        save_to_caps.inputs.pipeline_parameters = self.parameters
+        save_to_caps.inputs.group_label = self.parameters["group_label"]
+        save_to_caps.inputs.glm_type = self.parameters["glm_type"]
 
         self.connect(
             [
@@ -182,14 +188,10 @@ def build_output_node(self):
 
     def build_core_nodes(self):
         """Build and connect the core nodes of the pipeline."""
-        import os
-
         import nipype.interfaces.utility as nutil
         import nipype.pipeline.engine as npe
 
-        import clinica.pipelines.statistics_surface.statistics_surface_utils as utils
-
-        from .statistics_surface_utils import init_input_node
+        from ._utils import init_input_node, run_clinica_surfstat
 
         init_input = npe.Node(
             interface=nutil.Function(
@@ -200,12 +202,11 @@ def build_core_nodes(self):
             name="0-InitPipeline",
         )
         init_input.inputs.parameters = self.parameters
-        init_input.inputs.base_dir = os.path.join(self.base_dir, self.name)
+        init_input.inputs.base_dir = self.base_dir / self.name
         init_input.inputs.subjects_visits_tsv = self.tsv_file
 
-        # Node to wrap the SurfStat matlab script
         surfstat = npe.Node(
-            name="1-RunSurfStat",
+            name="RunSurfStat",
             interface=nutil.Function(
                 input_names=[
                     "caps_dir",
@@ -214,15 +215,13 @@ def build_core_nodes(self):
                     "pipeline_parameters",
                 ],
                 output_names=["output_dir"],
-                function=utils.run_matlab,
+                function=run_clinica_surfstat,
             ),
         )
         surfstat.inputs.caps_dir = self.caps_directory
         surfstat.inputs.subjects_visits_tsv = self.tsv_file
         surfstat.inputs.pipeline_parameters = self.parameters
 
-        # Connection
-        # ==========
         self.connect(
             [
                 (init_input, surfstat, [("surfstat_results_dir", "output_dir")]),
diff --git a/clinica/pipelines/statistics_surface/statistics_surface_utils.py b/clinica/pipelines/statistics_surface/statistics_surface_utils.py
deleted file mode 100644
index 7dc8459c39..0000000000
--- a/clinica/pipelines/statistics_surface/statistics_surface_utils.py
+++ /dev/null
@@ -1,276 +0,0 @@
-def get_t1_freesurfer_custom_file():
-    import os
-
-    custom_file = os.path.join(
-        "@subject",
-        "@session",
-        "t1",
-        "freesurfer_cross_sectional",
-        "@subject_@session",
-        "surf",
-        "@hemi.thickness.fwhm@fwhm.fsaverage.mgh",
-    )
-    return custom_file
-
-
-def get_pet_surface_custom_file(acq_label, suvr_reference_region):
-    import os
-
-    custom_file = os.path.join(
-        "@subject",
-        "@session",
-        "pet",
-        "surface",
-        f"@subject_@session_trc-{acq_label}_pet"
-        f"_space-fsaverage_suvr-{suvr_reference_region}_pvc-iy_hemi-@hemi_fwhm-@fwhm_projection.mgh",
-    )
-    return custom_file
-
-
-def init_input_node(parameters, base_dir, subjects_visits_tsv):
-    """Initialize the pipeline.
-
-    This function will:
-        - Create `surfstat_results_dir` in `base_dir`/<group_id> for SurfStat;
-        - Save pipeline parameters in JSON file;
-        - Copy TSV file with covariates;
-        - Print begin execution message.
-    """
-    import json
-    import os
-    import shutil
-
-    from clinica.pipelines.statistics_surface.statistics_surface_utils import (
-        create_glm_info_dictionary,
-    )
-    from clinica.utils.ux import print_begin_image
-
-    group_id = "group-" + parameters["group_label"]
-
-    # Create surfstat_results_dir for SurfStat
-    surfstat_results_dir = os.path.join(base_dir, group_id)
-    os.makedirs(surfstat_results_dir, exist_ok=True)
-
-    # Save pipeline parameters in JSON file
-    glm_dict = create_glm_info_dictionary(subjects_visits_tsv, parameters)
-    json_filename = os.path.join(surfstat_results_dir, group_id + "_glm.json")
-    with open(json_filename, "w") as json_file:
-        json.dump(glm_dict, json_file, indent=4)
-
-    # Copy TSV file with covariates
-    tsv_filename = os.path.join(surfstat_results_dir, group_id + "_covariates.tsv")
-    shutil.copyfile(subjects_visits_tsv, tsv_filename)
-
-    # Print begin message
-    list_keys = ["AnalysisType", "Covariates", "Contrast", "FWHM", "ClusterThreshold"]
-    list_values = [
-        parameters["glm_type"],
-        parameters["covariates"],
-        parameters["contrast"],
-        str(parameters["full_width_at_half_maximum"]),
-        str(parameters["cluster_threshold"]),
-    ]
-    group_id = "group-" + parameters["group_label"]
-    print_begin_image(group_id, list_keys, list_values)
-
-    return parameters["group_label"], surfstat_results_dir
-
-
-def get_string_format_from_tsv(tsv_file):
-    """
-    Determine string format from TSV file.
-
-    If the TSV file is like:
-
-    participant_id  session_id  sex     group   age
-    sub-CLNC0001    ses-M000     Female  CN      71.1
-    sub-CLNC0002    ses-M000     Male    CN      81.3
-    sub-CLNC0003    ses-M000     Male    CN      75.4
-
-    The columns of the TSV file contains consecutively strings, strings,
-    strings, strings and float. The string_format is therefore "%s %s %s %s %f".
-
-    Args:
-        tsv_file: TSV file.
-
-    Returns:
-        String formatting of the TSV file (e.g. "%s %s %s %s %f")
-    """
-    import pandas as pd
-
-    demographics_df = pd.read_csv(tsv_file, sep="\t")
-
-    def dtype_to_str_format(dtype):
-        """Convert pandas dtypes (e.g. int64) to string format (e.g. %d)"""
-        import numpy as np
-
-        if dtype == np.int64:
-            str_format = "%d"
-        elif dtype == np.float64:
-            str_format = "%f"
-        elif dtype == np.object:
-            str_format = "%s"
-        else:
-            raise ValueError("Unknown dtype (given: %s)" % dtype)
-        return str_format
-
-    list_str_format = []
-    for column in demographics_df.columns:
-        list_str_format.append(dtype_to_str_format(demographics_df[column].dtype))
-
-    return " ".join(list_str_format)
-
-
-def covariates_to_design_matrix(contrast, covariates=None):
-    """
-    Generate design matrix for SurfStat based on the contrast and the optional list of covariates.
-
-    Design matrix "1 + <contrast> + <covariate_1> + ... + <covariate_n>"
-
-    Example:
-        >>> from clinica.pipelines.statistics_surface.statistics_surface_utils import covariates_to_design_matrix
-        >>> covariates_to_design_matrix('group', 'age sex group')
-        1 + group + age + sex
-        >>> covariates_to_design_matrix('group', 'age')
-        1 + group + age
-        >>> covariates_to_design_matrix('group', None)
-        1 + group
-    """
-    if covariates:
-        # Convert string to list while handling case where several spaces are present
-        list_covariates = list(covariates)
-        try:
-            list_covariates.remove("")
-        except ValueError:
-            pass
-
-        if contrast in list_covariates:
-            design_matrix = "1 + " + " + ".join(
-                covariate for covariate in list_covariates
-            )
-        else:
-            design_matrix = (
-                "1 + "
-                + contrast
-                + " + "
-                + " + ".join(covariate for covariate in list_covariates)
-            )
-    else:
-        design_matrix = "1 + " + contrast
-
-    return design_matrix
-
-
-def run_matlab(caps_dir, output_dir, subjects_visits_tsv, pipeline_parameters):
-    """
-    Wrap the call of SurfStat using clinicasurfstat.m Matlab script.
-
-    Args:
-        caps_dir (str): CAPS directory containing surface-based features
-        output_dir (str): Output directory that will contain outputs of clinicasurfstat.m
-        subjects_visits_tsv (str): TSV file containing the GLM information
-        pipeline_parameters (dict): parameters of StatisticsSurface pipeline
-    """
-    import os
-
-    from clinica.pipelines.statistics_surface.clinica_surfstat import clinica_surfstat
-    from clinica.pipelines.statistics_surface.statistics_surface_utils import (
-        covariates_to_design_matrix,
-    )
-    from clinica.utils.check_dependency import check_environment_variable
-
-    freesurfer_home = check_environment_variable("FREESURFER_HOME", "FreeSurfer")
-
-    clinica_surfstat(
-        os.path.join(caps_dir, "subjects"),
-        output_dir,
-        subjects_visits_tsv,
-        covariates_to_design_matrix(
-            pipeline_parameters["contrast"], pipeline_parameters["covariates"]
-        ),
-        pipeline_parameters["contrast"],
-        pipeline_parameters["glm_type"],
-        pipeline_parameters["group_label"],
-        freesurfer_home,
-        pipeline_parameters["custom_file"],
-        pipeline_parameters["measure_label"],
-        fwhm=pipeline_parameters["full_width_at_half_maximum"],
-        cluster_threshold=pipeline_parameters["cluster_threshold"],
-    )
-    return output_dir
-
-
-def create_glm_info_dictionary(tsv_file, pipeline_parameters):
-    """Create dictionary containing the GLM information that will be stored in a JSON file."""
-    out_dict = {
-        # Clinica compulsory arguments
-        "AnalysisType": pipeline_parameters["glm_type"],
-        "DesignMatrix": covariates_to_design_matrix(
-            pipeline_parameters["contrast"], pipeline_parameters["covariates"]
-        ),
-        "StringFormatTSV": get_string_format_from_tsv(tsv_file),
-        "Contrast": pipeline_parameters["contrast"],
-        "GroupLabel": pipeline_parameters["group_label"],
-        # Optional arguments
-        "Covariates": pipeline_parameters["covariates"],
-        "FWHM": pipeline_parameters["full_width_at_half_maximum"],
-        # Optional arguments for custom pipeline
-        "custom_file": pipeline_parameters["custom_file"],
-        "measure_label": pipeline_parameters["measure_label"],
-        # Advanced arguments (i.e. tricky parameters)
-        "ThresholdUncorrectedPvalue": 0.001,
-        "ThresholdCorrectedPvalue": 0.05,
-        "ClusterThreshold": pipeline_parameters["cluster_threshold"],
-    }
-    # Optional arguments for inputs from pet-surface pipeline
-    if (
-        pipeline_parameters["acq_label"]
-        and pipeline_parameters["suvr_reference_region"]
-    ):
-        out_dict["acq_label"] = pipeline_parameters["acq_label"]
-        out_dict["suvr_reference_region"] = pipeline_parameters["suvr_reference_region"]
-
-    return out_dict
-
-
-def save_to_caps(source_dir, caps_dir, overwrite_caps, pipeline_parameters):
-    """Save `source_dir`/ to CAPS folder.
-
-    This function copies outputs of `source_dir`/ to
-    `caps_dir`/groups/<group_id>/<statistics>/surfstat_<glm_type>/
-
-    The `source_dir`/ folder should contain the following elements:
-        - group-<group_label>_<group_1_or_2>-lt-<group_1_or_2>_measure-<measure>_fwhm-<label>_suffix.ext
-    or
-        - group-<group_label>_correlation-<label>_contrast-{-|+}_measure-<measure>_fwhm-<label>_suffix.ext
-    and
-        - group-<group_label>_covariates.tsv
-        - group-<group_label>_glm.json
-
-    Raise:
-        NotImplementedError: If overwrite_caps=True.
-    """
-    import os
-    import shutil
-
-    from clinica.utils.ux import print_end_image
-
-    group_id = "group-" + pipeline_parameters["group_label"]
-
-    if pipeline_parameters["glm_type"] == "group_comparison":
-        surfstat_folder = "surfstat_" + pipeline_parameters["glm_type"]
-    elif pipeline_parameters["glm_type"] == "correlation":
-        surfstat_folder = "surfstat_" + pipeline_parameters["glm_type"] + "_analysis"
-    else:
-        raise NotImplementedError(
-            "The other GLM situations have not been implemented in this pipeline."
-        )
-
-    destination_dir = os.path.join(
-        os.path.expanduser(caps_dir), "groups", group_id, "statistics", surfstat_folder
-    )
-
-    if overwrite_caps:
-        raise NotImplementedError("save_to_caps(overwrite_caps=True) not implemented")
-    shutil.copytree(source_dir, destination_dir, symlinks=True)
-    print_end_image(group_id)
diff --git a/clinica/pipelines/statistics_surface/surfstat/__init__.py b/clinica/pipelines/statistics_surface/surfstat/__init__.py
new file mode 100644
index 0000000000..e7ba8129a9
--- /dev/null
+++ b/clinica/pipelines/statistics_surface/surfstat/__init__.py
@@ -0,0 +1,4 @@
+from ._surfstat import clinica_surfstat
+from ._utils import get_t1_freesurfer_custom_file_template
+
+__all__ = ["clinica_surfstat", "get_t1_freesurfer_custom_file_template"]
diff --git a/clinica/pipelines/statistics_surface/clinica_surfstat.py b/clinica/pipelines/statistics_surface/surfstat/_surfstat.py
similarity index 78%
rename from clinica/pipelines/statistics_surface/clinica_surfstat.py
rename to clinica/pipelines/statistics_surface/surfstat/_surfstat.py
index 8ca7f74e89..bf1712947e 100644
--- a/clinica/pipelines/statistics_surface/clinica_surfstat.py
+++ b/clinica/pipelines/statistics_surface/surfstat/_surfstat.py
@@ -1,27 +1,18 @@
-from os import PathLike
 from pathlib import Path
-from typing import Dict, Optional
-
-from ._inputs import (
-    _build_thickness_array,
-    _get_average_surface,
-    _get_t1_freesurfer_custom_file_template,
-    _read_and_check_tsv_file,
-)
-from ._model import create_glm_model
+from typing import Optional
 
 
 def clinica_surfstat(
-    input_dir: PathLike,
-    output_dir: PathLike,
-    tsv_file: PathLike,
+    input_dir: Path,
+    output_dir: Path,
+    tsv_file: Path,
     design_matrix: str,
     contrast: str,
     glm_type: str,
     group_label: str,
-    freesurfer_home: PathLike,
-    surface_file: Optional[PathLike],
+    freesurfer_home: Path,
     feature_label: str,
+    surface_file: Optional[str] = None,
     fwhm: Optional[int] = 20,
     threshold_uncorrected_pvalue: Optional[float] = 0.001,
     threshold_corrected_pvalue: Optional[float] = 0.05,
@@ -73,14 +64,14 @@ def clinica_surfstat(
 
     Parameters
     ----------
-    input_dir : PathLike
-        Path to the input folder.
+    input_dir : Path
+        The path to the input folder.
 
-    output_dir : PathLike
-        Path to the output folder for storing results.
+    output_dir : Path
+        The path to the output folder for storing results.
 
-    tsv_file : PathLike
-        Path to the TSV file `subjects.tsv` which contains the
+    tsv_file : Path
+        The path to the TSV file `subjects.tsv` which contains the
         necessary metadata to run the statistical analysis.
 
         .. warning::
@@ -108,11 +99,11 @@ def clinica_surfstat(
         The label for the group. This is used in the output file names
         (see main description of the function).
 
-    freesurfer_home : PathLike
+    freesurfer_home : Path
         The path to the home folder of Freesurfer.
         This is required to get the fsaverage templates.
 
-    surface_file : PathLike, optional
+    surface_file : str, optional
         The path to the surface file to analyze.
         Typically the cortical thickness.
         If `None`, the surface file will be the t1 freesurfer template.
@@ -134,18 +125,28 @@ def clinica_surfstat(
     cluster_threshold : float, optional
         The threshold to be used to declare clusters as significant. Default=0.05.
     """
-    # Load subjects data
-    df_subjects = _read_and_check_tsv_file(tsv_file)
-    surface_file = surface_file or _get_t1_freesurfer_custom_file_template(input_dir)
-    thickness = _build_thickness_array(input_dir, surface_file, df_subjects, fwhm)
+    from ._utils import (
+        build_thickness_array,
+        get_average_surface,
+        get_t1_freesurfer_custom_file_template,
+        read_and_check_tsv_file,
+    )
+    from .models import GLMModelType, create_glm_model
+
+    df_subjects = read_and_check_tsv_file(tsv_file)
+    surface_file: str = surface_file or get_t1_freesurfer_custom_file_template(
+        input_dir
+    )
+    thickness = build_thickness_array(input_dir, surface_file, df_subjects, fwhm)
 
     # Load average surface template
-    fsaverage_path = freesurfer_home / Path("subjects/fsaverage/surf")
-    average_surface, average_mesh = _get_average_surface(fsaverage_path)
+    average_surface, average_mesh = get_average_surface(
+        freesurfer_home / "subjects" / "fsaverage" / "surf"
+    )
 
     # Build and run GLM model
     glm_model = create_glm_model(
-        glm_type,
+        GLMModelType(glm_type),
         design_matrix,
         df_subjects,
         contrast,
@@ -158,4 +159,4 @@ def clinica_surfstat(
     )
     glm_model.fit(thickness, average_surface)
     glm_model.save_results(output_dir, ["json", "mat"])
-    # glm_model.plot_results(output_dir, ["nilearn_plot_surf_stat_map"], average_mesh)
+    glm_model.plot_results(output_dir, ["nilearn_plot_surf_stat_map"], average_mesh)
diff --git a/clinica/pipelines/statistics_surface/_inputs.py b/clinica/pipelines/statistics_surface/surfstat/_utils.py
similarity index 88%
rename from clinica/pipelines/statistics_surface/_inputs.py
rename to clinica/pipelines/statistics_surface/surfstat/_utils.py
index fd7296dc36..e284d06558 100644
--- a/clinica/pipelines/statistics_surface/_inputs.py
+++ b/clinica/pipelines/statistics_surface/surfstat/_utils.py
@@ -13,7 +13,15 @@
 TSV_SECOND_COLUMN = "session_id"
 
 
-def _read_and_check_tsv_file(tsv_file: PathLike) -> pd.DataFrame:
+__all__ = [
+    "read_and_check_tsv_file",
+    "get_t1_freesurfer_custom_file_template",
+    "build_thickness_array",
+    "get_average_surface",
+]
+
+
+def read_and_check_tsv_file(tsv_file: PathLike) -> pd.DataFrame:
     """This function reads the TSV file provided and performs some basic checks.
 
     Parameters
@@ -44,7 +52,7 @@ def _read_and_check_tsv_file(tsv_file: PathLike) -> pd.DataFrame:
 )
 
 
-def _get_t1_freesurfer_custom_file_template(base_dir: PathLike) -> str:
+def get_t1_freesurfer_custom_file_template(base_dir: PathLike) -> str:
     """Returns a Template for the path to the desired surface file.
 
     Parameters
@@ -60,8 +68,8 @@ def _get_t1_freesurfer_custom_file_template(base_dir: PathLike) -> str:
     return str(base_dir) + T1_FREESURFER_TEMPLATE_PATH_FROM_CAPS_ROOT
 
 
-def _build_thickness_array(
-    input_dir: PathLike,
+def build_thickness_array(
+    input_dir: Path,
     surface_file: str,
     df: pd.DataFrame,
     fwhm: float,
@@ -93,9 +101,9 @@ def _build_thickness_array(
     for idx, row in df.iterrows():
         subject, session = idx
         parts = []
-        for hemi in ["lh", "rh"]:
+        for hemi in ("lh", "rh"):
             query = {"subject": subject, "session": session, "fwhm": fwhm, "hemi": hemi}
-            surface_file_path = str(Path(input_dir) / Path(str(surface_file % query)))
+            surface_file_path = str(input_dir / (surface_file % query))
             parts.append(load(surface_file_path).get_fdata())
         combined = np.vstack(parts)
         thickness.append(combined.flatten())
@@ -108,7 +116,7 @@ def _build_thickness_array(
     return thickness
 
 
-def _get_average_surface(fsaverage_path: PathLike) -> Tuple[Dict, Mesh]:
+def get_average_surface(fsaverage_path: Path) -> Tuple[Dict, Mesh]:
     """This function extracts the average surface and the average mesh
     from the path to the fsaverage templates.
 
@@ -145,8 +153,7 @@ def _get_average_surface(fsaverage_path: PathLike) -> Tuple[Dict, Mesh]:
     from nilearn.surface import Mesh, load_surf_mesh
 
     meshes = [
-        load_surf_mesh(str(fsaverage_path / Path(f"{hemi}.pial")))
-        for hemi in ["lh", "rh"]
+        load_surf_mesh(str(fsaverage_path / f"{hemi}.pial")) for hemi in ("lh", "rh")
     ]
     coordinates = np.vstack([mesh.coordinates for mesh in meshes])
     faces = np.vstack(
diff --git a/clinica/pipelines/statistics_surface/surfstat/models/__init__.py b/clinica/pipelines/statistics_surface/surfstat/models/__init__.py
new file mode 100644
index 0000000000..8f7ab69a63
--- /dev/null
+++ b/clinica/pipelines/statistics_surface/surfstat/models/__init__.py
@@ -0,0 +1,3 @@
+from ._factory import GLMModelType, create_glm_model
+
+__all__ = ["create_glm_model", "GLMModelType"]
diff --git a/clinica/pipelines/statistics_surface/surfstat/models/_base.py b/clinica/pipelines/statistics_surface/surfstat/models/_base.py
new file mode 100644
index 0000000000..74d15a47c9
--- /dev/null
+++ b/clinica/pipelines/statistics_surface/surfstat/models/_base.py
@@ -0,0 +1,234 @@
+import abc
+from pathlib import Path
+from typing import Dict, List, Optional, Union
+
+import numpy as np
+import pandas as pd
+from brainstat.stats.SLM import SLM
+from brainstat.stats.terms import FixedEffect
+from nilearn.surface import Mesh
+
+from clinica.utils.stream import cprint
+
+from ._contrast import Contrast
+from ._utils import build_model, print_clusters
+from .results import (
+    StatisticsResults,
+    StatisticsResultsPlotter,
+    StatisticsResultsSerializer,
+)
+
+__all__ = ["GLM"]
+
+
+class GLM:
+    """This class implements the functionalities common to all GLM models
+    used in the Clinica SurfaceStatistics pipeline.
+
+    Attributes
+    ----------
+    design : str
+        The design matrix specified in string format.
+        If this contains a "*", it will be interpreted as an interaction effect.
+
+    df : pd.DataFrame
+        The subjects DataFrame.
+
+    feature_label : str
+        The label used for building output filenames.
+
+    contrast : str
+        The contrast specified in string format.
+
+    fwhm : int, optional
+        The smoothing FWHM. This is used in the output file names.
+        Default=20.
+
+    threshold_uncorrected_pvalue : float, optional
+        Threshold for uncorrected P-values. None or 0 falls back to 0.001.
+
+    threshold_corrected_pvalue : float, optional
+        Threshold for corrected P-values. None or 0 falls back to 0.05.
+
+    cluster_threshold : float, optional
+        Threshold to declare clusters significant. None or 0 falls back to 0.001.
+    """
+
+    default_threshold_uncorrected_pvalue = 0.001
+    default_threshold_corrected_pvalue = 0.05
+    default_cluster_threshold = 0.001
+
+    def __init__(
+        self,
+        design: str,
+        df: pd.DataFrame,
+        feature_label: str,
+        contrast: str,
+        fwhm: Optional[int] = 20,
+        threshold_uncorrected_pvalue: Optional[float] = None,
+        threshold_corrected_pvalue: Optional[float] = None,
+        cluster_threshold: Optional[float] = None,
+    ):
+        self._two_tailed: bool = False
+        self._correction: List[str] = ["fdr", "rft"]
+        self.feature_label: str = feature_label
+        self.fwhm: Optional[int] = fwhm
+        self.threshold_uncorrected_pvalue: float = (
+            threshold_uncorrected_pvalue or self.default_threshold_uncorrected_pvalue
+        )
+        self.threshold_corrected_pvalue: float = (
+            threshold_corrected_pvalue or self.default_threshold_corrected_pvalue
+        )
+        self.cluster_threshold: float = (
+            cluster_threshold or self.default_cluster_threshold
+        )
+        self.results_: Optional[dict] = None
+        self.slm_models_: Optional[dict] = None
+        self.filenames: dict = {}
+        self.model: FixedEffect = build_model(design, df)
+        self.contrasts: List[Contrast] = self._build_contrasts(contrast, df)
+
+    @abc.abstractmethod
+    def _build_contrasts(
+        self, contrast: str, subjects_df: pd.DataFrame
+    ) -> List[Contrast]:
+        raise NotImplementedError
+
+    @property
+    def contrast_names(self) -> List[str]:
+        if self.contrasts is not None:
+            return [contrast.name for contrast in self.contrasts]
+        return list()
+
+    def get_contrast_by_name(self, contrast_name: str) -> Contrast:
+        if self.contrasts:
+            contrast = [c for c in self.contrasts if c.name == contrast_name]
+            if len(contrast) == 1:
+                return contrast[0]
+        raise ValueError(f"Unknown contrast {contrast_name}")
+
+    @property
+    def results(self) -> Optional[dict]:
+        if self._is_fitted():
+            return self.results_
+
+    def get_output_filename(self, contrast_name: str) -> str:
+        """Returns the output file name root for the provided contrast.
+
+        .. note::
+            The name itself is built by `_get_output_filename` in subclasses.
+
+        Parameters
+        ----------
+        contrast_name : str
+            Contrast for which to get the output filename.
+        """
+        contrast = self.get_contrast_by_name(contrast_name)
+        return self._get_output_filename(contrast)
+
+    @abc.abstractmethod
+    def _get_output_filename(self, contrast: Contrast) -> str:
+        raise NotImplementedError
+
+    def _is_fitted(self) -> bool:
+        return self.results_ is not None
+
+    def fit(
+        self, data: np.ndarray, surface: Dict, mask: Optional[np.ndarray] = None
+    ) -> None:
+        """Fit the GLM model instance.
+
+        Parameters
+        ----------
+        data : np.ndarray
+            The data on which to fit the GLM model.
+
+        surface : dict
+            The Brainstat surface on which to fit the GLM model.
+
+        mask : np.ndarray, optional
+            The mask to be used to mask the data. Default=None.
+        """
+        if mask is None:
+            mask = data[0, :] > 0  # default: columns where the first row is > 0
+        self.results_ = dict()
+        self.slm_models_ = dict()
+        for contrast in self.contrasts:
+            slm_model = SLM(
+                self.model,
+                contrast=contrast.built_contrast,
+                surf=surface,
+                mask=mask,
+                two_tailed=self._two_tailed,
+                correction=self._correction,
+                cluster_threshold=self.cluster_threshold,
+            )
+            cprint(
+                msg=f"Fitting the GLM model with contrast {contrast.name}...",
+                lvl="info",
+            )
+            slm_model.fit(data)
+            print_clusters(slm_model, self.threshold_corrected_pvalue)
+            self.results_[contrast.name] = StatisticsResults.from_slm_model(
+                slm_model,
+                mask,
+                self.threshold_uncorrected_pvalue,
+                self.threshold_corrected_pvalue,
+            )
+            self.slm_models_[contrast.name] = slm_model
+
+    def save_results(self, output_dir: Path, method: Union[str, List[str]]) -> None:
+        """Save results to the provided output directory.
+
+        Parameters
+        ----------
+        output_dir : Path
+            The output directory in which to write the results.
+
+        method : str or List[str]
+            The method(s) to write the results.
+        """
+        if not self._is_fitted():
+            raise ValueError(
+                "GLM model needs to be fitted before accessing the results."
+            )
+        if isinstance(method, str):
+            method = [method]
+        for contrast_name, result in self.results_.items():
+            result_serializer = StatisticsResultsSerializer(
+                output_dir / self.get_output_filename(contrast_name)
+            )
+            for meth in method:
+                result_serializer.save(result, meth)
+
+    def plot_results(
+        self,
+        output_dir: Path,
+        method: Union[str, List[str]],
+        mesh: Mesh,
+    ) -> None:
+        """Plot results to the provided directory.
+
+        Parameters
+        ----------
+        output_dir : Path
+            The output directory in which to write the plot files.
+
+        method : str or List[str]
+            The method(s) to make the plots.
+
+        mesh : nilearn.surface.Mesh
+            The mesh on which to plot the result data.
+        """
+        if not self._is_fitted():
+            raise ValueError(
+                "GLM model needs to be fitted before accessing the results."
+            )
+        if isinstance(method, str):
+            method = [method]
+        for contrast_name, result in self.results_.items():
+            plotter = StatisticsResultsPlotter(
+                output_dir / self.get_output_filename(contrast_name), mesh
+            )
+            for meth in method:
+                plotter.plot(result, meth)
diff --git a/clinica/pipelines/statistics_surface/surfstat/models/_contrast.py b/clinica/pipelines/statistics_surface/surfstat/models/_contrast.py
new file mode 100644
index 0000000000..f03ab43ba1
--- /dev/null
+++ b/clinica/pipelines/statistics_surface/surfstat/models/_contrast.py
@@ -0,0 +1,87 @@
+import numpy as np
+import pandas as pd
+
+from ._utils import check_column_in_df, is_categorical
+
+__all__ = [
+    "Contrast",
+    "CorrelationContrast",
+    "GroupContrast",
+    "GroupContrastWithInteraction",
+]
+
+
+class Contrast:
+    def __init__(self, name: str, built_contrast: pd.Series) -> None:
+        self.name: str = name
+        self.built_contrast: pd.Series = built_contrast
+
+
+class CorrelationContrast(Contrast):
+    """Contrast on a single column; a leading "-" in the name negates it."""
+
+    def __init__(
+        self, name: str, absolute_name: str, built_contrast: pd.Series, sign: str
+    ):
+        super().__init__(name, built_contrast)
+        self.sign = sign
+        self.absolute_name = absolute_name
+
+    @classmethod
+    def from_string(cls, contrast: str, df: pd.DataFrame):
+        """Build the contrast from column `contrast` of `df`, leaving `df` as is."""
+        negative = contrast.startswith("-")
+        absolute_name = contrast[1:].lstrip() if negative else contrast
+        check_column_in_df(df, absolute_name)
+        # Negate into a new Series: an in-place `*=` could write through to `df`.
+        built_contrast = df[absolute_name] * -1 if negative else df[absolute_name]
+        sign = "negative" if negative else "positive"
+        return cls(contrast, absolute_name, built_contrast, sign)
+
+
+class GroupContrastWithInteraction(Contrast):
+    """Contrast for a "<a> * <b>" interaction: one categorical, one continuous."""
+
+    def __init__(self, name: str, built_contrast: pd.Series):
+        super().__init__(name, built_contrast)
+
+    @classmethod
+    def from_string(cls, contrast: str, df: pd.DataFrame):
+        terms = [term.strip() for term in contrast.split("*")]
+        for term in terms:
+            check_column_in_df(df, term)
+        flags = [is_categorical(df, term) for term in terms]
+        if len(terms) != 2 or sum(flags) != 1:
+            raise ValueError(
+                "The contrast must be an interaction between one continuous "
+                "variable and one categorical variable. Your contrast contains "
+                f"the following variables : {terms}"
+            )
+        group_name, value_name = terms if flags[0] else terms[::-1]
+        groups, values = df[group_name], df[value_name]
+        levels = np.unique(groups)
+        first = values.where(groups == levels[0], 0)
+        second = values.where(groups == levels[1], 0)
+        return cls(contrast, first - second)
+
+
+class GroupContrast(Contrast):
+    """Contrast opposing the first two sorted values of a categorical column."""
+
+    def __init__(self, name: str, built_contrast: pd.Series):
+        super().__init__(name, built_contrast)
+
+    @classmethod
+    def from_string(cls, contrast: str, df: pd.DataFrame, sign: str):
+        """Build the contrast; `sign` equal to "positive" or not sets direction."""
+        check_column_in_df(df, contrast)
+        if not is_categorical(df, contrast):
+            raise ValueError(
+                "Contrast should refer to a categorical variable for group comparison. "
+                "Please select 'correlation' for 'glm_type' otherwise."
+            )
+        group_values = np.unique(df[contrast])
+        i, j = (0, 1) if sign == "positive" else (1, 0)
+        contrast_name = f"{group_values[j]}-lt-{group_values[i]}"
+        is_i, is_j = (df[contrast] == group_values[k] for k in (i, j))
+        return cls(contrast_name, is_i.astype(int) - is_j.astype(int))
diff --git a/clinica/pipelines/statistics_surface/surfstat/models/_correlation.py b/clinica/pipelines/statistics_surface/surfstat/models/_correlation.py
new file mode 100644
index 0000000000..0ba151245b
--- /dev/null
+++ b/clinica/pipelines/statistics_surface/surfstat/models/_correlation.py
@@ -0,0 +1,61 @@
+from typing import List, Optional
+
+import pandas as pd
+
+from ._base import GLM
+from ._contrast import CorrelationContrast
+
+
+class CorrelationGLM(GLM):
+    """Class implementing the correlation type GLM model.
+
+    Attributes
+    ----------
+    See documentation for `GLM` class.
+
+    group_label : str or None
+        The label inserted after "group-" in output filenames (no default).
+    """
+
+    def __init__(
+        self,
+        design: str,
+        df: pd.DataFrame,
+        feature_label: str,
+        contrast: str,
+        group_label: Optional[str],
+        fwhm: Optional[int] = 20,
+        threshold_uncorrected_pvalue: Optional[float] = 0.001,
+        threshold_corrected_pvalue: Optional[float] = 0.05,
+        cluster_threshold: Optional[float] = 0.001,
+    ) -> None:
+        super().__init__(
+            design,
+            df,
+            feature_label,
+            contrast,
+            fwhm,
+            threshold_uncorrected_pvalue,
+            threshold_corrected_pvalue,
+            cluster_threshold,
+        )
+        self.with_interaction: bool = False
+        self.group_label: Optional[str] = group_label
+
+    def _build_contrasts(
+        self, contrast: str, subjects_df: pd.DataFrame
+    ) -> List[CorrelationContrast]:
+        return [CorrelationContrast.from_string(contrast, subjects_df)]
+
+    def _get_output_filename(self, contrast: CorrelationContrast) -> str:
+        """Build the filename from class attributes and provided contrast.
+
+        Parameters
+        ----------
+        contrast : CorrelationContrast
+            The contrast whose `absolute_name` and `sign` go into the filename.
+        """
+        return (
+            f"group-{self.group_label}_correlation-{contrast.absolute_name}"
+            f"-{contrast.sign}_measure-{self.feature_label}_fwhm-{self.fwhm}"
+        )
diff --git a/clinica/pipelines/statistics_surface/surfstat/models/_factory.py b/clinica/pipelines/statistics_surface/surfstat/models/_factory.py
new file mode 100644
index 0000000000..49917a547f
--- /dev/null
+++ b/clinica/pipelines/statistics_surface/surfstat/models/_factory.py
@@ -0,0 +1,99 @@
+from enum import Enum
+from typing import Optional
+
+import pandas as pd
+
+from ._base import GLM
+from ._correlation import CorrelationGLM
+from ._group import GroupGLM, GroupGLMWithInteraction
+
+__all__ = ["GLMModelType", "create_glm_model"]
+
+
+class GLMModelType(str, Enum):
+    """Types of GLM models which `create_glm_model` is able to build."""
+
+    CORRELATION = "correlation"  # built as a `CorrelationGLM`
+    GROUP_COMPARISON = "group_comparison"  # `GroupGLM`, or its interaction variant
+
+
+def create_glm_model(
+    glm_type: GLMModelType,
+    design: str,
+    df: pd.DataFrame,
+    contrast: str,
+    feature_label: str,
+    group_label: Optional[str] = "group",
+    fwhm: Optional[int] = 20,
+    threshold_uncorrected_pvalue: Optional[float] = 0.001,
+    threshold_corrected_pvalue: Optional[float] = 0.05,
+    cluster_threshold: Optional[float] = 0.001,
+) -> GLM:
+    """Factory method for building a GLM model instance corresponding to the
+    provided type and design matrix.
+
+    Parameters
+    ----------
+    glm_type : GLMModelType
+        The type of GLM to be created.
+
+    design : str
+        The design matrix specified in string format. For group comparisons,
+        a "*" in it selects the model with interaction effects.
+
+    df : pd.DataFrame
+        The subjects DataFrame.
+
+    contrast : str
+        The contrast specified in string format.
+
+    feature_label : str
+        The label used for building output filenames.
+
+    group_label : str, optional
+        The group label forwarded to the created model. Default="group".
+
+    fwhm : int, optional
+        The smoothing FWHM. This is used in the output file names.
+        Default=20.
+
+    threshold_uncorrected_pvalue : float, optional
+        The threshold to be used with uncorrected P-values. Default=0.001.
+
+    threshold_corrected_pvalue : float, optional
+        The threshold to be used with corrected P-values. Default=0.05.
+
+    cluster_threshold : float, optional
+        The threshold to be used to declare clusters as significant. Default=0.001.
+
+    Returns
+    -------
+    model : GLM
+        An instance of the subclass of `GLM` matching the requested type.
+
+    Raises
+    ------
+    ValueError
+        If the glm_type is not one of the members of `GLMModelType`.
+    """
+    from clinica.utils.stream import cprint
+
+    cprint(
+        msg=f"The GLM model is: {design} and the GLM type is: {glm_type}",
+        lvl="info",
+    )
+    params = {
+        "group_label": group_label,
+        "fwhm": fwhm,
+        "threshold_uncorrected_pvalue": threshold_uncorrected_pvalue,
+        "threshold_corrected_pvalue": threshold_corrected_pvalue,
+        "cluster_threshold": cluster_threshold,
+    }
+    if glm_type == GLMModelType.CORRELATION:
+        return CorrelationGLM(design, df, feature_label, contrast, **params)
+    if glm_type == GLMModelType.GROUP_COMPARISON:
+        # A "*" in the design matrix denotes an interaction effect.
+        glm_class = GroupGLMWithInteraction if "*" in design else GroupGLM
+        return glm_class(design, df, feature_label, contrast, **params)
+    supported = ", ".join(repr(t.value) for t in GLMModelType)
+    raise ValueError(f"Unknown GLM type: {glm_type}. Supported types: {supported}.")
diff --git a/clinica/pipelines/statistics_surface/surfstat/models/_group.py b/clinica/pipelines/statistics_surface/surfstat/models/_group.py
new file mode 100644
index 0000000000..39e0c0ed37
--- /dev/null
+++ b/clinica/pipelines/statistics_surface/surfstat/models/_group.py
@@ -0,0 +1,118 @@
+import warnings
+from typing import List, Optional
+
+import pandas as pd
+
+from ._base import GLM
+from ._contrast import GroupContrast, GroupContrastWithInteraction
+
+
+class GroupGLM(GLM):
+    """Class implementing group GLM models.
+
+    Attributes
+    ----------
+    See documentation for `GLM` class.
+
+    group_label : str, optional
+        The label inserted in the output filenames. Default="group".
+    """
+
+    def __init__(
+        self,
+        design: str,
+        df: pd.DataFrame,
+        feature_label: str,
+        contrast: str,
+        group_label: Optional[str] = "group",
+        fwhm: Optional[int] = 20,
+        threshold_uncorrected_pvalue: Optional[float] = 0.001,
+        threshold_corrected_pvalue: Optional[float] = 0.05,
+        cluster_threshold: Optional[float] = 0.001,
+    ):
+        super().__init__(
+            design,
+            df,
+            feature_label,
+            contrast,
+            fwhm,
+            threshold_uncorrected_pvalue,
+            threshold_corrected_pvalue,
+            cluster_threshold,
+        )
+        self.with_interaction = False
+        self.group_label = group_label
+
+    def _build_contrasts(
+        self, contrast: str, subjects_df: pd.DataFrame
+    ) -> List[GroupContrast]:
+        return [
+            GroupContrast.from_string(contrast, subjects_df, sign)
+            for sign in ("positive", "negative")
+        ]
+
+    def _get_output_filename(self, contrast: GroupContrast) -> str:
+        """Build the filename root part from class attributes and provided contrast.
+
+        Parameters
+        ----------
+        contrast : GroupContrast
+            The contrast whose `name` is inserted in the filename.
+        """
+        return f"group-{self.group_label}_{contrast.name}_measure-{self.feature_label}_fwhm-{self.fwhm}"
+
+
+class GroupGLMWithInteraction(GroupGLM):
+    """GLM model for group comparison with interaction effects.
+    A warning about the format of the TSV files is emitted on instantiation.
+
+    Attributes
+    ----------
+    See attributes of parent class `GroupGLM`.
+    """
+
+    def __init__(
+        self,
+        design: str,
+        df: pd.DataFrame,
+        feature_label: str,
+        contrast: str,
+        group_label: Optional[str] = "group",
+        fwhm: Optional[int] = 20,
+        threshold_uncorrected_pvalue: Optional[float] = 0.001,
+        threshold_corrected_pvalue: Optional[float] = 0.05,
+        cluster_threshold: Optional[float] = 0.001,
+    ):
+        super().__init__(
+            design,
+            df,
+            feature_label,
+            contrast,
+            group_label,
+            fwhm,
+            threshold_uncorrected_pvalue,
+            threshold_corrected_pvalue,
+            cluster_threshold,
+        )
+        self.with_interaction: bool = True
+        warnings.warn(
+            "You included interaction as covariate in your model, "
+            "please carefully check the format of your tsv files."
+        )
+
+    def _build_contrasts(
+        self, contrast: str, subjects_df: pd.DataFrame
+    ) -> List[GroupContrastWithInteraction]:
+        return [GroupContrastWithInteraction.from_string(contrast, subjects_df)]
+
+    def _get_output_filename(self, contrast: GroupContrastWithInteraction) -> str:
+        """Build the filename root; the group label is not part of it.
+
+        Parameters
+        ----------
+        contrast : GroupContrastWithInteraction
+            The contrast whose `name` is inserted in the filename.
+        """
+        return (
+            f"interaction-{contrast.name}_measure-{self.feature_label}_fwhm-{self.fwhm}"
+        )
diff --git a/clinica/pipelines/statistics_surface/surfstat/models/_utils.py b/clinica/pipelines/statistics_surface/surfstat/models/_utils.py
new file mode 100644
index 0000000000..a4344199ef
--- /dev/null
+++ b/clinica/pipelines/statistics_surface/surfstat/models/_utils.py
@@ -0,0 +1,152 @@
+from string import Template
+from typing import Optional
+
+import pandas as pd
+from brainstat.stats.SLM import SLM
+from brainstat.stats.terms import FixedEffect
+
+__all__ = ["build_model", "print_clusters", "check_column_in_df", "is_categorical"]
+
+
+MISSING_TERM_ERROR_MSG = Template(  # message used by `check_column_in_df`
+    "Term ${term} from the design matrix is not in the columns of the "
+    "provided TSV file. Please make sure that there is no typo."
+)
+
+
+def print_clusters(model: SLM, threshold: float) -> None:
+    """Print the clusters found by the model after correction, together
+    with their number and the number of significant ones.
+
+    Parameters
+    ----------
+    model : brainstat.stats.SLM
+        Fitted SLM model.
+
+    threshold : float
+        P-value up to which a cluster is counted as significant.
+    """
+    from clinica.utils.stream import cprint
+
+    cprint("#" * 40)
+    cprint("After correction (Cluster-wise Correction for Multiple Comparisons): ")
+    clusters = model.P["clus"][0]
+    cprint(clusters)
+    cprint(f"Clusters found: {len(clusters)}")
+    # Clusters with a P-value lower or equal to the threshold are significant.
+    n_significant = len(clusters[clusters["P"] <= threshold])
+    cprint(f"Significative clusters (after correction): {n_significant}")
+
+
+def build_model(design_matrix: str, df: pd.DataFrame) -> FixedEffect:
+    """Build a brainstat model from the design matrix in string format.
+
+    This function assumes that the design matrix is a sum of terms,
+    formatted in the following way:
+
+        1 + factor_1 + factor_2 + ...
+
+    Or:
+
+        factor_1 + factor_2 + ...
+
+    The intercept is skipped as brainstat includes it automatically.
+    A term can also be an interaction effect between several factors,
+    written as a product: factor_1 * factor_2.
+
+    Parameters
+    ----------
+    design_matrix : str
+        Design matrix specified as a string. Spaces around terms are ignored.
+
+    df : pd.DataFrame
+        Subjects DataFrame.
+
+    Returns
+    -------
+    model : FixedEffect
+        BrainStats model.
+
+    Raises
+    ------
+    ValueError
+        If the design matrix is empty.
+    """
+    from functools import reduce
+
+    if len(design_matrix) == 0:
+        raise ValueError("Design matrix cannot be empty.")
+    effects = []
+    # Without any "+", the split yields the whole design as a single term.
+    for raw_term in design_matrix.split("+"):
+        term = raw_term.strip()
+        # Intercept is automatically included in brainstat
+        if term == "1":
+            continue
+        # Handles the interaction effects as the product of their factors.
+        # A term without any "*" has a single factor, which is used as is.
+        factors = [_build_model_term(name.strip(), df) for name in term.split("*")]
+        effects.append(reduce(lambda left, right: left * right, factors))
+    return reduce(lambda left, right: left + right, effects)
+
+
+def _build_model_term(
+    term: str,
+    df: pd.DataFrame,
+    add_intercept: Optional[bool] = True,
+) -> FixedEffect:
+    """Builds a BrainStats model term from the subjects
+    DataFrame and a column name.
+
+    Parameters
+    ----------
+    term : str
+        The name of the column of the DataFrame to be used.
+
+    df : pd.DataFrame
+        The subjects DataFrame.
+
+    add_intercept : bool, optional
+        Forwarded to `FixedEffect`. If `True`, adds an intercept term. Default=True.
+
+    Returns
+    -------
+    FixedEffect :
+        BrainStats model term.
+    """
+    return FixedEffect(df[term], add_intercept=add_intercept)
+
+
+def check_column_in_df(df: pd.DataFrame, column: str) -> None:
+    """Raise a ValueError if `column` is not one of the columns of `df`.
+
+    Parameters
+    ----------
+    df : pd.DataFrame
+        DataFrame to analyze.
+
+    column : str
+        Name of the column to check.
+    """
+    if column in df.columns:
+        return
+    raise ValueError(MISSING_TERM_ERROR_MSG.safe_substitute(term=column))
+
+
+def is_categorical(df: pd.DataFrame, column: str) -> bool:
+    """Tell whether a column is considered categorical, based on its dtype.
+
+    Parameters
+    ----------
+    df : pd.DataFrame
+        The DataFrame to analyze.
+
+    column : str
+        The name of the column to check.
+
+    Returns
+    -------
+    bool :
+        `False` if the name of the column dtype starts with "float", `True` otherwise.
+    """
+    return not df[column].dtype.name.startswith("float")
diff --git a/clinica/pipelines/statistics_surface/surfstat/models/results/__init__.py b/clinica/pipelines/statistics_surface/surfstat/models/results/__init__.py
new file mode 100644
index 0000000000..b793ef8cb5
--- /dev/null
+++ b/clinica/pipelines/statistics_surface/surfstat/models/results/__init__.py
@@ -0,0 +1,9 @@
+from ._plot import StatisticsResultsPlotter
+from ._serialize import StatisticsResultsSerializer
+from ._statistics import StatisticsResults
+
+__all__ = [
+    "StatisticsResults",
+    "StatisticsResultsSerializer",
+    "StatisticsResultsPlotter",
+]
diff --git a/clinica/pipelines/statistics_surface/surfstat/models/results/_base.py b/clinica/pipelines/statistics_surface/surfstat/models/results/_base.py
new file mode 100644
index 0000000000..58207c4fc7
--- /dev/null
+++ b/clinica/pipelines/statistics_surface/surfstat/models/results/_base.py
@@ -0,0 +1,77 @@
+from typing import Optional
+
+import numpy as np
+
+__all__ = ["Results"]
+
+
+def _convert_arrays_to_lists(data: dict) -> dict:
+    """Return a new dictionary in which the numpy arrays of the input
+    dictionary have been replaced by lists. Nested dictionaries are
+    handled too, while any other kind of value is kept untouched.
+
+    Parameters
+    ----------
+    data : dict
+        The dictionary to clean.
+
+    Returns
+    -------
+    converted : dict
+        The dictionary with arrays casted to lists.
+    """
+    converted = {}
+    for key, value in data.items():
+        if isinstance(value, np.ndarray):
+            value = value.tolist()
+        elif isinstance(value, dict):
+            # Nested dictionaries are converted recursively.
+            value = _convert_arrays_to_lists(value)
+        converted[key] = value
+    return converted
+
+
+class Results:
+    """Base class shared by the containers of GLM results."""
+
+    def to_dict(self) -> dict:
+        """Return the public, non-method members of the instance as a dict.
+
+        Members exposing a `to_dict` method are converted with it, every
+        other value is returned as is, without any casting.
+
+        Returns
+        -------
+        data : dict
+            Resulting dictionary.
+        """
+        import inspect
+
+        data = {}
+        for name, value in inspect.getmembers(self):
+            # Private attributes and methods are left out.
+            if name.startswith("_") or inspect.ismethod(value):
+                continue
+            # Nested results are turned into dictionaries as well.
+            if hasattr(value, "to_dict"):
+                value = value.to_dict()
+            data[name] = value
+        return data
+
+    def to_json(self, indent: Optional[int] = 4) -> str:
+        """Return the `Results` instance serialized as a JSON string.
+
+        Parameters
+        ----------
+        indent : int, optional
+            Indent to use. Default=4.
+
+        Returns
+        -------
+        str :
+            The JSON dumps of the results, with arrays casted to lists.
+        """
+        import json
+
+        serializable = _convert_arrays_to_lists(self.to_dict())
+        return json.dumps(serializable, indent=indent)
diff --git a/clinica/pipelines/statistics_surface/surfstat/models/results/_plot.py b/clinica/pipelines/statistics_surface/surfstat/models/results/_plot.py
new file mode 100644
index 0000000000..942a39f1d4
--- /dev/null
+++ b/clinica/pipelines/statistics_surface/surfstat/models/results/_plot.py
@@ -0,0 +1,89 @@
+from pathlib import Path
+from typing import Callable
+
+from nilearn.surface import Mesh
+
+from ._statistics import StatisticsResults
+
+__all__ = ["StatisticsResultsPlotter"]
+
+
+class StatisticsResultsPlotter:
+    """Class responsible for plotting the results of a GLM fit.
+
+    Attributes
+    ----------
+    output_file : PathLike
+        Root of the output files, completed with the plotted element name.
+
+    mesh : nilearn.surface.Mesh
+        The mesh to be used for plotting results.
+    """
+
+    def __init__(self, output_file: Path, mesh: Mesh):
+        self.output_file = output_file
+        self.mesh = mesh
+        self.plotting_extension = ".png"
+        self.no_plot = {"coefficients"}  # Elements which should not be plotted
+
+    def plot(self, result: StatisticsResults, method: str) -> None:
+        """Plot the provided results with the requested plotting method.
+
+        Parameters
+        ----------
+        result : StatisticsResults
+            The results to be plotted.
+
+        method : str
+            The plotting method to use.
+        """
+        draw = self._get_plotter(method)
+        draw(result)
+
+    def _get_plotter(self, method: str) -> Callable[[StatisticsResults], None]:
+        """Return the plotting method matching the provided name.
+
+        Parameters
+        ----------
+        method : str
+            Name of the plotting method to use.
+
+        Returns
+        -------
+        Callable :
+            Plotting method. Unknown names raise a NotImplementedError.
+        """
+        if method != "nilearn_plot_surf_stat_map":
+            raise NotImplementedError(f"Plotting method {method} is not implemented.")
+        return self._plot_stat_maps
+
+    def _plot_stat_maps(self, result: StatisticsResults) -> None:
+        """Plot each result with `nilearn.plotting.plot_surf_stat_map`.
+
+        Parameters
+        ----------
+        result : StatisticsResults
+            The results to plot.
+        """
+        from nilearn.plotting import plot_surf_stat_map
+
+        from clinica.utils.stream import cprint
+
+        for name, res in result.to_dict().items():
+            # Elements listed in `no_plot` are skipped.
+            if name in self.no_plot:
+                continue
+            plot_filename = f"{self.output_file}_{name}{self.plotting_extension}"
+            if isinstance(res, dict):
+                # Dictionaries provide the texture and its threshold.
+                texture, threshold = res["P"], res["thresh"]
+            else:
+                texture, threshold = res, None
+            cprint(msg=f"Saving plot to {plot_filename}", lvl="info")
+            plot_surf_stat_map(
+                self.mesh,
+                texture,
+                threshold=threshold,
+                output_file=plot_filename,
+                title=name,
+            )
diff --git a/clinica/pipelines/statistics_surface/surfstat/models/results/_serialize.py b/clinica/pipelines/statistics_surface/surfstat/models/results/_serialize.py
new file mode 100644
index 0000000000..3edf65327c
--- /dev/null
+++ b/clinica/pipelines/statistics_surface/surfstat/models/results/_serialize.py
@@ -0,0 +1,110 @@
+from pathlib import Path
+from typing import Callable
+
+from ._statistics import StatisticsResults
+
+__all__ = ["StatisticsResultsSerializer"]
+
+
+class StatisticsResultsSerializer:
+    """This class is responsible for writing instances of `StatisticsResults`
+    to disk through different methods.
+
+    Attributes
+    ----------
+    output_file : PathLike
+        Path and filename root to be used.
+    """
+
+    def __init__(self, output_file: Path):
+        self.output_file = output_file
+        self.json_extension = "_results.json"
+        self.json_indent = 4
+        self.mat_extension = ".mat"
+
+    def save(self, result: StatisticsResults, method: str) -> None:
+        """Save provided `StatisticsResults` to disk with provided method.
+
+        Parameters
+        ----------
+        result : StatisticsResults
+            Results to be saved.
+
+        method : str
+            Name of the saving method to use.
+        """
+        writer = self._get_writer(method)
+        writer(result)
+
+    def _get_writer(self, method: str) -> Callable[[StatisticsResults], None]:
+        """Returns a writer method from its name.
+
+        Parameters
+        ----------
+        method : str
+            The name of the writing method: "json" or "mat", in any letter case.
+
+        Returns
+        -------
+        Callable :
+            The writing method. Other names raise a NotImplementedError.
+        """
+        if method.lower() == "json":
+            return self._write_to_json
+        elif method.lower() == "mat":
+            return self._write_to_mat
+        raise NotImplementedError(f"Serializing method {method} is not implemented.")
+
+    def _write_to_json(self, results: StatisticsResults) -> None:
+        """Write the results to JSON, creating the output folder if needed.
+
+        Parameters
+        ----------
+        results : StatisticsResults
+            The results to write to disk in JSON format.
+        """
+        import json
+
+        from clinica.utils.stream import cprint
+
+        out_json_file = Path(str(self.output_file) + self.json_extension)
+        out_json_file.parent.mkdir(parents=True, exist_ok=True)
+        cprint(
+            msg=f"Writing results to JSON in {out_json_file}...",
+            lvl="info",
+        )
+        # NOTE(review): `to_json` returns a string which `json.dump` encodes once
+        # more: the file holds a JSON string, not an object. Confirm it is intended.
+        with open(out_json_file, "w") as fp:
+            json.dump(results.to_json(indent=self.json_indent), fp)
+
+    def _write_to_mat(self, results: StatisticsResults) -> None:
+        """Write each result having a Matlab label to its own MAT file.
+
+        Parameters
+        ----------
+        results : StatisticsResults
+            The results to write to disk in MAT format.
+        """
+        from scipy.io import savemat
+
+        from clinica.utils.stream import cprint
+
+        # These labels are used for compatibility with the previous
+        # MATLAB implementation of the Statistics Surface Pipeline
+        # of Clinica.
+        struct_labels = {
+            "coefficients": "coef",
+            "TStatistics": "tvaluewithmask",
+            "uncorrectedPValue": "uncorrectedpvaluesstruct",
+            "correctedPValue": "correctedpvaluesstruct",
+            "FDR": "FDR",
+        }
+        for name, res in results.to_dict().items():
+            if name in struct_labels:
+                mat_filename = str(self.output_file) + "_" + name + self.mat_extension
+                cprint(
+                    msg=f"Writing {name} results to MAT in  {mat_filename}",
+                    lvl="info",
+                )
+                savemat(mat_filename, {struct_labels[name]: res})
diff --git a/clinica/pipelines/statistics_surface/surfstat/models/results/_statistics.py b/clinica/pipelines/statistics_surface/surfstat/models/results/_statistics.py
new file mode 100644
index 0000000000..bf8e3c91df
--- /dev/null
+++ b/clinica/pipelines/statistics_surface/surfstat/models/results/_statistics.py
@@ -0,0 +1,187 @@
+from dataclasses import dataclass
+
+import numpy as np
+import pandas as pd
+from brainstat.stats.SLM import SLM
+
+from ._base import Results
+
+__all__ = ["StatisticsResults"]
+
+
+@dataclass
+class PValueResults(Results):
+    """Container for raw (uncorrected) P-value results obtained with a GLM model.
+
+    Attributes
+    ----------
+    pvalues : np.ndarray
+        Array of uncorrected P-values.
+
+    mask : np.ndarray
+        The binary mask.
+
+    threshold : float
+        The threshold used.
+    """
+
+    pvalues: np.ndarray
+    mask: np.ndarray
+    threshold: float
+
+    @property
+    def thresh(self):
+        """For compatibility with previous Matlab implementation."""
+        return self.threshold
+
+    @property
+    def P(self):
+        """For compatibility with previous Matlab implementation."""
+        return self.pvalues
+
+    @classmethod
+    def from_t_statistics(
+        cls,
+        tstats: np.ndarray,
+        df: float,
+        mask: np.ndarray,
+        threshold: float,
+    ):
+        """Instantiate the class from an array of T-statistics.
+
+        Parameters
+        ----------
+        tstats : np.ndarray
+            Array of T-statistics.
+
+        df : float
+            The degrees of freedom of the T distribution.
+
+        mask : np.ndarray
+            The binary mask.
+
+        threshold : float
+            The threshold to be used.
+        """
+        from scipy.stats import t
+
+        # The survival function avoids the precision loss of `1 - t.cdf(...)`.
+        return cls(t.sf(tstats, df), mask, threshold)
+
+
+@dataclass
+class CorrectedPValueResults(PValueResults):
+    """Container for the corrected P-value results obtained with a GLM
+    model. The fields of `PValueResults` come first, see its documentation.
+
+    Attributes
+    ----------
+    cluster_pvalues : np.ndarray
+        The cluster P-values.
+    """
+
+    cluster_pvalues: np.ndarray
+
+    @property
+    def C(self):
+        """For compatibility with previous Matlab implementation."""
+        return self.cluster_pvalues
+
+
+@dataclass
+class StatisticsResults(Results):
+    """Container for the results of a GLM run with one specific contrast.
+
+    Attributes
+    ----------
+    coefficients : np.ndarray
+        The beta coefficients of the fitted GLM model.
+
+    tstats : np.ndarray
+        The corresponding T-statistics.
+
+    uncorrected_p_values : PValueResults
+        The corresponding uncorrected p values, stored in a `PValueResults` instance.
+
+    fdr : np.ndarray
+        The corresponding False Discovery Rate.
+
+    corrected_p_values : CorrectedPValueResults
+        The corresponding corrected p values, stored in a `CorrectedPValueResults` instance.
+    """
+
+    coefficients: np.ndarray
+    tstats: np.ndarray
+    uncorrected_p_values: PValueResults
+    fdr: np.ndarray
+    corrected_p_values: CorrectedPValueResults
+
+    @property
+    def TStatistics(self):
+        """Needed for compatibility with previous implementation in Matlab."""
+        return self.tstats
+
+    @property
+    def uncorrectedPValue(self):
+        """Needed for compatibility with previous implementation in Matlab."""
+        return self.uncorrected_p_values
+
+    @property
+    def correctedPValue(self):
+        """Needed for compatibility with previous implementation in Matlab."""
+        return self.corrected_p_values
+
+    @property
+    def FDR(self):
+        """Needed for compatibility with previous implementation in Matlab."""
+        return self.fdr
+
+    @classmethod
+    def from_slm_model(
+        cls,
+        model: SLM,
+        mask: np.ndarray,
+        threshold_uncorrected_p_value: float,
+        threshold_corrected_p_value: float,
+    ):
+        """Instantiate from a SLM model.
+
+        Parameters
+        ----------
+        model : brainstat.stats.SLM
+            SLM model instance to use.
+
+        mask : np.ndarray
+            The binary mask to use.
+
+        threshold_uncorrected_p_value : float
+            The threshold to use with uncorrected P-values.
+
+        threshold_corrected_p_value : float
+            The threshold to use with corrected P-values.
+        """
+        idx = np.argwhere(np.isnan(model.t))
+        corrected_pvals = model.P["pval"]["P"]
+        # NOTE(review): `corrected_pvals` is not a copy, so `model.P` is presumably
+        # modified too; also confirm `idx` (from `argwhere`) indexes it as intended.
+        corrected_pvals[idx] = 1.0
+        tstats = np.nan_to_num(model.t)
+        uncorrected_p_values = PValueResults.from_t_statistics(
+            tstats,
+            model.df,
+            mask,
+            threshold_uncorrected_p_value,
+        )
+        corrected_p_values = CorrectedPValueResults(
+            corrected_pvals,
+            mask,
+            threshold_corrected_p_value,
+            model.P["pval"]["C"],
+        )
+        return cls(
+            np.nan_to_num(model.coef),
+            tstats,
+            uncorrected_p_values,
+            model.Q,
+            corrected_p_values,
+        )
diff --git a/test/nonregression/pipelines/test_run_pipelines_stats.py b/test/nonregression/pipelines/test_run_pipelines_stats.py
index fa8470428f..9e5e24b2e0 100644
--- a/test/nonregression/pipelines/test_run_pipelines_stats.py
+++ b/test/nonregression/pipelines/test_run_pipelines_stats.py
@@ -7,7 +7,6 @@
 
 import warnings
 from os import fspath
-from pathlib import Path
 from test.nonregression.testing_tools import *
 
 import pytest
@@ -17,7 +16,6 @@
 
 
 @pytest.mark.fast
-# @pytest.mark.skip(reason="This test is currently broken.")
 def test_statistics_surface(cmdopt, tmp_path):
     base_dir = Path(cmdopt["input"])
     working_dir = Path(cmdopt["wd"])
@@ -77,9 +75,7 @@ def run_statistics_surface(
     import numpy as np
     from scipy.io import loadmat
 
-    from clinica.pipelines.statistics_surface.statistics_surface_pipeline import (
-        StatisticsSurface,
-    )
+    from clinica.pipelines.statistics_surface.pipeline import StatisticsSurface
 
     caps_dir = output_dir / "caps"
     tsv = input_dir / "subjects.tsv"
@@ -88,25 +84,23 @@ def run_statistics_surface(
     shutil.copytree(input_dir / "caps", caps_dir, copy_function=shutil.copy)
 
     parameters = {
-        # Clinica compulsory parameters
         "group_label": "UnitTest",
         "orig_input_data": "t1-freesurfer",
         "glm_type": "group_comparison",
         "contrast": "group",
-        # Optional parameters
         "covariates": ["age", "sex"],
     }
     pipeline = StatisticsSurface(
-        caps_directory=fspath(caps_dir),
-        tsv_file=fspath(tsv),
-        base_dir=fspath(working_dir),
+        caps_directory=caps_dir,
+        tsv_file=tsv,
+        base_dir=working_dir,
         parameters=parameters,
     )
     pipeline.build()
     pipeline.run(plugin="MultiProc", plugin_args={"n_procs": 1}, bypass_check=True)
 
     # Check files
-    for contrast in ["AD-lt-CN", "CN-lt-AD"]:
+    for contrast in ("AD-lt-CN", "CN-lt-AD"):
         for suffix, struct in zip(
             ["coefficients", "uncorrectedPValue", "FDR", "correctedPValue"],
             ["coef", "uncorrectedpvaluesstruct", "FDR", "correctedpvaluesstruct"],
@@ -121,15 +115,17 @@ def run_statistics_surface(
                 / filename
             )
             ref_file = ref_dir / filename
-            out_file_mat = loadmat(fspath(out_file))[struct]
-            ref_file_mat = loadmat(fspath(ref_file))[struct]
+            out_file_mat = loadmat(out_file)[struct]
+            ref_file_mat = loadmat(ref_file)[struct]
             if suffix in ["coefficients", "FDR"]:
                 assert np.allclose(
                     out_file_mat, ref_file_mat, rtol=1e-8, equal_nan=True
                 )
             else:
-                length = 4 if suffix == "correctedPValue" else 3
-                for i in range(length):
+                keys_to_compare = ["P", "mask", "thresh"]
+                if suffix == "correctedPValue":
+                    keys_to_compare.append("C")
+                for i in keys_to_compare:
                     assert np.allclose(
                         out_file_mat[0][0][i],
                         ref_file_mat[0][0][i],
diff --git a/test/unittests/pipelines/statistics_surface/test_inputs.py b/test/unittests/pipelines/statistics_surface/test_inputs.py
index 02b204c85c..3807f412c5 100644
--- a/test/unittests/pipelines/statistics_surface/test_inputs.py
+++ b/test/unittests/pipelines/statistics_surface/test_inputs.py
@@ -8,17 +8,21 @@
 
 
 def test_read_and_check_tsv_file_filenotfound_error(tmpdir):
-    from clinica.pipelines.statistics_surface._inputs import _read_and_check_tsv_file
+    from clinica.pipelines.statistics_surface.surfstat._utils import (
+        read_and_check_tsv_file,
+    )
 
     with pytest.raises(FileNotFoundError, match="File foo.tsv does not exist"):
-        _read_and_check_tsv_file(Path("foo.tsv"))
+        read_and_check_tsv_file(Path("foo.tsv"))
 
 
 @pytest.mark.parametrize(
     "columns", [["foo"], ["foo", "bar"], ["participant_id", "bar"]]
 )
 def test_read_and_check_tsv_file_data_errors(tmpdir, columns):
-    from clinica.pipelines.statistics_surface._inputs import _read_and_check_tsv_file
+    from clinica.pipelines.statistics_surface.surfstat._utils import (
+        read_and_check_tsv_file,
+    )
 
     df = pd.DataFrame(columns=columns)
     df.to_csv(tmpdir / "foo.tsv", sep="\t", index=False)
@@ -26,12 +30,14 @@ def test_read_and_check_tsv_file_data_errors(tmpdir, columns):
         ValueError,
         match=r"The TSV data should have at least two columns: participant_id and session_id",
     ):
-        _read_and_check_tsv_file(tmpdir / "foo.tsv")
+        read_and_check_tsv_file(tmpdir / "foo.tsv")
 
 
 def test_read_and_check_tsv_file():
-    from clinica.pipelines.statistics_surface._inputs import _read_and_check_tsv_file
+    from clinica.pipelines.statistics_surface.surfstat._utils import (
+        read_and_check_tsv_file,
+    )
 
-    df = _read_and_check_tsv_file(Path(CURRENT_DIR) / "data/subjects.tsv")
+    df = read_and_check_tsv_file(Path(CURRENT_DIR) / "data/subjects.tsv")
     assert len(df) == 7
     assert set(df.columns) == {"group", "age", "sex"}
diff --git a/test/unittests/pipelines/statistics_surface/test_model.py b/test/unittests/pipelines/statistics_surface/test_model.py
index 57de384e3c..b262d890ad 100644
--- a/test/unittests/pipelines/statistics_surface/test_model.py
+++ b/test/unittests/pipelines/statistics_surface/test_model.py
@@ -7,6 +7,14 @@
 from brainstat.stats.terms import FixedEffect
 from numpy.testing import assert_array_almost_equal, assert_array_equal
 
+from clinica.pipelines.statistics_surface.surfstat.models._correlation import (
+    CorrelationGLM,
+)
+from clinica.pipelines.statistics_surface.surfstat.models._group import (
+    GroupGLM,
+    GroupGLMWithInteraction,
+)
+
 CURRENT_DIR = os.path.dirname(os.path.realpath(__file__))
 
 
@@ -16,7 +24,9 @@ def df():
 
 
 def test_missing_column_error(df):
-    from clinica.pipelines.statistics_surface._model import _check_column_in_df
+    from clinica.pipelines.statistics_surface.surfstat.models._utils import (
+        check_column_in_df,
+    )
 
     with pytest.raises(
         ValueError,
@@ -25,18 +35,22 @@ def test_missing_column_error(df):
             "provided TSV file. Please make sure that there is no typo"
         ),
     ):
-        _check_column_in_df(df, "foo")
+        check_column_in_df(df, "foo")
 
 
 def test_is_categorical(df):
-    from clinica.pipelines.statistics_surface._model import _categorical_column
+    from clinica.pipelines.statistics_surface.surfstat.models._utils import (
+        is_categorical,
+    )
 
-    assert _categorical_column(df, "sex")
-    assert not _categorical_column(df, "age")
+    assert is_categorical(df, "sex")
+    assert not is_categorical(df, "age")
 
 
 def test_build_model_term_error(df):
-    from clinica.pipelines.statistics_surface._model import _build_model_term
+    from clinica.pipelines.statistics_surface.surfstat.models._utils import (
+        _build_model_term,
+    )
 
     assert isinstance(_build_model_term("sex", df), FixedEffect)
 
@@ -47,9 +61,9 @@ def test_build_model_intercept(design, df):
     Especially, the fact that adding explicitly the intercept doesn't change the results.
     Test also that spaces in the design expression have no effect.
     """
-    from clinica.pipelines.statistics_surface._model import _build_model
+    from clinica.pipelines.statistics_surface.surfstat.models._utils import build_model
 
-    model = _build_model(design, df)
+    model = build_model(design, df)
     assert isinstance(model, FixedEffect)
     assert len(model.m.columns) == 2
     assert_array_equal(model.intercept, np.array([1, 1, 1, 1, 1, 1, 1]))
@@ -57,16 +71,16 @@ def test_build_model_intercept(design, df):
 
 
 def test_build_model(df):
-    from clinica.pipelines.statistics_surface._model import _build_model
+    from clinica.pipelines.statistics_surface.surfstat.models._utils import build_model
 
-    model = _build_model("1 + age + sex", df)
+    model = build_model("1 + age + sex", df)
     assert isinstance(model, FixedEffect)
     assert len(model.m.columns) == 4
     assert_array_equal(model.intercept, np.array([1, 1, 1, 1, 1, 1, 1]))
     assert_array_equal(model.age, np.array([78.0, 73.4, 70.8, 82.3, 60.6, 72.1, 74.2]))
     assert_array_equal(model.sex_Female, np.array([1, 0, 1, 1, 1, 0, 1]))
     assert_array_equal(model.sex_Male, np.array([0, 1, 0, 0, 0, 1, 0]))
-    model = _build_model("1 + age + sex + age * sex", df)
+    model = build_model("1 + age + sex + age * sex", df)
     assert isinstance(model, FixedEffect)
     assert len(model.m.columns) == 6
     assert_array_equal(model.intercept, np.array([1, 1, 1, 1, 1, 1, 1]))
@@ -82,6 +96,22 @@ def test_build_model(df):
     )
 
 
+def test_base_glm_instantiation_error(df):
+    """Test that the base abstract GLM class cannot be instantiated."""
+    from clinica.pipelines.statistics_surface.surfstat.models._base import GLM
+
+    with pytest.raises(NotImplementedError):
+        GLM("1 + age", df, "feature_label", "age")
+
+
+@pytest.mark.parametrize(
+    "model,contrast",
+    [
+        (CorrelationGLM, "age"),
+        (GroupGLM, "sex"),
+        (GroupGLMWithInteraction, "age * sex"),
+    ],
+)
 @pytest.mark.parametrize(
     "parameters",
     [
@@ -94,51 +124,48 @@ def test_build_model(df):
         },
     ],
 )
-def test_glm_instantiation(df, parameters):
-    from clinica.pipelines.statistics_surface._model import GLM
+def test_common_parameters_glm_instantiation(df, model, contrast, parameters):
+    model_instance = model("1 + age", df, "feature_label", contrast, "group")
 
-    model = GLM("1 + age", df, "feature_label", "age")
-    assert not model._two_tailed
-    assert model._correction == ["fdr", "rft"]
-    assert model.feature_label == "feature_label"
-    assert model.fwhm == 20
-    assert model.threshold_uncorrected_pvalue == 0.001
-    assert model.threshold_corrected_pvalue == 0.05
-    assert model.cluster_threshold == 0.001
-    assert model.contrasts == dict()
-    assert model.filenames == dict()
-    assert model.contrast_names == list()
-    assert isinstance(model.model, FixedEffect)
+    assert not model_instance._two_tailed
+    assert model_instance._correction == ["fdr", "rft"]
+    assert model_instance.feature_label == "feature_label"
+    assert model_instance.fwhm == 20
+    assert model_instance.threshold_uncorrected_pvalue == 0.001
+    assert model_instance.threshold_corrected_pvalue == 0.05
+    assert model_instance.cluster_threshold == 0.001
+    assert model_instance.filenames == dict()
+    assert isinstance(model_instance.model, FixedEffect)
 
 
 @pytest.mark.parametrize("contrast", ["age", "-age"])
 def test_correlation_glm_instantiation(df, contrast):
-    from clinica.pipelines.statistics_surface._model import CorrelationGLM
+    from clinica.pipelines.statistics_surface.surfstat.models._contrast import (
+        CorrelationContrast,
+    )
 
-    model = CorrelationGLM("1 + age", df, "feature_label", contrast, "group_label")
+    model = CorrelationGLM("1 + age", df, "feature_label", contrast, "group")
     assert not model.with_interaction
-    assert model.group_label == "group_label"
+    assert model.group_label == "group"
     assert model.feature_label == "feature_label"
     assert model.fwhm == 20
     sign = "positive" if contrast == "age" else "negative"
-    assert model.contrast_sign == sign
-    assert model.absolute_contrast_name == "age"
-    assert isinstance(model.contrasts, dict)
     assert len(model.contrasts) == 1
+    assert isinstance(model.contrasts[0], CorrelationContrast)
+    assert model.contrasts[0].sign == sign
+    assert model.contrasts[0].name == contrast
     mult = 1 if sign == "positive" else -1
     assert_array_equal(
-        model.contrasts[contrast].values,
+        model.contrasts[0].built_contrast.values,
         mult * np.array([78.0, 73.4, 70.8, 82.3, 60.6, 72.1, 74.2]),
     )
     with pytest.raises(ValueError, match="Unknown contrast foo"):
-        model.filename_root("foo")
-    expected = f"group-group_label_correlation-age-{sign}_measure-feature_label_fwhm-20"
-    assert model.filename_root(contrast) == expected
+        model.get_output_filename("foo")
+    expected = f"group-group_correlation-age-{sign}_measure-feature_label_fwhm-20"
+    assert model.get_output_filename(contrast) == expected
 
 
 def test_group_glm_instantiation(df):
-    from clinica.pipelines.statistics_surface._model import GroupGLM
-
     with pytest.raises(
         ValueError,
         match="Contrast should refer to a categorical variable for group comparison.",
@@ -148,24 +175,22 @@ def test_group_glm_instantiation(df):
     assert not model.with_interaction
     assert model.group_label == "group_label"
     assert model.fwhm == 20
-    assert isinstance(model.contrasts, dict)
+    assert isinstance(model.contrasts, list)
     contrast_names = ["Female-lt-Male", "Male-lt-Female"]
-    assert set(model.contrasts.keys()) == set(contrast_names)
+    assert set(model.contrast_names) == set(contrast_names)
     for contrast_name, sign in zip(contrast_names, [-1, 1]):
         assert_array_equal(
-            model.contrasts[contrast_name].values,
+            model.get_contrast_by_name(contrast_name).built_contrast,
             sign * np.array([1, -1, 1, 1, 1, -1, 1]),
         )
     with pytest.raises(ValueError, match="Unknown contrast foo"):
-        model.filename_root("foo")
+        model.get_output_filename("foo")
     for contrast_name in contrast_names:
         expected = f"group-group_label_{contrast_name}_measure-feature_label_fwhm-20"
-        assert model.filename_root(contrast_name) == expected
+        assert model.get_output_filename(contrast_name) == expected
 
 
 def test_group_glm_with_interaction_instantiation(df):
-    from clinica.pipelines.statistics_surface._model import GroupGLMWithInteraction
-
     with pytest.raises(
         ValueError,
         match=(
@@ -173,34 +198,29 @@ def test_group_glm_with_interaction_instantiation(df):
             "variable and one categorical variable."
         ),
     ):
-        GroupGLMWithInteraction("1 + age", df, "feature_label", "age", "group_label")
+        GroupGLMWithInteraction("1 + age", df, "feature_label", "age", "group")
     model = GroupGLMWithInteraction(
-        "1 + age", df, "feature_label", "age * sex", "group_label"
+        "1 + age", df, "feature_label", "age * sex", "group"
     )
     assert model.with_interaction
-    assert model.group_label == "group_label"
+    assert model.group_label == "group"
     assert model.fwhm == 20
-    assert isinstance(model.contrasts, dict)
+    assert isinstance(model.contrasts, list)
     assert len(model.contrasts) == 1
     assert_array_equal(
-        model.contrasts["age * sex"].values,
+        model.get_contrast_by_name("age * sex").built_contrast,
         np.array([78.0, -73.4, 70.8, 82.3, 60.6, -72.1, 74.2]),
     )
     with pytest.raises(ValueError, match="Unknown contrast foo"):
-        model.filename_root("foo")
+        model.get_output_filename("foo")
     assert (
-        model.filename_root("age * sex")
+        model.get_output_filename("age * sex")
         == "interaction-age * sex_measure-feature_label_fwhm-20"
     )
 
 
 def test_create_glm_model(df):
-    from clinica.pipelines.statistics_surface._model import (
-        CorrelationGLM,
-        GroupGLM,
-        GroupGLMWithInteraction,
-        create_glm_model,
-    )
+    from clinica.pipelines.statistics_surface.surfstat.models import create_glm_model
 
     model = create_glm_model(
         "correlation", "age", df, "age", feature_label="feature_label"
@@ -227,7 +247,9 @@ def test_create_glm_model(df):
 
 
 def test_p_value_results():
-    from clinica.pipelines.statistics_surface._model import PValueResults
+    from clinica.pipelines.statistics_surface.surfstat.models.results._statistics import (
+        PValueResults,
+    )
 
     pvalues = np.random.random((5, 10))
     threshold = 0.3
@@ -248,29 +270,34 @@ def test_statistics_results_serializer(tmp_path):
 
     from scipy.io import loadmat
 
-    from clinica.pipelines.statistics_surface._model import (
-        CorrectedPValueResults,
-        PValueResults,
+    from clinica.pipelines.statistics_surface.surfstat.models.results import (
         StatisticsResults,
         StatisticsResultsSerializer,
     )
+    from clinica.pipelines.statistics_surface.surfstat.models.results._statistics import (
+        CorrectedPValueResults,
+        PValueResults,
+    )
 
     dummy_input = np.empty([3, 6])
     uncorrected = PValueResults(*[dummy_input] * 2, 0.1)
     corrected = CorrectedPValueResults(*[dummy_input] * 3, 0.2)
     results = StatisticsResults(*[dummy_input] * 2, uncorrected, dummy_input, corrected)
-    serializer = StatisticsResultsSerializer(str(tmp_path / Path("out/dummy")))
-    assert serializer.output_file == str(tmp_path / Path("out/dummy"))
+
+    out_file = tmp_path / "out" / "dummy"
+    serializer = StatisticsResultsSerializer(out_file)
+    assert serializer.output_file == out_file
     assert serializer.json_extension == "_results.json"
     assert serializer.json_indent == 4
     assert serializer.mat_extension == ".mat"
+
     with pytest.raises(
         NotImplementedError, match="Serializing method foo is not implemented."
     ):
         serializer.save(results, "foo")
     serializer.save(results, "json")
-    assert os.path.exists(tmp_path / Path("out/dummy_results.json"))
-    with open(tmp_path / Path("out/dummy_results.json"), "r") as fp:
+    assert (tmp_path / "out" / "dummy_results.json").exists()
+    with open(tmp_path / "out" / "dummy_results.json", "r") as fp:
         serialized = json.load(fp)
     serializer.save(results, "mat")
     names = [
@@ -288,9 +315,9 @@ def test_statistics_results_serializer(tmp_path):
         "FDR",
     ]
     for name, key in zip(names, keys):
-        assert os.path.exists(tmp_path / Path(f"out/dummy_{name}.mat"))
-        mat = loadmat(tmp_path / Path(f"out/dummy_{name}.mat"))
-        if key in ["uncorrectedpvaluesstruct", "correctedpvaluesstruct"]:
+        assert (tmp_path / "out" / f"dummy_{name}.mat").exists()
+        mat = loadmat(tmp_path / "out" / f"dummy_{name}.mat")
+        if key in ("uncorrectedpvaluesstruct", "correctedpvaluesstruct"):
             assert_array_almost_equal(mat[key]["P"][0, 0], dummy_input)
             assert_array_almost_equal(mat[key]["mask"][0, 0], dummy_input)
         else: