"""
==================================
Visualize the hemodynamic response
==================================

In this example, we describe how the hemodynamic response is estimated in the
previous model. We fit the same ridge model as in the previous example, and
further describe the need to delay the features in time.

As explained in the previous example, the BOLD signal recorded in fMRI
experiments is delayed in time with respect to the stimulus. With different
delayed versions of the features, the linear regression model can assign a
different weight to each delay, to maximize the predictions. With a sample
every 2 seconds, we typically use 4 delays [1, 2, 3, 4] (i.e. 2 to 8 seconds)
to cover most of the hemodynamic response peak.

In this example, we show the decrease in prediction performance when using no
delays. We also show how to visualize the estimated hemodynamic response
function (HRF) using more delays.
"""
# sphinx_gallery_thumbnail_number = 2
###############################################################################
# Path of the data directory
import os
from voxelwise_tutorials.io import get_data_home
directory = os.path.join(get_data_home(), "vim-4")
print(directory)

###############################################################################

# modify to use another subject
subject = "S01"

###############################################################################
# Load the data
# -------------
#
# We first load the fMRI responses.
import numpy as np
from voxelwise_tutorials.io import load_hdf5_array

file_name = os.path.join(directory, "responses", f"{subject}_responses.hdf")
Y_train = load_hdf5_array(file_name, key="Y_train")
Y_test = load_hdf5_array(file_name, key="Y_test")

print("(n_samples_train, n_voxels) =", Y_train.shape)
print("(n_repeats, n_samples_test, n_voxels) =", Y_test.shape)

###############################################################################
# We average the test repeats, to remove the non-repeatable part of fMRI
# responses.
Y_test = Y_test.mean(0)

print("(n_samples_test, n_voxels) =", Y_test.shape)

###############################################################################
# We fill potential NaN (not-a-number) values with zeros.
Y_train = np.nan_to_num(Y_train)
Y_test = np.nan_to_num(Y_test)

###############################################################################
# Then, we load the semantic "wordnet" features.
feature_space = "wordnet"

file_name = os.path.join(directory, "features", f"{feature_space}.hdf")
X_train = load_hdf5_array(file_name, key="X_train")
X_test = load_hdf5_array(file_name, key="X_test")

print("(n_samples_train, n_features) =", X_train.shape)
print("(n_samples_test, n_features) =", X_test.shape)

###############################################################################
# Define the cross-validation scheme
# ----------------------------------
#
# We define the same leave-one-run-out cross-validation split as in the
# previous example.

from sklearn.model_selection import check_cv
from voxelwise_tutorials.utils import generate_leave_one_run_out

# index of the first sample of each run
run_onsets = load_hdf5_array(file_name, key="run_onsets")
print(run_onsets)

###############################################################################
# We define a cross-validation splitter, compatible with the ``scikit-learn``
# API.
n_samples_train = X_train.shape[0]
cv = generate_leave_one_run_out(n_samples_train, run_onsets)
cv = check_cv(cv)  # copy the cross-validation splitter into a reusable list
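
###############################################################################
# As a quick sanity check, we can count the number of cross-validation splits,
# which should match the number of runs listed in ``run_onsets``.
print("number of runs =", len(run_onsets))
print("number of cross-validation splits =", cv.get_n_splits())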

###############################################################################
# Define the model
# ----------------
#
# We define the same model as in the previous example. See the previous
# example for more details about the model definition.

from sklearn.pipeline import make_pipeline
from sklearn.preprocessing import StandardScaler
from voxelwise_tutorials.delayer import Delayer
from himalaya.kernel_ridge import KernelRidgeCV
from himalaya.backend import set_backend
backend = set_backend("torch_cuda", on_error="warn")

X_train = X_train.astype("float32")
X_test = X_test.astype("float32")

alphas = np.logspace(1, 20, 20)

pipeline = make_pipeline(
    StandardScaler(with_mean=True, with_std=False),
    Delayer(delays=[1, 2, 3, 4]),
    KernelRidgeCV(
        alphas=alphas, cv=cv,
        solver_params=dict(n_targets_batch=500, n_alphas_batch=5,
                           n_targets_batch_refit=100)),
)

###############################################################################
from sklearn import set_config
set_config(display='diagram')
pipeline
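
###############################################################################
# To make the role of the ``Delayer`` more concrete, here is a minimal sketch
# on a toy array with a single feature: each delay adds a shifted copy of the
# feature as a new column, so the regression can weight the stimulus at
# several lags. (The exact padding of the first samples is an assumption of
# this sketch; see the ``Delayer`` docstring for details.)
toy_feature = np.arange(8, dtype="float32").reshape(-1, 1)
toy_delayed = Delayer(delays=[0, 1, 2]).fit_transform(toy_feature)
print("(n_samples, n_features * n_delays) =", toy_delayed.shape)
print(toy_delayed)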

###############################################################################
# Fit the model
# -------------
#
# We fit on the train set, and score on the test set.

pipeline.fit(X_train, Y_train)

scores = pipeline.score(X_test, Y_test)
scores = backend.to_numpy(scores)
print("(n_voxels,) =", scores.shape)

###############################################################################
# Compare with a model without delays
# -----------------------------------
#
# We define here another model without feature delays (i.e. no ``Delayer``).
# Because the BOLD signal is inherently slow due to the dynamics of
# neuro-vascular coupling, this model is unlikely to perform well.

pipeline_nodelay = make_pipeline(
    StandardScaler(with_mean=True, with_std=False),
    KernelRidgeCV(
        alphas=alphas, cv=cv,
        solver_params=dict(n_targets_batch=500, n_alphas_batch=5,
                           n_targets_batch_refit=100)),
)
pipeline_nodelay

###############################################################################
# We fit and score this model in the same way as the previous one.
pipeline_nodelay.fit(X_train, Y_train)
scores_nodelay = pipeline_nodelay.score(X_test, Y_test)
scores_nodelay = backend.to_numpy(scores_nodelay)
print("(n_voxels,) =", scores_nodelay.shape)

###############################################################################
# Then, we compare the performances of the two models with a 2D histogram.
# All ~70k voxels are represented in this histogram, where the diagonal
# corresponds to identical performance for both models. A distribution
# deviating from the diagonal means that one model has better predictive
# performance than the other.
import matplotlib.pyplot as plt
from voxelwise_tutorials.viz import plot_hist2d

ax = plot_hist2d(scores_nodelay, scores)
ax.set(
    title='Generalization R2 scores',
    xlabel='model without delays',
    ylabel='model with delays',
)
plt.show()

###############################################################################
# We see that the model with delays performs much better than the model
# without delays. This can be seen in voxels with scores above 0. The
# distribution of scores below zero is not very informative, since it
# corresponds to voxels with poor predictive performance anyway, and it only
# shows which model is overfitting the most.
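
###############################################################################
# The same comparison can be summarized with a simple count of voxels that are
# better predicted by the model with delays.
n_better = np.sum(scores > scores_nodelay)
print(f"{n_better} voxels (out of {scores.size}) are better predicted with delays.")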

###############################################################################
# Visualize the HRF
# -----------------
#
# We just saw that delays are necessary to model BOLD responses. Here we show
# how the fitted ridge regression weights follow the hemodynamic response
# function (HRF).
#
# Fitting a kernel ridge regression results in a set of coefficients called
# the "dual" coefficients :math:`w`. These coefficients differ from the
# "primal" coefficients :math:`\beta` obtained with a ridge regression, but
# the primal coefficients can be computed from the dual coefficients using the
# training features :math:`X`:
#
# .. math::
#
#     \beta = X^\top w
#
# To better visualize the HRF, we will refit a model with more delays, but
# only on a selection of voxels to speed up the computations.

# pick the 10 best voxels
voxel_selection = np.argsort(scores)[-10:]

# define a pipeline with more delays
pipeline_many_delays = make_pipeline(
    StandardScaler(with_mean=True, with_std=False),
    Delayer(delays=[0, 1, 2, 3, 4, 5, 6]),
    KernelRidgeCV(
        alphas=alphas, cv=cv,
        solver_params=dict(n_targets_batch=500, n_alphas_batch=5,
                           n_targets_batch_refit=100)),
)

pipeline_many_delays.fit(X_train, Y_train[:, voxel_selection])

# get the (primal) ridge regression coefficients
primal_coef = pipeline_many_delays[-1].get_primal_coef()
primal_coef = backend.to_numpy(primal_coef)
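
# As a sketch of the equation above (assuming the default linear kernel of
# KernelRidgeCV and its fitted ``dual_coef_`` attribute), the primal
# coefficients can also be recovered manually from the dual coefficients and
# the centered, delayed training features.
X_fit = pipeline_many_delays[:-1].transform(X_train)
dual_coef = backend.to_numpy(pipeline_many_delays[-1].dual_coef_)
primal_coef_manual = X_fit.T @ dual_coef  # should match get_primal_coef()
print("(n_features * n_delays, n_voxels) =", primal_coef_manual.shape)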

# get the delays
delays = pipeline_many_delays.named_steps['delayer'].delays
# split the ridge coefficients per delay
primal_coef_per_delay = np.stack(np.split(primal_coef, len(delays), axis=0))

# select the feature with the largest coefficients for each voxel
feature_selection = np.argmax(np.sum(np.abs(primal_coef_per_delay), axis=0),
                              axis=0)
# keep only the selected feature for each voxel
primal_coef_selection = primal_coef_per_delay[:, feature_selection,
                                              np.arange(len(voxel_selection))]

plt.plot(delays, primal_coef_selection)
plt.xlabel('Delays')
plt.xticks(delays)
plt.ylabel('Ridge coefficients')
plt.title(f'Largest feature for the {len(voxel_selection)} best voxels')
plt.axhline(0, color='k', linewidth=0.5)
plt.show()

###############################################################################
# We see that the hemodynamic response function (HRF) is captured in the model
# weights. Note that in this dataset, the brain responses are recorded every
# two seconds.