# Import necessary python modules
from glob import glob
import nibabel as nib
import numpy as np
from nilearn.plotting import plot_stat_map
from scipy.stats import zscore
import matplotlib.pyplot as plt
import seaborn as sns
import brainiak.funcalign.srm
from brainiak.fcma.util import compute_correlation


# Download and extract example data from Zenodo.
# The leading `!` hands each line to the system shell (IPython/Jupyter
# syntax), so `wget`, `tar`, and `rm` must be available on the host.
# NOTE: the archive is large (about 9.2 GB; the recorded download below
# took roughly 13 minutes), so make sure enough disk space is available.
!wget https://zenodo.org/record/4300825/files/brainiak-aperture-srm-data.tgz
# Unpack the archive; later cells read files from `brainiak-aperture-srm-data/`
!tar -xzf brainiak-aperture-srm-data.tgz
# Remove the archive once it has been extracted
!rm brainiak-aperture-srm-data.tgz

--2020-12-07 02:06:15--  https://zenodo.org/record/4300825/files/brainiak-aperture-srm-data.tgz
Resolving zenodo.org (zenodo.org)... 137.138.76.77
Connecting to zenodo.org (zenodo.org)|137.138.76.77|:443... connected.
HTTP request sent, awaiting response... 200 OK
Length: 9927319659 (9.2G) [application/octet-stream]
Saving to: ‘brainiak-aperture-srm-data.tgz’

brainiak-aperture-s 100%[===================>]   9.25G  4.37MB/s    in 13m 37s 

2020-12-07 02:20:30 (11.6 MB/s) - ‘brainiak-aperture-srm-data.tgz’ saved [9927319659/9927319659]


# Locate the example data: the atlas used to define the region of interest
# (ROI) and the functional runs matched by the glob pattern below
atlas_fn = 'brainiak-aperture-srm-data/Schaefer2018_400Parcels_17Networks_order_FSLMNI152_2.5mm.nii.gz'
data_fns = glob('brainiak-aperture-srm-data/sub-*_task-black_*bold.nii.gz')
data_fns.sort()  # glob order is arbitrary; sort for a stable file order

# Read the Schaefer 400-parcel atlas, keeping both the image object and its
# array of per-voxel parcel labels
atlas_nii = nib.load(atlas_fn)
atlas_img = atlas_nii.get_fdata()

# Atlas labels of the parcels that make up the left temporal parietal ROI
parcel_labels = list(range(195, 201))


# Load in functional data and mask with "temporal parietal" ROI.
# The boolean mask of each parcel depends only on the atlas, so build the
# masks once instead of once per functional file.
parcel_masks = [atlas_img == parcel for parcel in parcel_labels]

data = []
for data_fn in data_fns:
    voxel_data = nib.load(data_fn).get_fdata()

    # Pull out the voxels of each parcel (brain area) and transpose so the
    # voxels become columns
    parcel_columns = [voxel_data[mask, :].T for mask in parcel_masks]

    # Take the union of all parcels comprising the full ROI by placing
    # their columns side by side
    data.append(np.column_stack(parcel_columns))


# Visualize the left temporal parietal ROI
sns.set(palette='colorblind')

# Binary mask volume: 1 in every voxel labelled with an ROI parcel, 0 elsewhere
roi_img = np.isin(atlas_img, parcel_labels).astype(float)

# Wrap the mask as a NIfTI image (reusing the atlas affine and header) for
# visualization with Nilearn
roi_nii = nib.Nifti1Image(roi_img, atlas_nii.affine, atlas_nii.header)

# Plot the left temporal parietal ROI
plot_stat_map(roi_nii, cmap='tab10_r', cut_coords=(-53, -46, 10),
              colorbar=False, title='left temporal parietal ROI')
plt.show()

# Print short "figure caption" describing visualization
print('The left "temporal parietal" ROI comprises auditory '
      "association\ncortex extending from anterior superior "
      "temporal cortex to the\ntemporoparietal junction.")

The left "temporal parietal" ROI comprises auditory association
cortex extending from anterior superior temporal cortex to the
temporoparietal junction.


# Get the number of subjects and TRs
n_subjects = len(data)
n_trs = data[0].shape[0]

# Set a train/test split ratio (fraction of TRs held out for testing)
train_test_ratio = .5
test_size = int(n_trs * train_test_ratio)

# Split/compile data into training and test halves
train_data = []
test_data = []
for subject_data in data:

    # Index of the first test TR. An explicit boundary is used instead of
    # the negative offsets `[:-test_size]` / `[-test_size:]` because those
    # silently swap meaning when test_size is 0 (`x[:-0]` is empty and
    # `x[-0:]` is the whole array).
    split_tr = subject_data.shape[0] - test_size

    # Take the first chunk of TRs as training; z-score each voxel over
    # time and transpose to (voxels x TRs)
    train_data.append(zscore(subject_data[:split_tr, :], axis=0).T)

    # Take the remaining TRs as testing, z-scored separately from training
    test_data.append(zscore(subject_data[split_tr:, :], axis=0).T)


# Dimensionality of the shared space and number of fitting iterations
features = 50
n_iter = 10

# Create an SRM object
srm = brainiak.funcalign.srm.SRM(features=features, n_iter=n_iter)

# Fit the SRM to the training data
print('Fitting SRM')
srm.fit(train_data)
print('SRM has been fit')

# Report the dimensions of the estimated shared response
n_shared_features, n_shared_trs = srm.s_.shape
print(f'Share response shape: {n_shared_features} '
      f'Features x {n_shared_trs} Time-points')

Fitting SRM
SRM has been fit
Share response shape: 50 Features x 275 Time-points


# Use the first subject as an example
subject = 0

# Gram matrix W.T @ W of this subject's weight matrix W; it equals the
# identity matrix exactly when the columns of W are orthonormal
subject_w = srm.w_[subject]
gram = subject_w.T.dot(subject_w)

# Display the Gram matrix as an image
sns.set_style('white')
fig, ax = plt.subplots(1)
gram_img = ax.matshow(gram)
ax.set_title(f'Weight matrix orthogonality for subject {subject}', pad=10)
ax.set_xlabel('SRM features')
ax.set_ylabel('SRM features')
ax.tick_params(length=0)
cbar = fig.colorbar(gram_img, ax=ax, ticks=[0, 1])
cbar.ax.tick_params(length=0)
plt.show()

n_voxels, n_weight_features = subject_w.shape
print(f'Weight matrix shape: {n_voxels} '
      f'Voxels x {n_weight_features} Features\n')

# Check against identity matrix (within floating-point tolerance)
is_orthogonal = np.allclose(np.identity(features), gram)
if not is_orthogonal:
    print("Weight matrix is not orthogonal.")
else:
    print("This test confirms that the weight matrix for "
          f"subject {subject} is orthogonal.")

Weight matrix shape: 935 Voxels x 50 Features

This test confirms that the weight matrix for subject 0 is orthogonal.


# Project each subject's held-out test data into the shared space with the
# fitted SRM, then z-score every shared feature along axis 1
test_shared = [zscore(shared_ts, axis=1)
               for shared_ts in srm.transform(test_data)]


def _segment_matrix(subject_data, win_size, n_segments):
    """Stack every `win_size`-long window of one subject into columns.

    Column `s` of the result holds time points `s .. s + win_size - 1` of
    `subject_data` (features x time points), one block of features per time
    point, giving shape (n_features * win_size, n_segments).
    """
    n_features = subject_data.shape[0]
    segments = np.zeros((n_features * win_size, n_segments), order='f')
    for w in range(win_size):
        segments[w * n_features:(w + 1) * n_features, :] = \
            subject_data[:, w:(w + n_segments)]
    return segments


def time_segment_classification(data, win_size=10):
    """Between-subject time-segment classification (leave-one-subject-out).

    Every run of `win_size` consecutive time points is a "segment". For each
    left-out subject, each of its segments is correlated with all segments
    of the summed data of the remaining subjects; the segment is classified
    correctly when the best-matching segment is the one at the same time
    index. Segments that overlap the tested segment in time are excluded
    as candidates. Progress and per-subject accuracies are printed.

    Parameters
    ----------
    data : list of ndarray
        One array per subject, each shaped (n_features, n_trs). All
        subjects must share the same shape.
    win_size : int, default 10
        Number of time points per segment.

    Returns
    -------
    accuracy : ndarray, shape (n_subjects,)
        Fraction of correctly classified segments for each subject.
    chance : float
        Rough chance level: one over the number of candidate segments left
        for the middle segment after excluding overlapping ones.

    Raises
    ------
    ValueError
        If `win_size` is smaller than 1 or larger than the number of time
        points.
    """
    n_subjects = len(data)
    (n_features, n_trs) = data[0].shape
    if not 1 <= win_size <= n_trs:
        raise ValueError(
            "win_size must be between 1 and the number of time points "
            f"({n_trs}), got {win_size}")
    accuracy = np.zeros(shape=n_subjects)
    n_segments = n_trs - win_size + 1

    # Sum the segment matrices of all subjects. The left-out subject is
    # subtracted again inside the loop below, leaving the other subjects.
    train_data = np.zeros((n_features * win_size, n_segments), order='f')
    for subject_data in data:
        train_data += _segment_matrix(subject_data, win_size, n_segments)

    # Candidate segments that overlap the tested segment in time (without
    # being that segment itself) must not count as matches. The mask only
    # depends on the segment indices, so build it once for all subjects.
    segment_idx = np.arange(n_segments)
    lag = np.abs(segment_idx[:, np.newaxis] - segment_idx)
    overlapping = (lag > 0) & (lag < win_size)

    # Analyze each subject (leave-one-out)
    print("Between-subject time-segment classification accuracy "
          "for each subject:", end=' ')
    for test_subject in range(n_subjects):
        test_data = _segment_matrix(data[test_subject], win_size, n_segments)

        # z-score each segment (column); constant columns yield NaN, which
        # is replaced by 0
        others = np.nan_to_num(zscore((train_data - test_data), axis=0))
        held_out = np.nan_to_num(zscore(test_data, axis=0))

        # Correlation of every held-out segment (rows) with every segment
        # of the remaining subjects (columns)
        correlations = compute_correlation(held_out.T, others.T)

        # Exclude segments overlapping with the testing segment
        correlations[overlapping] = -np.inf

        # A segment is correct when its best match sits at the same index
        max_idx = np.argmax(correlations, axis=1)
        accuracy[test_subject] = np.mean(max_idx == segment_idx)

        # Print accuracy for each subject as we go
        print(f"{accuracy[test_subject]:.3f}",
              end=', ', flush=True)

    # Get a rough estimate of chance (accounting for excluded segments).
    # Use the middle *segment*: indexing with n_trs // 2 can run past the
    # last of the n_segments rows when win_size is large.
    chance = 1 / np.sum(~overlapping[n_segments // 2])

    print("\nThe average accuracy among all subjects is "
          f"{np.mean(accuracy):.3f} +/- {np.std(accuracy):.3f}")
    return accuracy, chance


# Baseline: time-segment classification on the anatomically-aligned
# (voxel-space) test data, using segments of `win_size` time points
win_size = 10
acc_anat_test, chance = time_segment_classification(
    test_data, win_size=win_size)

Between-subject time-segment classification accuracy for each subject: 0.094, 0.173, 0.090, 0.004, 0.158, 0.064, 0.064, 0.075, 0.143, 0.135, 0.132, 0.162, 0.083, 0.098, 0.053, 0.083, 0.169, 0.132, 0.030, 0.188, 0.075, 0.124, 0.083, 0.094, 0.135, 0.180, 0.195, 0.135, 0.102, 0.128, 0.109, 0.120, 0.060, 0.132, 0.041, 0.113, 0.132, 0.135, 0.165, 0.113, 
The average accuracy among all subjects is 0.113 +/- 0.044


# Same analysis on the test data projected into the SRM shared space,
# with the same segment length as the anatomical baseline
acc_shared_test, chance = time_segment_classification(
    test_shared, win_size=win_size)

Between-subject time-segment classification accuracy for each subject: 0.267, 0.462, 0.331, 0.038, 0.808, 0.188, 0.278, 0.462, 0.654, 0.876, 0.688, 0.553, 0.120, 0.327, 0.282, 0.440, 0.459, 0.312, 0.079, 0.523, 0.109, 0.583, 0.391, 0.436, 0.575, 0.511, 0.665, 0.308, 0.429, 0.320, 0.538, 0.571, 0.481, 0.372, 0.395, 0.229, 0.410, 0.451, 0.613, 0.526, 
The average accuracy among all subjects is 0.427 +/- 0.186


# Box plot for the classification results
labels = ['anatomical\nalignment', 'SRM']

plt.figure()
plt.boxplot([acc_anat_test, acc_shared_test], vert=True,
            patch_artist=True)

# Name the boxes through the x ticks (boxes are drawn at positions 1..N)
# instead of boxplot's `labels` keyword, which is deprecated since
# Matplotlib 3.9 in favor of `tick_labels`; this works on old and new versions
plt.xticks(range(1, len(labels) + 1), labels)

# Horizontal reference line at chance level.
# NOTE(review): the line is drawn dashed ('--') while the caption printed
# below calls it "dotted" -- confirm which one is intended.
plt.axhline(chance, linestyle='--', color='.4')
plt.xlabel('alignment')
plt.ylabel('classification accuracy')
plt.title('Between-subject time-segment classification')
plt.show()

# Print short "figure caption" describing the plot
print("SRM functional alignment provides a marked improvement in "
      "between-\nsubject time-segment classification over "
      "anatomical alignment.\nThe dotted line indicates chance "
      f"performance (chance = {chance:.3f})")

SRM functional alignment provides a marked improvement in between-
subject time-segment classification over anatomical alignment.
The dotted line indicates chance performance (chance = 0.004)

Shared response model

Annotated bibliography

Table of contents

Example fMRI data and atlas

Estimating the SRM

Between-subject time-segment classification

Summary

References