By Jeremy R. Manning (jeremy.r.manning@dartmouth.edu) and Paxton C. Fitzpatrick (Paxton.C.Fitzpatrick@dartmouth.edu)
In this demonstration, we'll be using the BrainIAK Python toolbox to apply Hierarchical Topographic Factor Analysis (HTFA) to an fMRI dataset.
The demo will comprise three main steps: loading an example fMRI dataset, fitting HTFA to the data, and visualizing the resulting network dynamics. For additional background on the models used here, see the following papers:
Manning JR, Ranganath R, Norman KA, Blei DM (2014). Topographic Factor Analysis: a Bayesian model for inferring brain networks from neural data. PLoS One, 9(5): e94914. Describes a single-subject model (TFA) for inferring brain network hubs and applies it to a semantic decoding dataset.
Manning JR, Zhu X, Willke TL, Ranganath R, Stachenfeld K, Hasson U, Blei DM, Norman KA (2018). A probabilistic approach to discovering dynamic full-brain functional connectivity patterns. NeuroImage, 180: 243-252. Describes a multi-subject (hierarchical) model (HTFA) for inferring shared brain network hubs and applies it to a story listening and movie viewing dataset.
Owen LLW, Chang TH, Manning JR (2020). High-level cognition during story listening is reflected in high-order dynamic correlations in neural activity patterns. bioRxiv. Describes a model for inferring network dynamics from timeseries data and applies it to HTFA fits to a story listening dataset.
The easiest way to run this notebook is to install Docker on your local machine and then build the Docker image in this folder. Building the image installs the necessary toolboxes and dependencies, and also downloads the data you'll be analyzing. Follow the instructions for your platform to download and install Docker, then start the Docker Desktop application.
Once Docker is installed and running, build the Docker image by navigating to this folder and running:
docker build --rm --force-rm -t htfa .
To start the image for the first time, run:
docker run -it -p 8888:8888 --name htfa -v $PWD:/mnt htfa
and on subsequent times, run:
docker start htfa && docker attach htfa
When the container starts, it automatically launches a Jupyter notebook server. Copy and paste the third link printed to the terminal into a browser to interact with this notebook.
To stop running the container, run:
docker stop htfa
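If you later want to rebuild the image from scratch (for example, after the code or data change), you can optionally remove the stopped container and the image first. The commands below assume the container and image names used in the steps above:
docker rm htfa
docker rmi htfa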
Run the cells below (in sequence) to load in the example dataset, fit HTFA to the data, and visualize the resulting network dynamics.
Import libraries and helper functions and load the dataset. The dataset we'll be analyzing is a subset of the story listening dataset collected by Simony et al. (2016).
# the next two lines suppress a (meaningless) warning about the graphics backend
import warnings
warnings.simplefilter('ignore')
# data science and visualization libraries
import numpy as np
import pandas as pd
import nibabel as nb
import nilearn as nl
import nltools as nlt
import timecorr as tc
import seaborn as sns
from IPython.display import HTML
# system libraries
from mpi4py import MPI
import os, sys
from glob import glob as lsdir
import pickle as pkl
# brainiak
from brainiak.factoranalysis.htfa import HTFA
# convenience functions from helpers.py
from helpers import nii2cmu, cmu2nii, animate_chord, animate_connectome, opts, opts2str, htfa2dict, dict2htfa, local_params, global_params, plot_nodes
# set to True for a faster run (~20ish minutes)
# set to False for a more accurate run (overnight on a powerful MPI-enabled multi-processor
# machine or several days on a recent single-core machine or VM)
debug_mode = True
# data (change paths if running outside of Docker)
intact = lsdir('/data/Pieman2/sub-*/func/*intact*.nii.gz')
scrambled = lsdir('/data/Pieman2/sub-*/func/*word*.nii.gz')
if debug_mode:
    intact = intact[:3]
    scrambled = scrambled[:3]
combined_fnames = intact + scrambled
First we need to convert the dataset into CMU format. Consistent with CMU format, nilearn expects data matrices with number-of-timepoints rows and number-of-voxels columns. BrainIAK expects the transpose of that format: number-of-voxels by number-of-timepoints matrices. We can easily convert between the two formats as shown below.
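For reference, the conversion performed by nii2cmu (defined in helpers.py) looks roughly like the sketch below. The exact implementation may differ, but the idea is to extract a timepoints-by-voxels data matrix ('Y') together with each voxel's scanner-space coordinates ('R'), which HTFA uses to place network nodes in the brain:
# minimal sketch of a NIfTI-to-CMU conversion (the real helper is nii2cmu in helpers.py)
import numpy as np
import nibabel as nb

def nii_to_cmu_sketch(fname):
    img = nb.load(fname)
    data = img.get_fdata()                    # x-by-y-by-z-by-time array
    mask = np.std(data, axis=3) > 0           # keep voxels with non-constant signal
    vox_ijk = np.array(np.nonzero(mask)).T    # voxel indices (n_voxels by 3)
    Y = data[mask].T                          # timepoints by voxels
    R = nb.affines.apply_affine(img.affine, vox_ijk)  # voxel coordinates in scanner space
    return {'Y': Y, 'R': R}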
After wrangling the data, we'll fit HTFA to the full dataset to identify network nodes.
# convert data (.nii or .nii.gz files) to CMU format
cmu_data = [nii2cmu(f) for f in combined_fnames]
# convert to HTFA format
htfa_data = [{'R': x['R'], 'Z': x['Y'].T} for x in cmu_data]
# configure MPI:
# - if the local environment supports MPI, do computations in parallel (fast!)
# - if MPI is not supported, do computations in serial (slower)
comm = MPI.COMM_WORLD
rank = comm.Get_rank()
size = comm.Get_size()
if rank == 0:
    import logging
    logging.basicConfig(stream=sys.stdout, level=logging.INFO)
# set up HTFA model
params = opts(debug=debug_mode)
nvoxels, ntimepoints = htfa_data[0]['Z'].shape
# API specification: https://brainiak.org/docs/brainiak.factoranalysis.html#module-brainiak.factoranalysis.htfa
htfa = HTFA(K=params['K'],
            n_subj=len(htfa_data),
            max_global_iter=params['max_global_iter'],  # decrease for speed, increase for greater accuracy (min: 1)
            max_local_iter=params['max_local_iter'],    # decrease for speed, increase for greater accuracy (min: 1)
            voxel_ratio=params['voxel_ratio'],          # decrease for speed, increase for greater accuracy (positive; max: 1.0)
            tr_ratio=params['tr_ratio'],                # decrease for speed, increase for greater accuracy (positive; max: 1.0)
            max_voxel=int(nvoxels * params['max_voxel_scale']),   # decrease for speed, increase for greater accuracy (max: number of voxels)
            max_tr=int(ntimepoints * params['max_tr_scale']),     # decrease for speed, increase for greater accuracy (max: number of TRs)
            verbose=params['verbose'])
# load or save a pickled model
savedir = os.path.join('/data', 'htfa')
if not os.path.exists(savedir):
    os.makedirs(savedir)

htfa_fname = os.path.join(savedir, 'htfa_' + opts2str(params) + '.pkl')

if not os.path.exists(htfa_fname):
    # fit HTFA to htfa_data and save the result
    htfa.fit([x['Z'] for x in htfa_data], [x['R'] for x in htfa_data])
    with open(htfa_fname, 'wb') as f:
        pkl.dump(htfa2dict(htfa), f)

with open(htfa_fname, 'rb') as f:
    htfa_dict = pkl.load(f)
htfa = dict2htfa(htfa_dict)  # overwrite htfa object with saved copy
We'll generate a plot where the global node locations are shown in black, and each subject's "local" node locations are shown in color (each subject is assigned a different color). The nodes should be in similar (but not identical) locations across subjects. Note: if the number of nodes or iterations is small, or if the voxel and/or timepoint subsampling is high, the final result will tend to be close to the initialized values. Increase max_global_iter, max_local_iter, max_voxel, and max_tr to achieve greater accuracy.
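For example, one way to trade speed for accuracy is to start from the default options and bump up individual settings before rebuilding and re-fitting the model. This is just a sketch: the keys match the parameters passed to the HTFA constructor above, and re-running the fitting cell with the modified options would cache the new fit under a different filename.
# sketch: increase accuracy-related settings before re-fitting (slower!)
params = opts(debug=debug_mode)
params['max_global_iter'] *= 2   # more updates to the shared (global) template
params['max_local_iter'] *= 2    # more updates to each subject's local nodes
params['max_voxel_scale'] = 1.0  # use every voxel when estimating node placements
params['max_tr_scale'] = 1.0     # use every timepoint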
n_timepoints = [x['Z'].shape[1] for x in htfa_data] # number of timepoints for each person
plot_nodes(htfa, n_timepoints, cmap='Spectral', global_scale=100, local_scale=25)
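As a quick sanity check, we can also quantify how far each subject's local node centers sit from the shared global template. The sketch below assumes that local_params returns one K-by-3 array of node centers per subject, with nodes in the same order as the global template returned by global_params:
# sketch: per-subject displacement of local node centers from the global template
centers, widths, weights = local_params(htfa, n_timepoints)
global_centers, global_widths = global_params(htfa)
for s, c in enumerate(centers):
    # Euclidean distance between each local node center and its global counterpart
    d = np.sqrt(np.sum((np.array(c) - np.array(global_centers)) ** 2, axis=1))
    print(f'subject {s}: mean node displacement = {d.mean():.2f}')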
The timeseries of node activations for each participant provide a low-dimensional embedding of the original data that we can use to efficiently examine dynamic connectivity patterns. Obtaining these embeddings requires some data wrangling.
centers, widths, weights = local_params(htfa, n_timepoints)
# split the weights into intact vs. (word) scrambled subjects
intact_weights = [w for i, w in enumerate(weights) if 'intact' in combined_fnames[i]]
scrambled_weights = [w for i, w in enumerate(weights) if 'word' in combined_fnames[i]]
# compute dynamic ISFC for intact, (word) scrambled
intact_disfc = tc.timecorr(intact_weights, cfun=tc.isfc, combine=tc.corrmean_combine)
scrambled_disfc = tc.timecorr(scrambled_weights, cfun=tc.isfc, combine=tc.corrmean_combine)
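Before visualizing the results, we can get a rough sense of how the two conditions relate by correlating corresponding timepoints' connectivity patterns (each row of a dISFC matrix holds one timepoint's vectorized node-by-node correlations). This is just an illustrative summary, not part of the original analysis:
# sketch: timepoint-by-timepoint similarity of intact vs. scrambled connectivity patterns
n = min(intact_disfc.shape[0], scrambled_disfc.shape[0])
pattern_similarity = np.array([np.corrcoef(intact_disfc[t], scrambled_disfc[t])[0, 1]
                               for t in range(n)])
print(f'mean intact vs. scrambled connectivity pattern similarity: {pattern_similarity.mean():.3f}')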
The cells below generate interactive figures. After running each cell, move the sliders to change which timepoints are displayed. The next cell generates a figure that displays network dynamics during the "intact" story listening experimental condition, and the subsequent cell generates a figure that displays network dynamics during the "word-scrambled" experimental condition.
# intact
if debug_mode:
    pthresh = 50
    max_frames = np.min([20, intact_disfc.shape[0], scrambled_disfc.shape[0]])
else:
    pthresh = 95
    max_frames = np.min([intact_disfc.shape[0], scrambled_disfc.shape[0]])
cthresh = np.min([np.percentile(np.abs(scrambled_disfc), pthresh), np.percentile(np.abs(intact_disfc), pthresh)])
max_frames = np.min([max_frames, 100]) # comment out this line to display the full animation (takes a long time!)
animate_chord(intact_disfc[:max_frames, :], cthresh=cthresh)
# scrambled
animate_chord(scrambled_disfc[:max_frames, :], cthresh=cthresh)
Run the cells below to generate the animations. Individual animated frames may be found in the intact_frames and scrambled_frames sub-folders of this directory. The frames are stitched together into an mp4 file so that the animation can be displayed in the notebook. You can right-click on the animations to save the files.
The next cell generates an animation for the "intact" experimental condition, and the subsequent cell generates an animation for the "word-scrambled" experimental condition.
# intact
global_centers, global_widths = global_params(htfa)
intact_ani = animate_connectome(global_centers, intact_disfc[:max_frames, :], cthresh=cthresh, figdir='intact_frames')
HTML(intact_ani.to_html5_video())
# scrambled
scrambled_ani = animate_connectome(global_centers, scrambled_disfc[:max_frames, :], cthresh=cthresh, figdir='scrambled_frames')
HTML(scrambled_ani.to_html5_video())
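If you'd like standalone copies of the videos (in addition to right-clicking on the in-notebook animations), matplotlib's Animation.save can write them to disk directly. This assumes ffmpeg is available (it is installed in the Docker image); the filenames below are arbitrary:
# sketch: save the animations as mp4 files
intact_ani.save('intact_connectome.mp4', writer='ffmpeg')
scrambled_ani.save('scrambled_connectome.mp4', writer='ffmpeg')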
Using HTFA, we were able to quickly and easily examine and compare dynamic network patterns in a large fMRI dataset using only modest computing resources. The resulting networks are intuitive and straightforward to visualize.