
initial commit of code and docs

Lennart Wittkuhn 3 years ago
commit d1227b920c

+ 2 - 1
.gitattributes

@@ -2,4 +2,5 @@
 * annex.backend=MD5E
 **/.git* annex.largefiles=nothing
 CHANGELOG.md annex.largefiles=nothing
-README.md annex.largefiles=nothing
+README.md annex.largefiles=nothing
+highspeed-glm.Rproj annex.largefiles=nothing

+ 7 - 0
.gitignore

@@ -0,0 +1,7 @@
+.Rproj.user
+.Rhistory
+.RData
+.Ruserdata
+code/*/*.html
+logs
+work

+ 0 - 0
CHANGELOG.md


+ 29 - 0
code/docs/highspeed-glm-docs.Rmd

@@ -0,0 +1,29 @@
+```{r, echo=FALSE, message=FALSE, include=FALSE}
+if (!requireNamespace("pacman")) install.packages("pacman")
+packages_cran <- c("here")
+pacman::p_load(char = packages_cran)
+if (basename(here::here()) == "highspeed"){
+  path_root = here::here("highspeed-glm")
+} else {
+  path_root = here::here()
+}
+```
+
+## First-level GLMs
+
+### Main GLM workflow (`highspeed-glm-main.py`)
+
+```{python, echo=TRUE, code=readLines(file.path(path_root, "code", "glm", "highspeed-glm-main.py")), eval=FALSE, python.reticulate=FALSE}
+```
+
+### Extra GLM functions (`highspeed_glm_functions.py`)
+
+```{python, echo=TRUE, code=readLines(file.path(path_root, "code", "glm", "highspeed_glm_functions.py")), eval=FALSE, python.reticulate=FALSE}
+```
+
+### Requirements
+
+The `requirements.txt` file lists the required packages, which can be installed, e.g., using `pip install -r requirements.txt`.
+
+```{bash, echo=TRUE, code=readLines(file.path(path_root, "code", "glm", "requirements.txt")), eval=FALSE}
+```
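+
+For example, the packages could be installed into a fresh virtual environment. This is only a minimal sketch (assuming Python 3 with the built-in `venv` module; the environment path is just a placeholder):
+
+```{bash, echo=TRUE, eval=FALSE}
+# create and activate a fresh virtual environment (placeholder path):
+python3 -m venv ~/highspeed-glm-env
+source ~/highspeed-glm-env/bin/activate
+# install the pinned dependencies listed above:
+pip install -r code/glm/requirements.txt
+```
+
+On the cluster, the PBS job template in `highspeed-glm-main.py` instead activates an existing environment via `virtualenvwrapper` (`workon highspeed-glm`).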

+ 471 - 0
code/glm/highspeed-glm-main.py

@@ -0,0 +1,471 @@
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+# ======================================================================
+# SCRIPT INFORMATION:
+# ======================================================================
+# SCRIPT: FIRST LEVEL GLM
+# PROJECT: HIGHSPEED
+# WRITTEN BY LENNART WITTKUHN, 2018 - 2020
+# CONTACT: WITTKUHN AT MPIB HYPHEN BERLIN DOT MPG DOT DE
+# MAX PLANCK RESEARCH GROUP NEUROCODE
+# MAX PLANCK INSTITUTE FOR HUMAN DEVELOPMENT
+# MAX PLANCK UCL CENTRE FOR COMPUTATIONAL PSYCHIATRY AND AGEING RESEARCH
+# LENTZEALLEE 94, 14195 BERLIN, GERMANY
+# ACKNOWLEDGEMENTS: THANKS TO HRVOJE STOJIC (UCL) FOR HELP
+# ======================================================================
+# IMPORT RELEVANT PACKAGES
+# ======================================================================
+# import basic libraries:
+import os
+import sys
+import warnings
+from os.path import join as opj
+# import nipype libraries:
+from nipype.interfaces.utility import Function, IdentityInterface
+from nipype.interfaces.io import SelectFiles, DataSink
+from nipype.pipeline.engine import Workflow, Node, MapNode
+from nipype.utils.profiler import log_nodes_cb
+from nipype import config, logging
+# import spm and matlab interfaces:
+from nipype.algorithms.modelgen import SpecifySPMModel
+from nipype.interfaces.spm.model import (
+    Level1Design, EstimateModel, EstimateContrast, ThresholdStatistics,
+    Threshold)
+from nipype.interfaces.matlab import MatlabCommand
+from nipype.interfaces import spm
+# import fsl interfaces:
+from nipype.workflows.fmri.fsl import create_susan_smooth
+from nipype.interfaces.fsl.utils import ExtractROI
+# import libraries for bids interaction:
+from bids.layout import BIDSLayout
+# import freesurfer interfaces:
+# import custom functions:
+from highspeed_glm_functions import (
+    get_subject_info, plot_stat_maps, leave_one_out)
+# ======================================================================
+# ENVIRONMENT SETTINGS (DEALING WITH ERRORS AND WARNINGS):
+# ======================================================================
+# set the fsl output type environment variable:
+os.environ['FSLOUTPUTTYPE'] = 'NIFTI_GZ'
+# deal with nipype-related warnings:
+os.environ["TF_CPP_MIN_LOG_LEVEL"] = "3"
+# inhibit CTF lock
+os.environ['MCR_INHIBIT_CTF_LOCK'] = '1'
+# filter out warnings related to the numpy package:
+warnings.filterwarnings("ignore", message="numpy.dtype size changed*")
+warnings.filterwarnings("ignore", message="numpy.ufunc size changed*")
+# ======================================================================
+# SET PATHS AND SUBJECTS
+# ======================================================================
+# define paths depending on the operating system (OS) platform:
+project = 'highspeed'
+# initialize empty paths:
+path_root = None
+sub_list = None
+if 'darwin' in sys.platform:
+    path_root = opj('/Users', 'wittkuhn', 'Volumes', 'tardis_beegfs', project)
+    path_spm = '/Users/Shared/spm12'
+    path_matlab = '/Applications/MATLAB_R2017a.app/bin/matlab -nodesktop -nosplash'
+    # set paths for spm:
+    spm.SPMCommand.set_mlab_paths(paths=path_spm, matlab_cmd=path_matlab)
+    MatlabCommand.set_default_paths(path_spm)
+    MatlabCommand.set_default_matlab_cmd(path_matlab)
+    sub_list = ['sub-01']
+elif 'linux' in sys.platform:
+    path_root = opj('/home', 'mpib', 'wittkuhn', project, 'highspeed-glm')
+    # path_matlab = '/home/mpib/wittkuhn/spm12.simg eval \$SPMMCRCMD'
+    # path_matlab = opj('/home', 'beegfs', 'wittkuhn', 'tools', 'spm', 'spm12.simg eval \$SPMMCRCMD')
+    singularity_cmd = 'singularity run -B /home/mpib/wittkuhn -B /mnt/beegfs/home/wittkuhn /home/mpib/wittkuhn/highspeed/highspeed-glm/tools/spm/spm12.simg'
+    singularity_spm = 'eval \$SPMMCRCMD'
+    path_matlab = ' '.join([singularity_cmd, singularity_spm])
+    spm.SPMCommand.set_mlab_paths(matlab_cmd=path_matlab, use_mcr=True)
+    # grab the list of subjects from the bids data set:
+    path_bids = opj(path_root, 'bids')
+    layout = BIDSLayout(path_bids)
+    # get all subject ids:
+    sub_list = sorted(layout.get_subjects())
+    # create a template to add the "sub-" prefix to the ids
+    sub_template = ['sub-'] * len(sub_list)
+    # add the prefix to all ids:
+    sub_list = ["%s%s" % t for t in zip(sub_template, sub_list)]
+    # select the subset of subjects specified by the user via command-line arguments:
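+    # (e.g., passing `0 1` on the command line selects only the first subject)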
+    sub_list = sub_list[int(sys.argv[1]):int(sys.argv[2])]
+# print the SPM version:
+print('using SPM version %s' % spm.SPMCommand().version)
+# ======================================================================
+# DEFINE PBS CLUSTER JOB TEMPLATE (NEEDED WHEN RUNNING ON THE CLUSTER):
+# ======================================================================
+job_template = """
+#PBS -l walltime=10:00:00
+#PBS -j oe
+#PBS -o /home/mpib/wittkuhn/highspeed/highspeed-glm/logs/glm
+#PBS -m n
+#PBS -v FSLOUTPUTTYPE=NIFTI_GZ
+source /etc/bash_completion.d/virtualenvwrapper
+workon highspeed-glm
+module load fsl/5.0
+module load matlab/R2017b
+module load freesurfer/6.0.0
+"""
+# ======================================================================
+# SETTING UP LOGGING
+# ======================================================================
+#path_log = opj(path_root, 'logs', 'l1analysis')
+# enable debug mode for logging and configuration:
+#config.enable_debug_mode()
+# enable logging to file and provide path to the logging file:
+#config.update_config({'logging': {'log_directory': path_log,
+#                                  'log_to_file': True},
+#                      'execution': {'stop_on_first_crash': False,
+#                                    'keep_unnecessary_outputs': 'false'},
+#                      'monitoring': {'enabled': True}
+#                      })
+# update the global logging settings:
+# logging.update_logging(config)
+# callback_log_path = opj(path_log,'ressources.log')
+# logger = logging.getLogger('callback')
+# logger.setLevel(logging.DEBUG)
+# handler = logging.FileHandler(callback_log_path)
+# logger.addHandler(handler)
+# ======================================================================
+# SETTING UP LOGGING
+# ======================================================================
+#path_log = opj(path_root, 'logs', 'l1analysis')
+## create directory to save the log files if it does not exist yet:
+#if not os.path.exists(path_log):
+#    os.makedirs(path_log)
+## configure logging:
+#logging.basicConfig(
+#        filename=opj(path_log,'log_l1analysis.log'),
+#        level=logging.DEBUG,
+#        filemode = "a+",
+#        format='%(asctime)s - %(levelname)s - %(message)s',
+#        datefmt='%d/%m/%Y %H:%M:%S')
+#logging.getLogger().addHandler(logging.StreamHandler())
+# ======================================================================
+# LOG INFORMATION ABOUT THE EXECUTION
+# ======================================================================
+# print the loaded SPM version:
+#analysis_name = "Level 1 GLM analysis"
+#logging.info("--------------------------------------------------------")
+#logging.info("Analysis: " + analysis_name)
+#logging.info("SPM version: " + (spm.SPMCommand().version))
+#logging.info("List of subjects:")
+#logging.info(sub_list)
+# ======================================================================
+# DEFINE SETTINGS
+# ======================================================================
+# time of repetition, in seconds:
+time_repetition = 1.25
+# total number of runs:
+num_runs = 8
+# smoothing kernel, in mm:
+fwhm = 4
+# number of dummy volumes to remove from the beginning of each run:
+num_dummy = 0
+# ======================================================================
+# DEFINE NODE: INFOSOURCE
+# ======================================================================
+# define the infosource node that collects the data:
+infosource = Node(IdentityInterface(
+    fields=['subject_id']), name='infosource')
+# let the node iterate (paralellize) over all subjects:
+infosource.iterables = [('subject_id', sub_list)]
+# ======================================================================
+# DEFINE SELECTFILES NODE
+# ======================================================================
+# define all relevant files paths:
+templates = dict(
+    confounds=opj(path_root, 'derivatives', 'fmriprep', '{subject_id}',
+                  '*', 'func', '*highspeed*confounds_regressors.tsv'),
+    events=opj(path_root, 'bids', '{subject_id}', '*', 'func',
+               '*events.tsv'),
+    func=opj(path_root, 'derivatives', 'fmriprep', '{subject_id}', '*',
+             'func', '*highspeed*space-T1w*preproc_bold.nii.gz'),
+    anat=opj(path_root, 'derivatives', 'fmriprep', '{subject_id}',
+             'anat', '{subject_id}_desc-preproc_T1w.nii.gz'),
+    wholemask=opj(path_root, 'derivatives', 'fmriprep', '{subject_id}',
+                  '*', 'func', '*highspeed*space-T1w*brain_mask.nii.gz'),
+)
+# define the selectfiles node:
+selectfiles = Node(SelectFiles(templates, sort_filelist=True),
+                   name='selectfiles')
+# set expected thread and memory usage for the node:
+selectfiles.interface.num_threads = 1
+selectfiles.interface.mem_gb = 0.1
+# selectfiles.inputs.subject_id = 'sub-20'
+# selectfiles_results = selectfiles.run()
+# ======================================================================
+# DEFINE CREATE_SUSAN_SMOOTH WORKFLOW NODE
+# ======================================================================
+# define the susan smoothing node and specify the smoothing fwhm:
+susan = create_susan_smooth()
+# set the smoothing kernel:
+susan.inputs.inputnode.fwhm = fwhm
+# set expected thread and memory usage for the nodes:
+susan.get_node('inputnode').interface.num_threads = 1
+susan.get_node('inputnode').interface.mem_gb = 0.1
+susan.get_node('median').interface.num_threads = 1
+susan.get_node('median').interface.mem_gb = 3
+susan.get_node('mask').interface.num_threads = 1
+susan.get_node('mask').interface.mem_gb = 3
+susan.get_node('meanfunc2').interface.num_threads = 1
+susan.get_node('meanfunc2').interface.mem_gb = 3
+susan.get_node('merge').interface.num_threads = 1
+susan.get_node('merge').interface.mem_gb = 3
+susan.get_node('multi_inputs').interface.num_threads = 1
+susan.get_node('multi_inputs').interface.mem_gb = 3
+susan.get_node('smooth').interface.num_threads = 1
+susan.get_node('smooth').interface.mem_gb = 3
+susan.get_node('outputnode').interface.num_threads = 1
+susan.get_node('outputnode').interface.mem_gb = 0.1
+# ======================================================================
+# DEFINE NODE: FUNCTION TO GET THE SUBJECT-SPECIFIC INFORMATION
+# ======================================================================
+subject_info = MapNode(Function(
+    input_names=['events', 'confounds'],
+    output_names=['subject_info', 'event_names'],
+    function=get_subject_info),
+    name='subject_info', iterfield=['events', 'confounds'])
+# set expected thread and memory usage for the node:
+subject_info.interface.num_threads = 1
+subject_info.interface.mem_gb = 0.1
+# subject_info.inputs.events = selectfiles_results.outputs.events
+# subject_info.inputs.confounds = selectfiles_results.outputs.confounds
+# subject_info_results = subject_info.run()
+# subject_info_results.outputs.subject_info
+# ======================================================================
+# DEFINE NODE: REMOVE DUMMY VARIABLES (USING FSL ROI)
+# ======================================================================
+# function: extract region of interest (ROI) from an image
+trim = MapNode(ExtractROI(), name='trim', iterfield=['in_file'])
+# define index of the first selected volume (i.e., minimum index):
+trim.inputs.t_min = num_dummy
+# define the number of volumes selected starting at the minimum index:
+trim.inputs.t_size = -1
+# define the fsl output type:
+trim.inputs.output_type = 'NIFTI'
+# set expected thread and memory usage for the node:
+trim.interface.num_threads = 1
+trim.interface.mem_gb = 3
+# ======================================================================
+# DEFINE NODE: LEAVE-ONE-RUN-OUT SELECTION OF DATA
+# ======================================================================
+leave_one_run_out = Node(Function(
+    input_names=['subject_info', 'event_names', 'data_func', 'run'],
+    output_names=['subject_info', 'data_func', 'contrasts'],
+    function=leave_one_out),
+    name='leave_one_run_out')
+# let the node iterate over all run indices (leaving one run out per iteration):
+leave_one_run_out.iterables = ('run', range(num_runs))
+# ======================================================================
+# DEFINE NODE: SPECIFY SPM MODEL (GENERATE SPM-SPECIFIC MODEL)
+# ======================================================================
+# function: makes a model specification compatible with spm designers
+# adds SPM specific options to SpecifyModel
+l1model = Node(SpecifySPMModel(), name="l1model")
+# input: concatenate runs to a single session (boolean, default: False):
+l1model.inputs.concatenate_runs = False
+# input: units of event onsets and durations (secs or scans):
+l1model.inputs.input_units = 'secs'
+# input: units of design event onsets and durations (secs or scans):
+l1model.inputs.output_units = 'secs'
+# input: time of repetition (a float):
+l1model.inputs.time_repetition = time_repetition
+# high-pass filter cutoff in secs (a float, default = 128 secs):
+l1model.inputs.high_pass_filter_cutoff = 128
+# ======================================================================
+# DEFINE NODE: LEVEL 1 DESIGN (GENERATE AN SPM DESIGN MATRIX)
+# ======================================================================
+# function: generate an SPM design matrix
+l1design = Node(Level1Design(), name="l1design")
+# input: (a dictionary with keys which are 'hrf' or 'fourier' or
+# 'fourier_han' or 'gamma' or 'fir' and with values which are any value)
+l1design.inputs.bases = {'hrf': {'derivs': [0, 0]}}
+# input: units for specification of onsets ('secs' or 'scans'):
+l1design.inputs.timing_units = 'secs'
+# input: interscan interval / repetition time in secs (a float):
+l1design.inputs.interscan_interval = time_repetition
+# input: Model serial correlations AR(1), FAST or none:
+l1design.inputs.model_serial_correlations = 'AR(1)'
+# input: number of time-bins per scan in secs (an integer):
+l1design.inputs.microtime_resolution = 16
+# input: the onset/time-bin in seconds for alignment (a float):
+l1design.inputs.microtime_onset = 1
+# set expected thread and memory usage for the node:
+l1design.interface.num_threads = 1
+l1design.interface.mem_gb = 2
+# ======================================================================
+# DEFINE NODE: ESTIMATE MODEL (ESTIMATE THE PARAMETERS OF THE MODEL)
+# ======================================================================
+# function: use spm_spm to estimate the parameters of a model
+l1estimate = Node(EstimateModel(), name="l1estimate")
+# input: (a dictionary with keys which are 'Classical' or 'Bayesian2'
+# or 'Bayesian' and with values which are any value)
+l1estimate.inputs.estimation_method = {'Classical': 1}
+# set expected thread and memory usage for the node:
+l1estimate.interface.num_threads = 1
+l1estimate.interface.mem_gb = 2
+# ======================================================================
+# DEFINE NODE: ESTIMATE CONTRASTS (ESTIMATES THE CONTRASTS)
+# ======================================================================
+# function: use spm_contrasts to estimate contrasts of interest
+l1contrasts = Node(EstimateContrast(), name="l1contrasts")
+# input: list of contrasts with each contrast being a list of the form:
+# [('name', 'stat', [condition list], [weight list], [session list])]:
+# l1contrasts.inputs.contrasts = l1contrasts_list
+# node input: overwrite previous results:
+l1contrasts.overwrite = True
+# set expected thread and memory usage for the node:
+l1contrasts.interface.num_threads = 1
+l1contrasts.interface.mem_gb = 1.5
+# ======================================================================
+# DEFINE NODE: FUNCTION TO PLOT CONTRASTS
+# ======================================================================
+plot_contrasts = MapNode(Function(
+    input_names=['anat', 'stat_map', 'thresh'],
+    output_names=['out_path'],
+    function=plot_stat_maps),
+    name='plot_contrasts', iterfield=['thresh'])
+# input: plot data with a set of different thresholds:
+plot_contrasts.inputs.thresh = [None, 1, 2, 3]
+# set expected thread and memory usage for the node:
+plot_contrasts.interface.num_threads = 1
+plot_contrasts.interface.mem_gb = 0.2
+# ======================================================================
+# DEFINE NODE: THRESHOLD
+# ======================================================================
+# function: Topological FDR thresholding based on cluster extent/size.
+# Smoothness is estimated from GLM residuals but is assumed to be the
+# same for all of the voxels.
+thresh = Node(Threshold(), name="thresh")
+# input: whether to use FWE (Bonferroni) correction for initial threshold
+# (a boolean, nipype default value: True):
+thresh.inputs.use_fwe_correction = False
+# input: whether to use FDR over cluster extent probabilities (boolean)
+thresh.inputs.use_topo_fdr = True
+# input: value for initial thresholding (defining clusters):
+thresh.inputs.height_threshold = 0.05
+# input: is the cluster forming threshold a stat value or p-value?
+# ('p-value' or 'stat', nipype default value: p-value):
+thresh.inputs.height_threshold_type = 'p-value'
+# input: which contrast in the SPM.mat to use (an integer):
+thresh.inputs.contrast_index = 1
+# input: p threshold on FDR corrected cluster size probabilities (float):
+thresh.inputs.extent_fdr_p_threshold = 0.05
+# input: minimum cluster size in voxels (an integer, default = 0):
+thresh.inputs.extent_threshold = 0
+# set expected thread and memory usage for the node:
+thresh.interface.num_threads = 1
+thresh.interface.mem_gb = 0.2
+# ======================================================================
+# DEFINE NODE: THRESHOLD STATISTICS
+# ======================================================================
+# function: Given height and cluster size threshold calculate
+# theoretical probabilities concerning false positives
+thresh_stat = Node(ThresholdStatistics(), name="thresh_stat")
+# input: which contrast in the SPM.mat to use (an integer):
+thresh_stat.inputs.contrast_index = 1
+# ======================================================================
+# CREATE DATASINK NODE (OUTPUT STREAM):
+# ======================================================================
+# create a node of the function:
+l1datasink = Node(DataSink(), name='datasink')
+# assign the path to the base directory:
+l1datasink.inputs.base_directory = opj(path_root, 'l1pipeline')
+# create a list of substitutions to adjust the file paths of datasink:
+substitutions = [('_subject_id_', '')]
+# assign the substitutions to the datasink command:
+l1datasink.inputs.substitutions = substitutions
+# determine whether to store output in parameterized form:
+l1datasink.inputs.parameterization = True
+# set expected thread and memory usage for the node:
+l1datasink.interface.num_threads = 1
+l1datasink.interface.mem_gb = 0.2
+# ======================================================================
+# DEFINE THE LEVEL 1 ANALYSIS SUB-WORKFLOW AND CONNECT THE NODES:
+# ======================================================================
+# initiation of the 1st-level analysis workflow:
+l1analysis = Workflow(name='l1analysis')
+# connect the 1st-level analysis components
+l1analysis.connect(l1model, 'session_info', l1design, 'session_info')
+l1analysis.connect(l1design, 'spm_mat_file', l1estimate, 'spm_mat_file')
+l1analysis.connect(l1estimate, 'spm_mat_file', l1contrasts, 'spm_mat_file')
+l1analysis.connect(l1estimate, 'beta_images', l1contrasts, 'beta_images')
+l1analysis.connect(l1estimate, 'residual_image', l1contrasts, 'residual_image')
+# ======================================================================
+# DEFINE META-WORKFLOW PIPELINE:
+# ======================================================================
+# initiation of the meta-workflow pipeline:
+l1pipeline = Workflow(name='l1pipeline')
+# stop execution of the workflow if an error is encountered:
+l1pipeline.config = {'execution': {'stop_on_first_crash': True,
+                                   'hash_method': 'timestamp'}}
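+# (with 'timestamp' hashing, nipype compares file modification times instead of
+# content hashes when deciding whether a node needs to be re-run)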
+# define the base directory of the workflow:
+l1pipeline.base_dir = opj(path_root, 'work')
+# ======================================================================
+# ENABLE LOGGING:
+# ======================================================================
+# enable logging to file:
+#config.enable_debug_mode()
+#config.update_config({'logging': {'log_directory': os.getcwd(),
+#                                  'log_to_file': True}})
+#logging.update_logging(config)
+# ======================================================================
+# CONNECT WORKFLOW NODES:
+# ======================================================================
+# connect infosource to selectfiles node:
+l1pipeline.connect(infosource, 'subject_id', selectfiles, 'subject_id')
+# generate subject specific events and regressors to subject_info:
+l1pipeline.connect(selectfiles, 'events', subject_info, 'events')
+l1pipeline.connect(selectfiles, 'confounds', subject_info, 'confounds')
+# connect functional files to smoothing workflow:
+l1pipeline.connect(selectfiles, 'func', susan, 'inputnode.in_files')
+l1pipeline.connect(selectfiles, 'wholemask', susan, 'inputnode.mask_file')
+l1pipeline.connect(susan, 'outputnode.smoothed_files', l1datasink, 'smooth')
+# connect smoothed functional data to the trimming node:
+l1pipeline.connect(susan, 'outputnode.smoothed_files', trim, 'in_file')
+# ======================================================================
+# INPUT AND OUTPUT STREAM FOR THE LEVEL 1 SPM ANALYSIS SUB-WORKFLOW:
+# ======================================================================
+# connect regressors to the subsetting node:
+l1pipeline.connect(subject_info, 'subject_info', leave_one_run_out, 'subject_info')
+# connect event_names to the subsetting node:
+l1pipeline.connect(subject_info, 'event_names', leave_one_run_out, 'event_names')
+# connect smoothed and trimmed data to subsetting node:
+l1pipeline.connect(trim, 'roi_file', leave_one_run_out, 'data_func')
+# connect regressors to the level 1 model specification node:
+l1pipeline.connect(leave_one_run_out, 'subject_info', l1analysis, 'l1model.subject_info')
+# connect smoothed and trimmed data to the level 1 model specification:
+l1pipeline.connect(leave_one_run_out, 'data_func', l1analysis, 'l1model.functional_runs')
+# connect l1 contrast specification to contrast estimation
+l1pipeline.connect(leave_one_run_out, 'contrasts', l1analysis, 'l1contrasts.contrasts')
+# connect the anatomical image to the plotting node:
+l1pipeline.connect(selectfiles, 'anat', plot_contrasts, 'anat')
+# connect spm t-images to the plotting node:
+l1pipeline.connect(l1analysis, 'l1contrasts.spmT_images', plot_contrasts, 'stat_map')
+# connect the t-images and spm mat file to the threshold node:
+l1pipeline.connect(l1analysis, 'l1contrasts.spmT_images', thresh, 'stat_image')
+l1pipeline.connect(l1analysis, 'l1contrasts.spm_mat_file', thresh, 'spm_mat_file')
+# connect all output results of the level 1 analysis to the datasink:
+l1pipeline.connect(l1analysis, 'l1estimate.beta_images', l1datasink, 'estimates.@beta_images')
+l1pipeline.connect(l1analysis, 'l1estimate.residual_image', l1datasink, 'estimates.@residual_image')
+l1pipeline.connect(l1analysis, 'l1contrasts.spm_mat_file', l1datasink, 'contrasts.@spm_mat')
+l1pipeline.connect(l1analysis, 'l1contrasts.spmT_images', l1datasink, 'contrasts.@spmT')
+l1pipeline.connect(l1analysis, 'l1contrasts.con_images', l1datasink, 'contrasts.@con')
+l1pipeline.connect(plot_contrasts, 'out_path', l1datasink, 'contrasts.@out_path')
+l1pipeline.connect(thresh, 'thresholded_map', l1datasink, 'thresh.@threshhold_map')
+l1pipeline.connect(thresh, 'pre_topo_fdr_map', l1datasink, 'thresh.@pre_topo_fdr_map')
+# ======================================================================
+# WRITE GRAPH AND EXECUTE THE WORKFLOW
+# ======================================================================
+# write the graph:
+l1pipeline.write_graph(graph2use='colored', simple_form=True)
+# set the maximum resources the workflow can utilize:
+# args_dict = {'status_callback' : log_nodes_cb}
+# execute the workflow depending on the operating system:
+if 'darwin' in sys.platform:
+    # will execute the workflow using all available cpus:
+    l1pipeline.run(plugin='MultiProc')
+elif 'linux' in sys.platform:
+    l1pipeline.run(plugin='PBS', plugin_args=dict(template=job_template))

+ 136 - 0
code/glm/highspeed_glm_functions.py

@@ -0,0 +1,136 @@
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+
+# ======================================================================
+# DEFINE FUNCTION: FUNCTION TO GET THE SUBJECT-SPECIFIC INFORMATION
+# ======================================================================
+
+
+def get_subject_info(events, confounds):
+    """
+    FUNCTION TO GET THE SUBJECT-SPECIFIC INFORMATION
+    :param events: list with paths to events files
+    :param confounds: list with paths to confounds files
+    :return: Bunch object with event onsets, durations and regressors
+    """
+
+    # import libraries (needed to be done in the function):
+    import pandas as pd
+    from nipype.interfaces.base import Bunch
+
+    # event types we consider:
+    event_spec = {
+        'correct_rejection': {'target': 0, 'key_down': 0},
+        'hit': {'target': 1, 'key_down': 1},
+        'false_alarm': {'target': 0, 'key_down': 1},
+        'miss': {'target': 1, 'key_down': 0},
+    }
+
+    #event_names = ['correct_rejection']
+
+    # read the events and confounds files of the current run:
+    #events = selectfiles_results.outputs.events[0]
+    #confounds = selectfiles_results.outputs.confounds[0]
+    run_events = pd.read_csv(events, sep="\t")
+    run_confounds = pd.read_csv(confounds, sep="\t")
+
+    # define confounds to include as regressors:
+    confounds = ['trans', 'rot', 'a_comp_cor', 'framewise_displacement']
+
+    # search for confounds of interest in the confounds data frame:
+    regressor_names = [col for col in run_confounds.columns if
+                       any([conf in col for conf in confounds])]
+
+    def replace_nan(regressor_values):
+        # calculate the mean value of the regressor:
+        mean_value = regressor_values.mean(skipna=True)
+        # replace all values containing nan with the mean value:
+        regressor_values[regressor_values.isnull()] = mean_value
+        # return list of the regressor values:
+        return list(regressor_values)
+
+    # create a nested list with regressor values
+    regressors = [replace_nan(run_confounds[conf]) for conf in regressor_names]
+
+    onsets = []
+    durations = []
+    event_names = []
+
+    for event in event_spec:
+
+        onset_list = list(
+            run_events['onset']
+            [(run_events['condition'] == 'oddball') &
+             (run_events['target'] == event_spec[event]['target']) &
+             (run_events['key_down'] == event_spec[event]['key_down'])])
+
+        duration_list = list(
+            run_events['duration']
+            [(run_events['condition'] == 'oddball') &
+             (run_events['target'] == event_spec[event]['target']) &
+             (run_events['key_down'] == event_spec[event]['key_down'])])
+
+        if (onset_list != []) & (duration_list != []):
+            event_names.append(event)
+            onsets.append(onset_list)
+            durations.append(duration_list)
+
+    # create a bunch for each run:
+    subject_info = Bunch(
+        conditions=event_names, onsets=onsets, durations=durations,
+        regressor_names=regressor_names, regressors=regressors)
+
+    return subject_info, sorted(event_names)
+
+# ======================================================================
+# DEFINE FUNCTION: FUNCTION TO PLOT THE CONTRASTS AGAINST ANATOMICAL
+# ======================================================================
+
+
+def plot_stat_maps(anat, stat_map, thresh):
+    """
+
+    :param anat:
+    :param stat_map:
+    :param thresh:
+    :return:
+    """
+    # import libraries (needed to be done in the function):
+    from nilearn.plotting import plot_stat_map
+    from os import path as op
+
+    out_path = op.join(op.dirname(stat_map), 'contrast_thresh_%s.png' % thresh)
+    plot_stat_map(
+            stat_map, title=('Threshold: %s' % thresh),
+            bg_img=anat, threshold=thresh, dim=-1, display_mode='ortho',
+            output_file=out_path)
+
+    return out_path
+
+
+def leave_one_out(subject_info, event_names, data_func, run):
+    """
+    Select subsets of lists in leave-one-out fashion:
+    :param subject_info: list of subject info bunch objects
+    :param data_func: list of functional runs
+    :param run: current run
+    :return: return list of subject info and data excluding the current run
+    """
+
+    # create new list with event_names of all runs except current run:
+    event_names = [info for i, info in enumerate(event_names) if i != run]
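+    # find the condition list of the remaining run with the most event types
+    # (used to define the contrast below):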
+    num_events = [len(i) for i in event_names]
+    max_events = event_names[num_events.index(max(num_events))]
+
+    # create list of contrasts:
+    stim = 'correct_rejection'
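+    # a single T-contrast: weight 1 for the correct_rejection regressor,
+    # 0 for all other conditions: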
+    contrast1 = (stim, 'T', max_events, [1 if stim in s else 0 for s in max_events])
+    contrasts = [contrast1]
+
+    # create new list with subject info of all runs except current run:
+    subject_info = [info for i, info in enumerate(subject_info) if i != run]
+    # create new list with functional data of all runs except current run:
+    data_func = [info for i, info in enumerate(data_func) if i != run]
+
+    # return the new lists
+    return subject_info, data_func, contrasts

+ 89 - 0
code/glm/requirements.txt

@@ -0,0 +1,89 @@
+alabaster==0.7.10
+apipkg==1.4
+asn1crypto==0.24.0
+atomicwrites==1.1.5
+attrs==18.1.0
+Babel==2.6.0
+bcrypt==3.1.4
+certifi==2018.4.16
+cffi==1.11.5
+chardet==3.0.4
+citeproc-py==0.4.0
+click==6.7
+codecov==2.0.15
+configparser==3.5.0
+coverage==4.5.1
+cryptography==2.2.2
+cycler==0.10.0
+decorator==4.3.0
+dipy==0.14.0
+docutils==0.14
+duecredit==0.6.3
+execnet==1.5.0
+funcsigs==1.0.2
+future==0.16.0
+futures==3.1.1
+grabbit==0.2.5
+h5py==2.8.0
+idna==2.7
+imagesize==1.0.0
+isodate==0.6.0
+Jinja2==2.10
+kiwisolver==1.0.1
+lxml==4.2.1
+MarkupSafe==1.0
+matplotlib==2.2.2
+mock==2.0.0
+more-itertools==4.2.0
+mpmath==1.0.0
+networkx==2.1
+neurdflib==5.0.0.post1
+nibabel==2.2.1
+nilearn==0.4.1
+nipy==0.4.2
+nipype==1.1.5
+nitime==0.7
+num2words==0.5.6
+numpy==1.14.4
+numpydoc==0.8.0
+packaging==17.1
+pandas==0.23.4
+paramiko==2.4.1
+patsy==0.5.0
+pbr==4.0.4
+pkg-resources==0.0.0
+pluggy==0.6.0
+prov==1.5.2
+psutil==5.4.6
+py==1.5.3
+pyasn1==0.4.3
+pybids==0.6.5
+pycparser==2.18
+pydeface==2.0
+pydot==1.2.4
+pydotplus==2.0.2
+Pygments==2.2.0
+PyNaCl==1.2.1
+pyparsing==2.2.0
+pytest==3.6.1
+pytest-cov==2.5.1
+pytest-env==0.6.2
+pytest-forked==0.2
+pytest-xdist==1.22.2
+python-dateutil==2.7.3
+pytz==2018.4
+rdflib==4.2.2
+requests==2.18.4
+scikit-learn==0.20.3
+scipy==1.1.0
+simplejson==3.15.0
+six==1.11.0
+sklearn==0.0
+snowballstemmer==1.2.1
+Sphinx==1.7.5
+sphinxcontrib-websupport==1.1.0
+sympy==1.1.1
+traits==4.6.0
+urllib3==1.22
+xvfbwrapper==0.2.9
+yapf==0.22.0

+ 16 - 0
highspeed-glm.Rproj

@@ -0,0 +1,16 @@
+Version: 1.0
+
+RestoreWorkspace: No
+SaveWorkspace: No
+AlwaysSaveHistory: No
+
+EnableCodeIndexing: Yes
+UseSpacesForTab: Yes
+NumSpacesForTab: 2
+Encoding: UTF-8
+
+RnwWeave: Sweave
+LaTeX: pdfLaTeX
+
+AutoAppendNewline: Yes
+StripTrailingWhitespace: Yes