Generate tedana walkthrough figures#

Important

The contents of this chapter will be moved into TE_Dependence and, to a lesser extent, Signal_Decay, and this chapter will be removed.

Hide code cell content

import json
import os
from glob import glob

import matplotlib.pyplot as plt
import nibabel as nb
import nitransforms as nit
import numpy as np
import pandas as pd
import seaborn as sns
from myst_nb import glue
from nilearn import image, masking, plotting
from tedana.io import load_data, new_nii_like
from tedana.utils import make_adaptive_mask

data_path = os.path.abspath('../DATA')

ted_dir = os.path.join(data_path, "tedana")

Load data#

Hide code cell content

func_dir = os.path.join(data_path, "ds006185/sub-24053/ses-1/func/")
data_files = sorted(
    glob(
        os.path.join(
            func_dir,
            "sub-24053_ses-1_task-rat_rec-nordic_dir-PA_run-01_echo-*_part-mag_desc-preproc_bold.nii.gz",
        ),
    ),
)
echo_times = []
for f in data_files:
    json_file = f.replace('.nii.gz', '.json')
    with open(json_file, 'r') as fo:
        metadata = json.load(fo)
    echo_times.append(metadata['EchoTime'] * 1000)
echo_times = np.round(np.array(echo_times), 2)
mask_file = os.path.join(
    func_dir,
    "sub-24053_ses-1_task-rat_rec-nordic_dir-PA_run-01_part-mag_desc-brain_mask.nii.gz"
)
confounds_file = os.path.join(
    func_dir,
    "sub-24053_ses-1_task-rat_rec-nordic_dir-PA_run-01_part-mag_desc-confounds_timeseries.tsv",
)

# Background anatomical image
anat_dir = os.path.join(data_path, "ds006185/sub-24053/ses-1/anat/")
xfm = os.path.join(
    func_dir,
    "sub-24053_ses-1_task-rat_rec-nordic_dir-PA_run-01_from-boldref_to-T1w_mode-image_desc-coreg_xfm.txt",
)
xfm = nit.linear.load(xfm, fmt="itk")
t1_file = os.path.join(anat_dir, "sub-24053_ses-1_rec-norm_desc-preproc_T1w.nii.gz")
bg_img = xfm.apply(spatialimage=t1_file, reference=data_files[0])

# Tedana outputs
adaptive_mask_file = os.path.join(
    ted_dir,
    "sub-24053_ses-1_task-rat_rec-nordic_dir-PA_run-01_desc-adaptiveGoodSignal_mask.nii.gz",
)
mask = image.math_img("img >= 3", img=adaptive_mask_file)

# Optimally combined data
oc = masking.apply_mask(
    os.path.join(ted_dir, "sub-24053_ses-1_task-rat_rec-nordic_dir-PA_run-01_desc-optcom_bold.nii.gz"),
    mask,
)
oc_z = (oc - np.mean(oc, axis=0)) / np.std(oc, axis=0)

# Results from MEPCA
mepca_mmix = pd.read_table(
    os.path.join(ted_dir, "sub-24053_ses-1_task-rat_rec-nordic_dir-PA_run-01_desc-PCA_mixing.tsv"),
).values
oc_red = masking.apply_mask(
    os.path.join(
        ted_dir, "sub-24053_ses-1_task-rat_rec-nordic_dir-PA_run-01_desc-optcom_whitened_bold.nii.gz"
    ),
    mask,
)

# Results from MEICA
meica_mmix = pd.read_table(
    os.path.join(ted_dir, "sub-24053_ses-1_task-rat_rec-nordic_dir-PA_run-01_desc-ICA_mixing.tsv"),
).values
norm_weights = masking.apply_mask(
    os.path.join(
        ted_dir,
        "sub-24053_ses-1_task-rat_rec-nordic_dir-PA_run-01_desc-ICAAveragingWeights_components.nii.gz",
    ),
    mask,
)
meica_beta_files = sorted(
    glob(
        os.path.join(
            ted_dir,
            "sub-24053_ses-1_task-rat_rec-nordic_dir-PA_run-01_echo-*_desc-ICA_components.nii.gz",
        ),
    ),
)
meica_betas = np.dstack([masking.apply_mask(f, mask).T for f in meica_beta_files])
meica_betas = np.swapaxes(meica_betas, 1, 2)

r2_pred_beta_files = sorted(
    glob(
        os.path.join(
            ted_dir,
            "sub-24053_ses-1_task-rat_rec-nordic_dir-PA_run-01_echo-*_desc-ICAT2ModelPredictions_components.nii.gz",
        ),
    ),
)
r2_pred_betas = np.dstack([masking.apply_mask(f, mask).T for f in r2_pred_beta_files])
r2_pred_betas = np.swapaxes(r2_pred_betas, 1, 2)
s0_pred_beta_files = sorted(
    glob(
        os.path.join(
            ted_dir,
            "sub-24053_ses-1_task-rat_rec-nordic_dir-PA_run-01_echo-*_desc-ICAS0ModelPredictions_components.nii.gz",
        ),
    ),
)
s0_pred_betas = np.dstack([masking.apply_mask(f, mask).T for f in s0_pred_beta_files])
s0_pred_betas = np.swapaxes(s0_pred_betas, 1, 2)

# Component parameter estimates
betas_file = os.path.join(
    ted_dir, "sub-24053_ses-1_task-rat_rec-nordic_dir-PA_run-01_desc-ICA_components.nii.gz"
)
beta_maps = masking.apply_mask(betas_file, mask)

# Multi-echo denoised data
dn_data = masking.apply_mask(
    os.path.join(
        ted_dir, "sub-24053_ses-1_task-rat_rec-nordic_dir-PA_run-01_desc-denoised_bold.nii.gz"
    ),
    mask,
)
hk_data = masking.apply_mask(
    os.path.join(
        ted_dir, "sub-24053_ses-1_task-rat_rec-nordic_dir-PA_run-01_desc-optcomAccepted_bold.nii.gz"
    ),
    mask,
)

# Post-processed data
dn_t1c_data = masking.apply_mask(
    os.path.join(
        ted_dir, "sub-24053_ses-1_task-rat_rec-nordic_dir-PA_run-01_desc-optcomMIRDenoised_bold.nii.gz"
    ),
    mask,
)
hk_t1c_data = masking.apply_mask(
    os.path.join(
        ted_dir, "sub-24053_ses-1_task-rat_rec-nordic_dir-PA_run-01_desc-optcomAcceptedMIRDenoised_bold.nii.gz"
    ),
    mask,
)

# Component table
comp_tbl = pd.read_table(
    os.path.join(ted_dir, "sub-24053_ses-1_task-rat_rec-nordic_dir-PA_run-01_desc-tedana_metrics.tsv"),
    index_col="Component",
)

# Get voxel index for voxel most related to component with highest kappa value
acc_comp_tbl = comp_tbl.loc[comp_tbl["classification"] == "accepted"]
high_kappa_comp = acc_comp_tbl.sort_values(by="kappa", ascending=False).index.values[0]
high_kappa_comp_val = int(high_kappa_comp.split("_")[1])
voxel_idx = np.where(
    beta_maps[high_kappa_comp_val, :] == np.max(beta_maps[high_kappa_comp_val, :])
)[0][0]

rej_comp_tbl = comp_tbl.loc[comp_tbl["classification"] == "rejected"]
low_kappa_comp = rej_comp_tbl.sort_values(by="rho", ascending=False).index.values[0]

# load data
data = [masking.apply_mask(f, mask) for f in data_files]
ts = [d[:, voxel_idx] for d in data]
ts_1d = np.hstack(ts)

n_echoes = len(echo_times)
n_trs = data[0].shape[0]

pal = sns.color_palette("cubehelix", n_echoes)

Hide code cell content

# Prepare data for model
log_data = np.log(np.abs(ts_1d) + 1)
# log_data = np.log(ts_1d)  # in a perfect world...
x = np.column_stack([np.ones(n_echoes), -1 * echo_times])  # design: intercept and negative echo time
X = np.repeat(x, n_trs, axis=0)  # repeat each echo's row for every TR: shape (n_echoes * n_trs, 2)

# Model fit
betas = np.linalg.lstsq(X, log_data, rcond=None)[0]
s0 = np.exp(betas[0])
r2s = betas[1]
t2s = 1.0 / r2s

# Values for plots
# Values from log-linear model
log_x = np.arange(-1000, 0, 0.01)
log_y = betas[0] + log_x * betas[1]

# Values from monoexponential decay model
mono_x = np.arange(0, 1000, 0.01)
mono_y = np.exp(-1 * betas[1] * mono_x) * s0

# Get weights for optimal combination
alpha = echo_times * np.exp(-echo_times / t2s)
alpha = alpha / np.sum(alpha)  # unnecessary but good for bar plot below

# Combine data across echoes
oc_manual = np.average(np.vstack(ts), axis=0, weights=alpha)

Echo-specific timeseries#

Hide code cell content

fig, axes = plt.subplots(n_echoes, sharex=True, sharey=False, figsize=(14, 6))
for i_echo in range(n_echoes):
    axes[i_echo].plot(ts[i_echo], color=pal[i_echo])
    axes[i_echo].set_ylabel(
        f"{echo_times[i_echo]}ms", rotation=0, va="center", ha="right", fontsize=14
    )
    axes[i_echo].set_yticks([])
    axes[i_echo].set_xticks([])

axes[-1].set_xlabel("Time", fontsize=16)
axes[-1].set_xlim(0, len(ts[i_echo]) - 1)
fig.tight_layout()
glue("fig_echo_timeseries2", fig, display=False)

Echo-specific data and echo time#

Hide code cell content

fig, ax = plt.subplots(figsize=(14, 6))
values = [i[0] for i in ts]
for i_echo in range(n_echoes):
    rep_echo_times = np.ones(n_trs) * echo_times[i_echo]
    ax.scatter(rep_echo_times, ts[i_echo], alpha=0.05, color=pal[i_echo])

ax.set_ylabel("BOLD signal", fontsize=16)
ax.set_xlabel("Echo Time (ms)", fontsize=16)
ax.set_xticks(echo_times)
ax.tick_params(axis="both", which="major", labelsize=14)
ax.set_xlim(0, 120)
ax.set_ylim(0, 24000)
fig.tight_layout()
glue("fig_echo_scatter2", fig, display=False)

Adaptive mask#

Longer echo times are more susceptible to signal dropout, which means that certain brain regions (e.g., orbitofrontal cortex, temporal poles) will only have good signal for some echoes. In order to avoid using bad signal from affected echoes in calculating \(T_{2}^*\) and \(S_{0}\) for a given voxel, tedana generates an adaptive mask, where the value for each voxel is the number of echoes with “good” signal. When \(T_{2}^*\) and \(S_{0}\) are calculated below, each voxel’s values are only calculated from the first \(n\) echoes, where \(n\) is the value for that voxel in the adaptive mask.
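
As a rough illustration of the idea only (not tedana's actual algorithm, which lives in tedana.utils.make_adaptive_mask and applies its own thresholding rules), one can count, for each voxel, how many leading echoes keep their mean signal above some arbitrary fraction of the first echo's mean:

# Rough, hypothetical illustration of an adaptive mask; NOT tedana's algorithm.
import numpy as np

rng = np.random.default_rng(0)
n_echoes, n_voxels, n_trs = 4, 1000, 200
echo_data = rng.gamma(shape=5.0, scale=100.0, size=(n_echoes, n_voxels, n_trs))

mean_signal = echo_data.mean(axis=-1)        # (n_echoes, n_voxels)
good = mean_signal >= 0.1 * mean_signal[0]   # arbitrary "good signal" threshold

# Count the number of leading "good" echoes per voxel; cumprod zeroes out
# everything after the first "bad" echo
adaptive_mask = np.cumprod(good, axis=0).sum(axis=0)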

Hide code cell content

adaptive_mask_img = nb.load(adaptive_mask_file)

fig, ax = plt.subplots(figsize=(10, 4))
palette = sns.color_palette("BuGn_r", 10)
plotting.plot_stat_map(
    adaptive_mask_img,
    vmax=n_echoes,
    # alpha=0.5,
    threshold=1.0,
    draw_cross=False,
    colorbar=True,
    cmap="Blues",
    annotate=False,
    bg_img=bg_img,
    figure=fig,
    axes=ax,
)
glue("fig_adaptive_mask", fig, display=False)

Log-linear transformation#

Hide code cell content

fig, ax = plt.subplots(figsize=(14, 6))
for i_echo in range(n_echoes):
    rep_echo_times = -1 * np.ones(n_trs) * echo_times[i_echo]
    log_echo_data = np.log((np.abs(ts[i_echo]) + 1))
    ax.scatter(rep_echo_times, log_echo_data, alpha=0.05, color=pal[i_echo])

ax.set_ylabel("log(BOLD signal)", fontsize=16)
ax.set_xlabel("Negative Echo Time (ms)", fontsize=16)
ax.set_xticks(-1 * echo_times)
ax.set_xlim(-120, 0)
ax.set_ylim(4, 8)
ax.tick_params(axis="both", which="major", labelsize=14)

fig.tight_layout()
glue("fig_loglin_scatter", fig, display=False)

Log-linear model#

Let \(S\) be the BOLD signal for a given echo.

Let \(TE\) be the echo time in milliseconds.

(11)#\[\begin{split}\log_{e}(\left|\begin{pmatrix} S(TE_{1}) \\ S(TE_{2}) \\ \vdots \\ S(TE_{n})\end{pmatrix}\right| + \begin{pmatrix} 1 \\ 1 \\ \vdots \\ 1\end{pmatrix} ) = B_{1} \begin{pmatrix} -TE_{1} \\ -TE_{2} \\ \vdots \\ -TE_{n}\end{pmatrix} + \begin{pmatrix} B_{0} \\ B_{0} \\ \vdots \\ B_{0}\end{pmatrix}\end{split}\]

Hide code cell content

fig, ax = plt.subplots(figsize=(14, 6))
for i_echo in range(n_echoes):
    rep_echo_times = -1 * np.ones(n_trs) * echo_times[i_echo]
    log_echo_data = np.log((np.abs(ts[i_echo]) + 1))
    ax.scatter(rep_echo_times, log_echo_data, alpha=0.05, color=pal[i_echo])

ax.plot(log_x, log_y)

ax.set_ylabel("log(BOLD signal)", fontsize=16)
ax.set_xlabel("Negative Echo Time (ms)", fontsize=16)
ax.set_xticks(-1 * echo_times)
ax.set_xlim(-120, 0)
ax.set_ylim(5, 8)
ax.tick_params(axis="both", which="major", labelsize=14)

ax.annotate(
    "$B_0$: {0:.02f}\n$B_1$: {1:.02f}".format(betas[0], betas[1]),
    xy=(-120, 9.5),
    fontsize=16,
    bbox=dict(fc="white", ec="black", lw=1),
)

fig.tight_layout()
glue("fig_loglin_scatter_with_line", fig, display=False)

Monoexponential decay model#

Calculation of \(S_{0}\) and \(T_{2}^{*}\)

(12)#\[S_{0} = e^{B_{0}}\]
(13)#\[T_{2}^{*} = \frac{1}{B_{1}}\]

Hide code cell content

fig, ax = plt.subplots(figsize=(14, 6))
for i_echo in range(n_echoes):
    rep_echo_times = np.ones(n_trs) * echo_times[i_echo]
    ax.scatter(rep_echo_times, ts[i_echo], alpha=0.05, color=pal[i_echo])

ax.plot(mono_x, mono_y)

ax.set_ylabel("BOLD signal", fontsize=16)
ax.set_xlabel("Echo Time (ms)", fontsize=16)
ax.set_xticks(echo_times)
ax.set_xlim(0, 120)
ax.set_ylim(0, 24000)
ax.tick_params(axis="both", which="major", labelsize=14)
ax.annotate(
    "$S_0$: {0:.02f}\n$T_2^*$: {1:.02f}".format(s0, t2s),
    xy=(86.5, 13500),
    fontsize=16,
    bbox=dict(fc="white", ec="black", lw=1),
)

fig.tight_layout()
glue("fig_loglin_scatter_with_t2s", fig, display=False)

T2*#

Hide code cell content

fig, ax = plt.subplots(figsize=(14, 6))
for i_echo in range(n_echoes):
    rep_echo_times = np.ones(n_trs) * echo_times[i_echo]
    ax.scatter(rep_echo_times, ts[i_echo], alpha=0.05, color=pal[i_echo])

ax.plot(mono_x, mono_y)

ax.axvline(t2s, 0, 1, label="$T_2^*$", color="black", linestyle="--", alpha=0.5)
ax.set_ylabel("BOLD signal", fontsize=16)
ax.set_xlabel("Echo Time (ms)", fontsize=16)
ax.set_xticks(np.hstack((echo_times, [np.round(t2s, 1)])))
ax.set_xlim(0, 120)
ax.set_ylim(0, 24000)
ax.tick_params(axis="both", which="major", labelsize=14)
ax.xaxis.get_major_ticks()[-1].set_pad(20)

legend = ax.legend(frameon=True, fontsize=16)

fig.tight_layout()
glue("fig_scatter_with_t2s", fig, display=False)

Optimal combination weights#

Hide code cell content

fig, ax = plt.subplots()
sns.barplot(x=echo_times, y=alpha, ax=ax, palette=pal)
ax.set_ylabel("Weight", fontsize=16)
ax.set_xlabel("Echo Time (ms)", fontsize=16)
ax.tick_params(axis="both", which="major", labelsize=14)
fig.tight_layout()
glue("fig_optcom_weights", fig, display=False)

Optimally combined timeseries#

Hide code cell content

fig, ax = plt.subplots(figsize=(14, 6))
for i_echo in range(n_echoes):
    rep_echo_times = np.ones(n_trs) * echo_times[i_echo]
    ax.scatter(rep_echo_times, ts[i_echo], alpha=0.05, color=pal[i_echo])

ax.plot(mono_x, mono_y)

# Optimal combination
rep_t2s = np.ones(n_trs) * t2s
ax.scatter(
    rep_t2s, oc_manual, alpha=0.9, color="red", label="Optimally\ncombined\ndata"
)

ax.axvline(t2s, 0, 20000, label="$T_2^*$", color="black", linestyle="--", alpha=0.5)
ax.set_ylabel("BOLD signal", fontsize=16)
ax.set_xlabel("Echo Time (ms)", fontsize=16)
ax.set_xticks(np.hstack((echo_times, [np.round(t2s, 1)])))
ax.set_xlim(0, 120)
ax.set_ylim(0, 24000)
ax.tick_params(axis="both", which="major", labelsize=14)
ax.xaxis.get_major_ticks()[-1].set_pad(20)

legend = ax.legend(frameon=True, fontsize=16)

fig.tight_layout()
glue("fig_scatter_with_optcom", fig, display=False)

Echo-specific and optimally combined timeseries#

Hide code cell content

fig, axes = plt.subplots(n_echoes + 1, sharex=True, sharey=False, figsize=(14, 6))
for i_echo in range(n_echoes):
    axes[i_echo].plot(ts[i_echo], color=pal[i_echo])
    axes[i_echo].set_ylabel(
        f"{echo_times[i_echo]}ms", rotation=0, va="center", ha="right", fontsize=14
    )
    axes[i_echo].set_yticks([])
    axes[i_echo].set_xticks([])

axes[-1].plot(oc_manual, color="red")
axes[-1].set_ylabel(
    "Optimally\ncombined\ndata", rotation=0, va="center", ha="right", fontsize=14
)
axes[-1].set_xlabel("Time", fontsize=16)
axes[-1].set_yticks([])
axes[-1].set_xticks([])
axes[-1].set_xlim(0, len(ts[i_echo]) - 1)
axes[-1].tick_params(axis="both", which="major", labelsize=14)
fig.tight_layout()
glue("fig_echo_timeseries_with_optcom", fig, display=False)

Multi-Echo Principal Components Analysis#

Optimally combined data are decomposed with PCA. Components are then retained according to one of several possible criteria; two examples are a decision tree and a threshold on the percentage of variance explained by each component.
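
A minimal sketch of the variance-explained criterion, using scikit-learn's PCA on hypothetical data (this is only one of the criteria tedana supports):

# Minimal sketch of PCA component selection by cumulative variance explained.
import numpy as np
from sklearn.decomposition import PCA

rng = np.random.default_rng(0)
optcom_data = rng.standard_normal((200, 1000))  # hypothetical (n_trs, n_voxels) data

pca = PCA()
pca_mixing = pca.fit_transform(optcom_data)     # component time series, (n_trs, n_comps)

# Retain the smallest number of components explaining, e.g., 95% of the variance
cum_var = np.cumsum(pca.explained_variance_ratio_)
n_keep = int(np.searchsorted(cum_var, 0.95) + 1)
kept_mixing = pca_mixing[:, :n_keep]
print(f"Retained {n_keep} of {pca_mixing.shape[1]} components")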

Hide code cell content

fig, axes = plt.subplots(3, sharex=True, figsize=(14, 6))
axes[-1].set_xlim(0, mepca_mmix.shape[0] - 1)
axes[-1].set_xticks([])
axes[-1].set_xlabel("Time", fontsize=16)

for comp_to_plot in [0, 1, 2]:
    axes[comp_to_plot].plot(mepca_mmix[:, comp_to_plot])
    axes[comp_to_plot].set_title(f"PCA Component {comp_to_plot}", fontsize=16)
    axes[comp_to_plot].tick_params(axis="both", which="major", labelsize=12)

fig.tight_layout()
glue("fig_pca_timeseries", fig, display=False)

Data Whitening#

The retained PCA components are recombined to produce a dimensionally reduced, whitened version of the optimally combined data.
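
A minimal, hypothetical sketch of that recombination: project the data onto the retained component time series and rebuild it from those projections (in tedana this reduced dataset corresponds to the desc-optcom_whitened_bold output loaded above).

# Minimal sketch: rebuild a dimensionally reduced version of the data from
# retained component time series (hypothetical arrays and shapes).
import numpy as np

rng = np.random.default_rng(0)
optcom_data = rng.standard_normal((200, 1000))  # (n_trs, n_voxels), hypothetical
kept_mixing = rng.standard_normal((200, 20))    # retained PCA time series, hypothetical

# Least-squares spatial weights for each retained component
weights, *_ = np.linalg.lstsq(kept_mixing, optcom_data, rcond=None)

# Recombining the retained components approximates the data with reduced dimensionality
reduced_optcom = kept_mixing @ weights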

Hide code cell content

fig, ax = plt.subplots(figsize=(14, 6))
ax.plot(oc_red[:, voxel_idx], label="Dimensionally reduced timeseries", zorder=1.0)
ax.plot(
    oc_z[:, voxel_idx], label="Original timeseries", alpha=0.5, zorder=0.0, linewidth=3
)
legend = ax.legend(frameon=True, fontsize=16, loc="upper right", framealpha=1)
ax.set_xlim(0, oc_z.shape[0] - 1)
ax.set_xticks([])
ax.set_xlabel("Time", fontsize=16)
ax.tick_params(axis="both", which="major", labelsize=14)
glue("fig_optcom_reduced_timeseries", fig, display=False)

Multi-Echo Independent Components Analysis#

The whitened optimally combined data are then decomposed with ICA. The number of ICA components is limited to the number of components retained from the PCA, so that the decomposition reflects the estimated dimensionality of the data. ICA produces a mixing matrix (i.e., a time series for each component).
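
A minimal sketch of this step using scikit-learn's FastICA on hypothetical data (tedana's ICA step adds restarts and other options around this, so treat the call below as illustrative only):

# Minimal sketch of the ICA step on hypothetical whitened data; the number of
# components matches the PCA-retained dimensionality.
import numpy as np
from sklearn.decomposition import FastICA

rng = np.random.default_rng(0)
reduced_optcom = rng.standard_normal((200, 1000))  # hypothetical (n_trs, n_voxels)
n_keep = 20                                        # hypothetical PCA dimensionality

ica = FastICA(n_components=n_keep, max_iter=500, random_state=0)
ica_mixing = ica.fit_transform(reduced_optcom)     # mixing matrix: (n_trs, n_keep)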

Hide code cell content

fig, axes = plt.subplots(3, sharex=True, figsize=(14, 6))

comps_to_plot = [high_kappa_comp, low_kappa_comp, "ICA_00"]

for i_comp, comp_to_plot in enumerate(comps_to_plot):
    idx = int(comp_to_plot.split("_")[1])
    k = comp_tbl.loc[comp_to_plot, "kappa"]
    r = comp_tbl.loc[comp_to_plot, "rho"]
    c = comp_tbl.loc[comp_to_plot, "classification"]
    axes[i_comp].plot(meica_mmix[:, idx])
    axes[i_comp].set_title(
        "ICA Component {0}; $\\kappa$ = {1:.02f}; $\\rho$ = {2:.02f}; {3}".format(
            comp_to_plot, k, r, c
        ),
        fontsize=16,
    )

axes[0].set_xlim(0, meica_mmix.shape[0] - 1)
axes[2].set_xticks([])
axes[2].set_xlabel("Time", fontsize=16)
axes[0].tick_params(axis="both", which="major", labelsize=12)
axes[1].tick_params(axis="both", which="major", labelsize=12)
axes[2].tick_params(axis="both", which="major", labelsize=12)
fig.tight_layout()
glue("fig_ica_timeseries", fig, display=False)

\(R_2\) and \(S_0\) Model Fit#

Linear regression is used to fit each component's time series to every voxel in each echo of the original, echo-specific data. This yields echo- and voxel-specific parameter estimates (betas) for each component. TE-dependence (\(R_2\)) and TE-independence (\(S_0\)) models can then be fit to these echo-wise betas.

These model fits yield voxel-wise F-statistics for the \(R_2\) and \(S_0\) models, which are averaged across voxels (weighted by the component maps) to produce the component-level metrics \(\kappa\) and \(\rho\), respectively.

Note that the values shown here are for a single voxel (the most strongly weighted voxel for each component), whereas \(\kappa\) and \(\rho\) summarize all voxels.
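
A simplified, per-voxel sketch of those model fits, assuming (as a rough approximation, not tedana's exact implementation) that the \(S_0\) model predicts the echo-wise betas as proportional to the echo-wise mean signal and the \(R_2\) model predicts them as proportional to \(TE\) times the mean signal:

# Simplified per-voxel sketch of the TE-independence (S0) and TE-dependence (R2)
# model fits; the design vectors below are a rough approximation.
import numpy as np

echo_times = np.array([14.0, 38.0, 62.0, 86.0])     # ms, hypothetical
mean_signal = 10000.0 * np.exp(-echo_times / 30.0)  # hypothetical mean signal per echo

rng = np.random.default_rng(0)
# Hypothetical component betas that scale with TE * mean signal (BOLD-like pattern)
betas = 0.003 * echo_times * mean_signal + rng.normal(0, 50, size=echo_times.size)


def one_regressor_f(y, design):
    """F-statistic for a single-regressor, no-intercept least-squares fit."""
    coef = (y * design).sum() / (design**2).sum()
    sse = ((y - coef * design) ** 2).sum()
    ssq = (y**2).sum()
    dof = y.size - 1
    return (ssq - sse) * dof / sse


f_s0 = one_regressor_f(betas, mean_signal)                # TE-independence model
f_r2 = one_regressor_f(betas, -echo_times * mean_signal)  # TE-dependence model
print(f"F(S0) = {f_s0:.1f}, F(R2) = {f_r2:.1f}")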

Hide code cell content

fig, axes = plt.subplots(3, sharex=True, figsize=(14, 9))
axes[-1].set_xticks(echo_times)
axes[-1].tick_params(axis="both", which="major", labelsize=12)
axes[-1].set_xlabel("Echo Time (ms)", fontsize=16)

for i_comp, comp in enumerate(
    comps_to_plot
):  # only generate plots for a few components
    # Index arrays by the component's actual number (e.g., "ICA_03" -> 3),
    # not by its position in comps_to_plot
    comp_idx = int(comp.split("_")[1])
    comp_voxel_idx = np.where(
        beta_maps[comp_idx, :] == np.max(beta_maps[comp_idx, :])
    )[0][0]
    # Use weight map to average as fitmodels_direct does
    comp_weights = meica_betas[comp_voxel_idx, :, comp_idx]
    r2_pred_weights = r2_pred_betas[comp_voxel_idx, :, comp_idx]
    s0_pred_weights = s0_pred_betas[comp_voxel_idx, :, comp_idx]

    axes[i_comp].plot(
        echo_times,
        comp_weights,
        c="black",
        alpha=0.5,
        linewidth=5,
        label="Component PEs",
    )
    axes[i_comp].plot(
        echo_times, r2_pred_weights, c="blue", label="Predicted T2* model values"
    )
    axes[i_comp].plot(
        echo_times, s0_pred_weights, c="red", label="Predicted S0 model values"
    )

    # Set yticklabels
    temp = np.hstack((comp_weights, s0_pred_weights, r2_pred_weights))
    lim = np.mean(temp) * 0.05
    axes[i_comp].set_ylim(np.floor(np.min(temp)) - lim, np.ceil(np.max(temp)) + lim)
    legend = axes[i_comp].legend(frameon=True, fontsize=14, ncol=3)
    axes[i_comp].set_title(f"ICA Component {comp}", fontsize=16)

fig.tight_layout()
glue("fig_ica_weights", fig, display=False)

ICA Component Selection and Multi-Echo Denoising#

A decision tree is applied to \(\kappa\), \(\rho\), and other metrics in order to classify ICA components as TE-dependent (BOLD signal), TE-independent (non-BOLD noise), or neither (to be ignored).
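
A deliberately oversimplified sketch of such a classification, using made-up metrics and an arbitrary threshold (the real tedana decision trees use elbow-based thresholds, variance explained, and several additional metrics):

# Oversimplified, hypothetical classification: accept components whose kappa
# exceeds both rho and an arbitrary threshold. NOT the real decision tree.
import pandas as pd

toy_tbl = pd.DataFrame(
    {"kappa": [150.0, 40.0, 90.0], "rho": [30.0, 120.0, 85.0]},
    index=["ICA_00", "ICA_01", "ICA_02"],
)
kappa_thresh = 60.0  # hypothetical elbow-like threshold

toy_tbl["classification"] = "rejected"
is_bold = (toy_tbl["kappa"] > kappa_thresh) & (toy_tbl["kappa"] > toy_tbl["rho"])
toy_tbl.loc[is_bold, "classification"] = "accepted"
print(toy_tbl)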

The ICA component time series are fit to the original (not whitened) optimally combined data with linear regression, and the resulting parameter estimates are used to weight the components when the denoised data are constructed. The residuals from this regression therefore contain the variance that was removed when the optimally combined data were whitened with PCA.

The ME-DN dataset is constructed from the accepted (BOLD) and ignored components, plus the residual variance not explained by the ICA. The ME-HK dataset is constructed from the accepted (BOLD) components only, so ignored components and residual variance not explained by the ICA are excluded from it.
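
A minimal sketch of both constructions on hypothetical arrays (tedana's implementation includes additional bookkeeping beyond this):

# Minimal sketch of ME-DN and ME-HK construction from hypothetical arrays.
import numpy as np

rng = np.random.default_rng(0)
n_trs, n_voxels, n_comps = 200, 1000, 10
optcom_data = rng.standard_normal((n_trs, n_voxels))  # not-whitened optimally combined data
ica_mixing = rng.standard_normal((n_trs, n_comps))    # ICA component time series
accepted = np.array([0, 2, 5])                        # hypothetical accepted components
rejected = np.array([1, 3, 4, 6, 7, 8, 9])            # hypothetical rejected components

# Fit all component time series to the optimally combined data
comp_betas, *_ = np.linalg.lstsq(ica_mixing, optcom_data, rcond=None)  # (n_comps, n_voxels)

# ME-DN: remove only the rejected components (residual variance is retained)
medn_data = optcom_data - ica_mixing[:, rejected] @ comp_betas[rejected, :]

# ME-HK: keep only the accepted components (residual variance is discarded)
mehk_data = ica_mixing[:, accepted] @ comp_betas[accepted, :]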

Hide code cell content

dn_data_z = (dn_data - np.mean(dn_data, axis=0)) / np.std(dn_data, axis=0)
hk_data_z = (hk_data - np.mean(hk_data, axis=0)) / np.std(hk_data, axis=0)

fig, axes = plt.subplots(3, sharex=True, figsize=(14, 6))
axes[0].plot(oc_z[:, voxel_idx], label="Optimally combined")
axes[0].set_title("Optimally combined", fontsize=16)

axes[1].plot(dn_data_z[:, voxel_idx], label="ME-DN")
axes[1].set_title("ME-DN", fontsize=16)

axes[2].plot(hk_data_z[:, voxel_idx])
axes[2].set_title("ME-HK", fontsize=16)
legend = ax.legend(frameon=True)
axes[0].set_xlim(0, oc_z.shape[0] - 1)
axes[2].set_xticks([])
axes[2].set_xlabel("Time", fontsize=16)
axes[0].tick_params(axis="both", which="major", labelsize=12)
axes[1].tick_params(axis="both", which="major", labelsize=12)
axes[2].tick_params(axis="both", which="major", labelsize=12)
fig.tight_layout()

glue("fig_medn_timeseries", fig, display=False)

Post-processing to remove spatially diffuse noise#

Due to the constraints of ICA, MEICA can identify and remove spatially localized noise components, but it cannot isolate noise that is spread diffusely across the whole brain.

One of several post-processing strategies may be applied to the ME-DN or ME-HK datasets in order to remove spatially diffuse (ostensibly respiration-related) noise. Methods that have been employed in the past include global signal regression (GSR), minimum image regression (MIR), anatomical CompCor, GO decomposition (GODEC), and robust PCA.
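
As an example, a minimal sketch of the simplest of these strategies, global signal regression, on hypothetical data (the tedana outputs plotted below instead use the MIR-denoised files loaded above):

# Minimal sketch of global signal regression (GSR) on hypothetical data.
import numpy as np

rng = np.random.default_rng(0)
denoised = rng.standard_normal((200, 1000))            # hypothetical (n_trs, n_voxels)

global_signal = denoised.mean(axis=1, keepdims=True)   # mean time series across voxels
design = np.column_stack([np.ones(denoised.shape[0]), global_signal])
gsr_betas, *_ = np.linalg.lstsq(design, denoised, rcond=None)

# Subtract only the global-signal fit (keep the intercept/mean)
denoised_gsr = denoised - global_signal @ gsr_betas[1:2, :]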

Hide code cell content

dn_t1c_data_z = (dn_t1c_data - np.mean(dn_t1c_data, axis=0)) / np.std(
    dn_t1c_data, axis=0
)
hk_t1c_data_z = (hk_t1c_data - np.mean(hk_t1c_data, axis=0)) / np.std(
    hk_t1c_data, axis=0
)

fig, axes = plt.subplots(2, sharex=True, figsize=(14, 6))
axes[0].plot(dn_t1c_data_z[:, voxel_idx], label="ME-DN T1c")
axes[0].plot(dn_data_z[:, voxel_idx], label="ME-DN", alpha=0.5, linewidth=3, zorder=0.0)
axes[0].set_title("ME-DN", fontsize=16)
legend = axes[0].legend(frameon=True, loc="upper right")

axes[1].plot(hk_t1c_data_z[:, voxel_idx], label="ME-HK T1c")
axes[1].plot(hk_data_z[:, voxel_idx], label="ME-HK", alpha=0.5, linewidth=3, zorder=0.0)
axes[1].set_title("ME-HK", fontsize=16)
legend = axes[1].legend(frameon=True)
axes[0].set_xlim(0, oc_z.shape[0] - 1)
axes[1].set_xticks([])
axes[1].set_xlabel("Time", fontsize=16)
axes[0].tick_params(axis="both", which="major", labelsize=12)
axes[1].tick_params(axis="both", which="major", labelsize=12)
fig.tight_layout()
glue("fig_mir_timeseries", fig, display=False)