From 91835ffa924afa0d9d9a51135312c875c85061e4 Mon Sep 17 00:00:00 2001 From: Gab-D-G Date: Thu, 21 Sep 2023 17:28:41 -0400 Subject: [PATCH 1/7] token data is now generated from a function. --- scripts/error_check_rabies.py | 107 ++++++++++++++++++---------------- 1 file changed, 57 insertions(+), 50 deletions(-) diff --git a/scripts/error_check_rabies.py b/scripts/error_check_rabies.py index ad5e618..cc11467 100755 --- a/scripts/error_check_rabies.py +++ b/scripts/error_check_rabies.py @@ -14,47 +14,54 @@ else: tmppath = tempfile.mkdtemp() -os.makedirs(tmppath+'/inputs', exist_ok=True) - -if 'XDG_DATA_HOME' in os.environ.keys(): - rabies_path = os.environ['XDG_DATA_HOME']+'/rabies' -else: - rabies_path = os.environ['HOME']+'/.local/share/rabies' - -template = f"{rabies_path}/DSURQE_40micron_average.nii.gz" -mask = f"{rabies_path}/DSURQE_40micron_mask.nii.gz" - -img = sitk.ReadImage(template) -spacing = (float(1), float(1), float(1)) # resample to 1mmx1mmx1mm -resampled = resample_image_spacing(sitk.ReadImage(template), spacing) -array = sitk.GetArrayFromImage(resampled) -array_4d = np.repeat(array[np.newaxis, :, :, :], 15, axis=0) -array_4d += np.random.normal(0, array_4d.mean() - / 100, array_4d.shape) # add gaussian noise -sitk.WriteImage(resampled, tmppath+'/inputs/sub-token_T1w.nii.gz') -sitk.WriteImage(resampled, tmppath+'/inputs/sub-token2_T1w.nii.gz') -sitk.WriteImage(resampled, tmppath+'/inputs/sub-token3_T1w.nii.gz') -sitk.WriteImage(sitk.GetImageFromArray(array_4d, isVector=False), - tmppath+'/inputs/sub-token_bold.nii.gz') - -resampled = resample_image_spacing(sitk.ReadImage(mask), spacing) -array = sitk.GetArrayFromImage(resampled) -array[array < 1] = 0 -array[array > 1] = 1 -binarized = sitk.GetImageFromArray(array, isVector=False) -binarized.CopyInformation(resampled) -sitk.WriteImage(binarized, tmppath+'/inputs/token_mask.nii.gz') -array[:, :, :6] = 0 -binarized = sitk.GetImageFromArray(array, isVector=False) -binarized.CopyInformation(resampled) -sitk.WriteImage(binarized, tmppath+'/inputs/token_mask_half.nii.gz') - - -sitk.WriteImage(copyInfo_4DImage(sitk.ReadImage(tmppath+'/inputs/sub-token_bold.nii.gz'), sitk.ReadImage(tmppath - + '/inputs/sub-token_T1w.nii.gz'), sitk.ReadImage(tmppath+'/inputs/sub-token_bold.nii.gz')), tmppath+'/inputs/sub-token_bold.nii.gz') +def generate_token_data(tmppath, number_scans): + + os.makedirs(tmppath+'/inputs', exist_ok=True) + + if 'XDG_DATA_HOME' in os.environ.keys(): + rabies_path = os.environ['XDG_DATA_HOME']+'/rabies' + else: + rabies_path = os.environ['HOME']+'/.local/share/rabies' + + template = f"{rabies_path}/DSURQE_40micron_average.nii.gz" + mask = f"{rabies_path}/DSURQE_40micron_mask.nii.gz" + + spacing = (float(1), float(1), float(1)) # resample to 1mmx1mmx1mm + resampled_template = resample_image_spacing(sitk.ReadImage(template), spacing) + # generate template masks + resampled_mask = resample_image_spacing(sitk.ReadImage(mask), spacing) + array = sitk.GetArrayFromImage(resampled_mask) + array[array < 1] = 0 + array[array > 1] = 1 + binarized = sitk.GetImageFromArray(array, isVector=False) + binarized.CopyInformation(resampled_mask) + sitk.WriteImage(binarized, tmppath+'/inputs/token_mask.nii.gz') + array[:, :, :6] = 0 + binarized = sitk.GetImageFromArray(array, isVector=False) + binarized.CopyInformation(resampled_mask) + sitk.WriteImage(binarized, tmppath+'/inputs/token_mask_half.nii.gz') + + # generate fake scans from the template + array = sitk.GetArrayFromImage(resampled_template) + array_4d = np.repeat(array[np.newaxis, :, :, :], 15, axis=0) + + for i in range(number_scans): + # generate anatomical scan + sitk.WriteImage(resampled_template, tmppath+f'/inputs/sub-token{i+1}_T1w.nii.gz') + # generate functional scan + array_4d_ = array_4d + np.random.normal(0, array_4d.mean() + / 100, array_4d.shape) # add gaussian noise + sitk.WriteImage(sitk.GetImageFromArray(array_4d_, isVector=False), + tmppath+f'/inputs/sub-token{i+1}_bold.nii.gz') + + sitk.WriteImage(copyInfo_4DImage(sitk.ReadImage(tmppath+f'/inputs/sub-token{i+1}_bold.nii.gz'), sitk.ReadImage(tmppath + + f'/inputs/sub-token{i+1}_T1w.nii.gz'), sitk.ReadImage(tmppath+f'/inputs/sub-token{i+1}_bold.nii.gz')), tmppath+f'/inputs/sub-token{i+1}_bold.nii.gz') + + +generate_token_data(tmppath, number_scans=1) command = f"rabies --verbose 1 preprocess {tmppath}/inputs {tmppath}/outputs --anat_inho_cor method=disable,otsu_thresh=2,multiotsu=false --bold_inho_cor method=disable,otsu_thresh=2,multiotsu=false \ - --anat_template {tmppath}/inputs/sub-token_T1w.nii.gz --brain_mask {tmppath}/inputs/token_mask.nii.gz --WM_mask {tmppath}/inputs/token_mask.nii.gz --CSF_mask {tmppath}/inputs/token_mask.nii.gz --vascular_mask {tmppath}/inputs/token_mask.nii.gz --labels {tmppath}/inputs/token_mask.nii.gz \ + --anat_template {tmppath}/inputs/sub-token1_T1w.nii.gz --brain_mask {tmppath}/inputs/token_mask.nii.gz --WM_mask {tmppath}/inputs/token_mask.nii.gz --CSF_mask {tmppath}/inputs/token_mask.nii.gz --vascular_mask {tmppath}/inputs/token_mask.nii.gz --labels {tmppath}/inputs/token_mask.nii.gz \ --bold2anat_coreg registration=no_reg,masking=false,brain_extraction=false --commonspace_reg masking=false,brain_extraction=false,fast_commonspace=true,template_registration=no_reg --data_type int16 --bold_only --detect_dummy \ --tpattern seq-z --apply_STC --voxelwise_motion --isotropic_HMC" process = subprocess.run( @@ -65,7 +72,7 @@ shutil.rmtree(f'{tmppath}/outputs/') command = f"rabies --verbose 1 preprocess {tmppath}/inputs {tmppath}/outputs --anat_inho_cor method=disable,otsu_thresh=2,multiotsu=false --bold_inho_cor method=disable,otsu_thresh=2,multiotsu=false \ - --anat_template {tmppath}/inputs/sub-token_T1w.nii.gz --brain_mask {tmppath}/inputs/token_mask.nii.gz --WM_mask {tmppath}/inputs/token_mask.nii.gz --CSF_mask {tmppath}/inputs/token_mask.nii.gz --vascular_mask {tmppath}/inputs/token_mask.nii.gz --labels {tmppath}/inputs/token_mask.nii.gz \ + --anat_template {tmppath}/inputs/sub-token1_T1w.nii.gz --brain_mask {tmppath}/inputs/token_mask.nii.gz --WM_mask {tmppath}/inputs/token_mask.nii.gz --CSF_mask {tmppath}/inputs/token_mask.nii.gz --vascular_mask {tmppath}/inputs/token_mask.nii.gz --labels {tmppath}/inputs/token_mask.nii.gz \ --bold2anat_coreg registration=no_reg,masking=true,brain_extraction=true --commonspace_reg masking=true,brain_extraction=true,fast_commonspace=true,template_registration=no_reg --data_type int16 \ --HMC_option 0" process = subprocess.run( @@ -81,19 +88,19 @@ shell=True, ) -### Add subjects for the group analysis to run -array_4d += np.random.normal(0, array_4d.mean() - / 100, array_4d.shape) # add gaussian noise -sitk.WriteImage(sitk.GetImageFromArray(array_4d, isVector=False), - tmppath+'/inputs/sub-token2_bold.nii.gz') -array_4d += np.random.normal(0, array_4d.mean() - / 100, array_4d.shape) # add gaussian noise -sitk.WriteImage(sitk.GetImageFromArray(array_4d, isVector=False), - tmppath+'/inputs/sub-token3_bold.nii.gz') +#command = f"rabies --verbose 1 analysis {tmppath}/outputs {tmppath}/outputs --data_diagnosis" +#process = subprocess.run( +# command, +# check=True, +# shell=True, +# ) + +shutil.rmtree(f'{tmppath}/inputs/') +generate_token_data(tmppath, number_scans=3) shutil.rmtree(f'{tmppath}/outputs/') command = f"rabies --verbose 1 preprocess {tmppath}/inputs {tmppath}/outputs --anat_inho_cor method=disable,otsu_thresh=2,multiotsu=false --bold_inho_cor method=disable,otsu_thresh=2,multiotsu=false \ - --anat_template {tmppath}/inputs/sub-token_T1w.nii.gz --brain_mask {tmppath}/inputs/token_mask.nii.gz --WM_mask {tmppath}/inputs/token_mask_half.nii.gz --CSF_mask {tmppath}/inputs/token_mask_half.nii.gz --vascular_mask {tmppath}/inputs/token_mask_half.nii.gz --labels {tmppath}/inputs/token_mask.nii.gz \ + --anat_template {tmppath}/inputs/sub-token1_T1w.nii.gz --brain_mask {tmppath}/inputs/token_mask.nii.gz --WM_mask {tmppath}/inputs/token_mask_half.nii.gz --CSF_mask {tmppath}/inputs/token_mask_half.nii.gz --vascular_mask {tmppath}/inputs/token_mask_half.nii.gz --labels {tmppath}/inputs/token_mask.nii.gz \ --bold2anat_coreg registration=no_reg,masking=false,brain_extraction=false --commonspace_reg masking=false,brain_extraction=false,fast_commonspace=true,template_registration=no_reg --data_type int16 \ --HMC_option 0" process = subprocess.run( From 705eca90be9ecf8c3989d47116ce42b29e00aab8 Mon Sep 17 00:00:00 2001 From: Gab-D-G Date: Fri, 22 Sep 2023 14:41:41 -0400 Subject: [PATCH 2/7] Setup of a debugging workflow. The workflow can be executed from python by providing a set of arguments (example in debug_workflow.py). A function to generate token data was moved to rabies.utils. --- rabies/parser.py | 7 ++- rabies/run_main.py | 4 +- rabies/utils.py | 50 ++++++++++++++++ scripts/debug_workflow.py | 105 +++++----------------------------- scripts/error_check_rabies.py | 48 +--------------- 5 files changed, 73 insertions(+), 141 deletions(-) diff --git a/rabies/parser.py b/rabies/parser.py index a287716..f20baf6 100644 --- a/rabies/parser.py +++ b/rabies/parser.py @@ -958,8 +958,11 @@ def get_parser(): return parser -def read_parser(parser): - opts = parser.parse_args() +def read_parser(parser, args): + if args is None: + opts = parser.parse_args() + else: + opts = parser.parse_args(args) if opts.rabies_stage == 'preprocess': opts.anat_inho_cor = parse_argument(opt=opts.anat_inho_cor, diff --git a/rabies/run_main.py b/rabies/run_main.py index 494b254..0503557 100644 --- a/rabies/run_main.py +++ b/rabies/run_main.py @@ -11,10 +11,10 @@ rabies_path = os.environ['HOME']+'/.local/share/rabies' -def execute_workflow(): +def execute_workflow(args=None): # generates the parser CLI and execute the workflow based on specified parameters. parser = get_parser() - opts = read_parser(parser) + opts = read_parser(parser, args) try: # convert the output path to absolute if not already the case opts.output_dir = os.path.abspath(str(opts.output_dir)) diff --git a/rabies/utils.py b/rabies/utils.py index bff9272..d14dd4a 100644 --- a/rabies/utils.py +++ b/rabies/utils.py @@ -437,3 +437,53 @@ def fill_node_dict(d, key_l, e): return d else: return e + + +###################### +#DEBUGGING +###################### + +def generate_token_data(tmppath, number_scans): + # this function generates fake scans at low resolution for quick testing and debugging + + os.makedirs(tmppath+'/inputs', exist_ok=True) + + if 'XDG_DATA_HOME' in os.environ.keys(): + rabies_path = os.environ['XDG_DATA_HOME']+'/rabies' + else: + rabies_path = os.environ['HOME']+'/.local/share/rabies' + + template = f"{rabies_path}/DSURQE_40micron_average.nii.gz" + mask = f"{rabies_path}/DSURQE_40micron_mask.nii.gz" + + spacing = (float(1), float(1), float(1)) # resample to 1mmx1mmx1mm + resampled_template = resample_image_spacing(sitk.ReadImage(template), spacing) + # generate template masks + resampled_mask = resample_image_spacing(sitk.ReadImage(mask), spacing) + array = sitk.GetArrayFromImage(resampled_mask) + array[array < 1] = 0 + array[array > 1] = 1 + binarized = sitk.GetImageFromArray(array, isVector=False) + binarized.CopyInformation(resampled_mask) + sitk.WriteImage(binarized, tmppath+'/inputs/token_mask.nii.gz') + array[:, :, :6] = 0 + binarized = sitk.GetImageFromArray(array, isVector=False) + binarized.CopyInformation(resampled_mask) + sitk.WriteImage(binarized, tmppath+'/inputs/token_mask_half.nii.gz') + + # generate fake scans from the template + array = sitk.GetArrayFromImage(resampled_template) + array_4d = np.repeat(array[np.newaxis, :, :, :], 15, axis=0) + + for i in range(number_scans): + # generate anatomical scan + sitk.WriteImage(resampled_template, tmppath+f'/inputs/sub-token{i+1}_T1w.nii.gz') + # generate functional scan + array_4d_ = array_4d + np.random.normal(0, array_4d.mean() + / 100, array_4d.shape) # add gaussian noise + sitk.WriteImage(sitk.GetImageFromArray(array_4d_, isVector=False), + tmppath+f'/inputs/sub-token{i+1}_bold.nii.gz') + + # necessary to read matrix orientation properly at the analysis stage + sitk.WriteImage(copyInfo_4DImage(sitk.ReadImage(tmppath+f'/inputs/sub-token{i+1}_bold.nii.gz'), sitk.ReadImage(tmppath + + f'/inputs/sub-token{i+1}_T1w.nii.gz'), sitk.ReadImage(tmppath+f'/inputs/sub-token{i+1}_bold.nii.gz')), tmppath+f'/inputs/sub-token{i+1}_bold.nii.gz') diff --git a/scripts/debug_workflow.py b/scripts/debug_workflow.py index 87241e3..24431c4 100644 --- a/scripts/debug_workflow.py +++ b/scripts/debug_workflow.py @@ -1,65 +1,25 @@ #! /usr/bin/env python -import SimpleITK as sitk -import os -import sys -import numpy as np -import tempfile -import shutil -from rabies.utils import resample_image_spacing, copyInfo_4DImage - -if len(sys.argv) == 2: - tmppath = sys.argv[1] -else: - tmppath = tempfile.mkdtemp() - -os.makedirs(tmppath+'/inputs', exist_ok=True) - -if 'XDG_DATA_HOME' in os.environ.keys(): - rabies_path = os.environ['XDG_DATA_HOME']+'/rabies' -else: - rabies_path = os.environ['HOME']+'/.local/share/rabies' - -template = f"{rabies_path}/DSURQE_40micron_average.nii.gz" -mask = f"{rabies_path}/DSURQE_40micron_mask.nii.gz" +from rabies.utils import generate_token_data -img = sitk.ReadImage(template) -spacing = (float(1), float(1), float(1)) # resample to 1mmx1mmx1mm -resampled = resample_image_spacing(sitk.ReadImage(template), spacing) -array = sitk.GetArrayFromImage(resampled) -array_4d = np.repeat(array[np.newaxis, :, :, :], 15, axis=0) -array_4d += np.random.normal(0, array_4d.mean() - / 100, array_4d.shape) # add gaussian noise -sitk.WriteImage(resampled, tmppath+'/inputs/sub-token_T1w.nii.gz') -sitk.WriteImage(resampled, tmppath+'/inputs/sub-token2_T1w.nii.gz') -sitk.WriteImage(resampled, tmppath+'/inputs/sub-token3_T1w.nii.gz') -sitk.WriteImage(sitk.GetImageFromArray(array_4d, isVector=False), - tmppath+'/inputs/sub-token_bold.nii.gz') - -resampled = resample_image_spacing(sitk.ReadImage(mask), spacing) -array = sitk.GetArrayFromImage(resampled) -array[array < 1] = 0 -array[array > 1] = 1 -binarized = sitk.GetImageFromArray(array, isVector=False) -binarized.CopyInformation(resampled) -sitk.WriteImage(binarized, tmppath+'/inputs/token_mask.nii.gz') -array[:, :, :6] = 0 -binarized = sitk.GetImageFromArray(array, isVector=False) -binarized.CopyInformation(resampled) -sitk.WriteImage(binarized, tmppath+'/inputs/token_mask_half.nii.gz') - - -sitk.WriteImage(copyInfo_4DImage(sitk.ReadImage(tmppath+'/inputs/sub-token_bold.nii.gz'), sitk.ReadImage(tmppath - + '/inputs/sub-token_T1w.nii.gz'), sitk.ReadImage(tmppath+'/inputs/sub-token_bold.nii.gz')), tmppath+'/inputs/sub-token_bold.nii.gz') +import tempfile +tmppath = tempfile.mkdtemp() +#### increase the number of scans generated to 3 if running group analysis +generate_token_data(tmppath, number_scans=1) output_folder = f'{tmppath}/outputs' + +#### HERE ARE SET THE DESIRED PARAMETERS FOR PREPROCESSING args = [ #'--debug', 'preprocess', f'{tmppath}/inputs', output_folder, - '--anat_inho_cor_method','disable', '--bold_inho_cor_method', 'disable', - '--coreg_script', 'NULL', '--atlas_reg_script', 'NULL', '--data_type', 'int16', '--bold_only', '--fast_commonspace', - '--anat_template', f'{tmppath}/inputs/sub-token_T1w.nii.gz', + '--anat_inho_cor', 'method=disable,otsu_thresh=2,multiotsu=false', + '--bold_inho_cor', 'method=disable,otsu_thresh=2,multiotsu=false', + '--bold2anat_coreg', 'registration=no_reg,masking=false,brain_extraction=false', + '--commonspace_reg', 'masking=false,brain_extraction=false,fast_commonspace=true,template_registration=no_reg', + '--data_type', 'int16', '--bold_only', + '--anat_template', f'{tmppath}/inputs/sub-token1_T1w.nii.gz', '--brain_mask', f'{tmppath}/inputs/token_mask.nii.gz', '--WM_mask', f'{tmppath}/inputs/token_mask.nii.gz', '--CSF_mask', f'{tmppath}/inputs/token_mask.nii.gz', @@ -67,40 +27,5 @@ '--labels', f'{tmppath}/inputs/token_mask.nii.gz', ] -from rabies.parser import get_parser - -parser = get_parser() - -opts = parser.parse_args(args) - -if not os.path.isdir(output_folder): - os.makedirs(output_folder) - -from rabies.run_main import prep_logging, preprocess, confound_correction, analysis -log = prep_logging(opts, output_folder) - -# print complete CLI command -args = 'CLI INPUTS: \n' -for arg in vars(opts): - input = f'-> {arg} = {getattr(opts, arg)} \n' - args += input -log.info(args) - - -if opts.rabies_stage == 'preprocess': - workflow = preprocess(opts, log) -elif opts.rabies_stage == 'confound_correction': - workflow = confound_correction(opts, log) -elif opts.rabies_stage == 'analysis': - workflow = analysis(opts, log) -else: - parser.print_help() -workflow.base_dir = output_folder - - -log.info(f'Running workflow with {opts.plugin} plugin.') -# execute workflow, with plugin_args limiting the cluster load for parallel execution -graph_out = workflow.run(plugin=opts.plugin, plugin_args={'max_jobs': 50, 'dont_resubmit_completed_jobs': True, - 'n_procs': opts.local_threads, 'qsub_args': f'-pe smp {str(opts.min_proc)}'}) - - +from rabies.run_main import execute_workflow +execute_workflow(args=args) diff --git a/scripts/error_check_rabies.py b/scripts/error_check_rabies.py index cc11467..33715d9 100755 --- a/scripts/error_check_rabies.py +++ b/scripts/error_check_rabies.py @@ -1,63 +1,17 @@ #! /usr/bin/env python -import SimpleITK as sitk import os import sys -import numpy as np import tempfile import shutil import subprocess -from rabies.utils import resample_image_spacing, copyInfo_4DImage +from rabies.utils import generate_token_data if len(sys.argv) == 2: tmppath = sys.argv[1] else: tmppath = tempfile.mkdtemp() -def generate_token_data(tmppath, number_scans): - - os.makedirs(tmppath+'/inputs', exist_ok=True) - - if 'XDG_DATA_HOME' in os.environ.keys(): - rabies_path = os.environ['XDG_DATA_HOME']+'/rabies' - else: - rabies_path = os.environ['HOME']+'/.local/share/rabies' - - template = f"{rabies_path}/DSURQE_40micron_average.nii.gz" - mask = f"{rabies_path}/DSURQE_40micron_mask.nii.gz" - - spacing = (float(1), float(1), float(1)) # resample to 1mmx1mmx1mm - resampled_template = resample_image_spacing(sitk.ReadImage(template), spacing) - # generate template masks - resampled_mask = resample_image_spacing(sitk.ReadImage(mask), spacing) - array = sitk.GetArrayFromImage(resampled_mask) - array[array < 1] = 0 - array[array > 1] = 1 - binarized = sitk.GetImageFromArray(array, isVector=False) - binarized.CopyInformation(resampled_mask) - sitk.WriteImage(binarized, tmppath+'/inputs/token_mask.nii.gz') - array[:, :, :6] = 0 - binarized = sitk.GetImageFromArray(array, isVector=False) - binarized.CopyInformation(resampled_mask) - sitk.WriteImage(binarized, tmppath+'/inputs/token_mask_half.nii.gz') - - # generate fake scans from the template - array = sitk.GetArrayFromImage(resampled_template) - array_4d = np.repeat(array[np.newaxis, :, :, :], 15, axis=0) - - for i in range(number_scans): - # generate anatomical scan - sitk.WriteImage(resampled_template, tmppath+f'/inputs/sub-token{i+1}_T1w.nii.gz') - # generate functional scan - array_4d_ = array_4d + np.random.normal(0, array_4d.mean() - / 100, array_4d.shape) # add gaussian noise - sitk.WriteImage(sitk.GetImageFromArray(array_4d_, isVector=False), - tmppath+f'/inputs/sub-token{i+1}_bold.nii.gz') - - sitk.WriteImage(copyInfo_4DImage(sitk.ReadImage(tmppath+f'/inputs/sub-token{i+1}_bold.nii.gz'), sitk.ReadImage(tmppath - + f'/inputs/sub-token{i+1}_T1w.nii.gz'), sitk.ReadImage(tmppath+f'/inputs/sub-token{i+1}_bold.nii.gz')), tmppath+f'/inputs/sub-token{i+1}_bold.nii.gz') - - generate_token_data(tmppath, number_scans=1) command = f"rabies --verbose 1 preprocess {tmppath}/inputs {tmppath}/outputs --anat_inho_cor method=disable,otsu_thresh=2,multiotsu=false --bold_inho_cor method=disable,otsu_thresh=2,multiotsu=false \ From 7c4237dc19f9f5a8a531ac17214cd24df36b9033 Mon Sep 17 00:00:00 2001 From: Gab-D-G Date: Fri, 22 Sep 2023 16:51:23 -0400 Subject: [PATCH 3/7] Warning for removing empty outputs from confound correction and error to catch an empty list of scans for analysis. --- rabies/analysis_pkg/main_wf.py | 21 +++++++++++++++++++++ 1 file changed, 21 insertions(+) diff --git a/rabies/analysis_pkg/main_wf.py b/rabies/analysis_pkg/main_wf.py index 547037e..d845eca 100644 --- a/rabies/analysis_pkg/main_wf.py +++ b/rabies/analysis_pkg/main_wf.py @@ -17,6 +17,14 @@ def init_main_analysis_wf(preprocess_opts, cr_opts, analysis_opts): split_dict, split_name_list, target_list = read_confound_workflow(conf_output, nativespace=cr_opts.nativespace_analysis) + if len(split_name_list)==0: + raise ValueError(f""" + No outputs were founds from the confound correction stage. + All scans may have been removed for not meeting the minimum_timepoint threshold + when applying --frame_censoring. Outputs will be named empty.nii.gz if this is + the case. + """) + # update split_name according to the --scan_list option split_name_list = get_iterable_scan_list(analysis_opts.scan_list, split_name_list) @@ -310,6 +318,8 @@ def load_sub_input_dict(maps_dict, bold_file, CR_data_dict, VE_file, STD_file, C def read_confound_workflow(conf_output, nativespace=False): + from nipype import logging + log = logging.getLogger('nipype.workflow') conf_workflow_file = f'{conf_output}/rabies_confound_correction_workflow.pkl' @@ -358,15 +368,26 @@ def read_confound_workflow(conf_output, nativespace=False): # don't include scans that were removed during confound correction corrected_split_name=[] + remove_list = [] import pathlib for name in split_name: filename = pathlib.Path(split_dict[name]['cleaned_path']).name if 'empty' in filename: + remove_list.append(name) del split_dict[name] else: corrected_split_name.append(name) split_name = corrected_split_name + if len(remove_list)>0: + scan_list_str = '' + for name in remove_list: + scan_list_str += f'\n - {name}' + log.warning(f""" + The following scans were not included for analysis as the file was empty: {scan_list_str} + This is likely due to not meeting the minimum_timepoints threshold from --frame_censoring. + """) + return split_dict, split_name, target_list From 5605dd90af908154084ab7d4a2b176bbc4c835f1 Mon Sep 17 00:00:00 2001 From: Gab-D-G Date: Fri, 22 Sep 2023 16:52:12 -0400 Subject: [PATCH 4/7] Test analysis stage with --nativespace_analysis on --- scripts/error_check_rabies.py | 21 +++++++++++++++------ 1 file changed, 15 insertions(+), 6 deletions(-) diff --git a/scripts/error_check_rabies.py b/scripts/error_check_rabies.py index 33715d9..20ac22a 100755 --- a/scripts/error_check_rabies.py +++ b/scripts/error_check_rabies.py @@ -42,12 +42,21 @@ shell=True, ) -#command = f"rabies --verbose 1 analysis {tmppath}/outputs {tmppath}/outputs --data_diagnosis" -#process = subprocess.run( -# command, -# check=True, -# shell=True, -# ) +# rerunning confound correction without censoring, which removes all scans +os.remove(f'{tmppath}/outputs/rabies_confound_correction.pkl') +command = f"rabies --verbose 1 confound_correction {tmppath}/outputs {tmppath}/outputs --nativespace_analysis" +process = subprocess.run( + command, + check=True, + shell=True, + ) + +command = f"rabies --verbose 1 analysis {tmppath}/outputs {tmppath}/outputs --data_diagnosis" +process = subprocess.run( + command, + check=True, + shell=True, + ) shutil.rmtree(f'{tmppath}/inputs/') generate_token_data(tmppath, number_scans=3) From 0195ddc11facdacb85abf167fa7335cc4a217d16 Mon Sep 17 00:00:00 2001 From: Gab-D-G Date: Fri, 22 Sep 2023 19:38:39 -0400 Subject: [PATCH 5/7] Implement flagging system at each pipeline stage with --inclusion_ids argument. --- rabies/analysis_pkg/main_wf.py | 5 ++-- rabies/confound_correction_pkg/main_wf.py | 4 +++ rabies/parser.py | 16 ++++++++++++ rabies/preprocess_pkg/main_wf.py | 2 +- rabies/preprocess_pkg/utils.py | 14 +++++++++- rabies/utils.py | 32 +++++++++++++++++++++++ 6 files changed, 69 insertions(+), 4 deletions(-) diff --git a/rabies/analysis_pkg/main_wf.py b/rabies/analysis_pkg/main_wf.py index d845eca..898f35e 100644 --- a/rabies/analysis_pkg/main_wf.py +++ b/rabies/analysis_pkg/main_wf.py @@ -25,8 +25,9 @@ def init_main_analysis_wf(preprocess_opts, cr_opts, analysis_opts): the case. """) - # update split_name according to the --scan_list option - split_name_list = get_iterable_scan_list(analysis_opts.scan_list, split_name_list) + # filter inclusion/exclusion lists + from rabies.utils import filter_scan_inclusion + split_name_list = filter_scan_inclusion(analysis_opts.inclusion_ids, split_name_list) # setting up iterables from the BOLD scan splits main_split = pe.Node(niu.IdentityInterface(fields=['split_name']), diff --git a/rabies/confound_correction_pkg/main_wf.py b/rabies/confound_correction_pkg/main_wf.py index 961842c..ace0536 100644 --- a/rabies/confound_correction_pkg/main_wf.py +++ b/rabies/confound_correction_pkg/main_wf.py @@ -23,6 +23,10 @@ def init_main_confound_correction_wf(preprocess_opts, cr_opts): else: split_dict, split_name, target_list = read_preproc_workflow(preproc_output, nativespace=cr_opts.nativespace_analysis) + # filter inclusion/exclusion lists + from rabies.utils import filter_scan_inclusion + split_name = filter_scan_inclusion(cr_opts.inclusion_ids, split_name) + # setting up iterables from the BOLD scan splits main_split = pe.Node(niu.IdentityInterface(fields=['split_name']), name="main_split") diff --git a/rabies/parser.py b/rabies/parser.py index f20baf6..ef99a3d 100644 --- a/rabies/parser.py +++ b/rabies/parser.py @@ -80,6 +80,22 @@ def get_parser(): description= "Options for parallel execution and memory management." ) + g_execution.add_argument( + '--inclusion_ids', type=str, + nargs="*", # 0 or more values expected => creates a list + default=['all'], + help= + "Define a list of BOLD scan to include, i.e. run the pipeline on a subset of the data. \n" + "To do so, provide the full path to the corresponding BOLD file in the input BIDS folder. The list \n" + "of scan can be specified manually as a list of file name '--scan_list scan1.nii.gz \n" + "scan2.nii.gz ...' or the files can be imbedded into a .txt file with one filename per row.\n" + "By default, 'all' the scans found in the input BIDS directory or from the previous \n" + "processing step. This can be provided at any processing stage.\n" + "***NOTE: do not enter this parameter right before the processing stage (preprocess, etc...), this will cause \n" + "parsing errors. Instead, provide another parameter after --inclusion_ids (e.g. --verbose or -p). \n" + "(default: %(default)s)\n" + "\n" + ) g_execution.add_argument( "-p", "--plugin", default='Linear', choices=['Linear', 'MultiProc', 'SGE', 'SGEGraph', diff --git a/rabies/preprocess_pkg/main_wf.py b/rabies/preprocess_pkg/main_wf.py index 88d769f..4ef2e18 100644 --- a/rabies/preprocess_pkg/main_wf.py +++ b/rabies/preprocess_pkg/main_wf.py @@ -135,7 +135,7 @@ def init_main_wf(data_dir_path, output_folder, opts, name='main_wf'): bids.config.set_option('extension_initial_dot', True) layout = bids.layout.BIDSLayout(data_dir_path, validate=False) split_name, scan_info, run_iter, scan_list, bold_scan_list = prep_bids_iter( - layout, opts.bold_only) + layout, opts.bold_only, inclusion_list=opts.inclusion_ids) # setting up all iterables main_split = pe.Node(niu.IdentityInterface(fields=['split_name', 'scan_info']), diff --git a/rabies/preprocess_pkg/utils.py b/rabies/preprocess_pkg/utils.py index 02a8031..03f2e4d 100644 --- a/rabies/preprocess_pkg/utils.py +++ b/rabies/preprocess_pkg/utils.py @@ -8,7 +8,7 @@ ) from rabies.utils import run_command -def prep_bids_iter(layout, bold_only=False): +def prep_bids_iter(layout, bold_only=False, inclusion_list=['all']): ''' This function takes as input a BIDSLayout, and generates iteration lists for managing the workflow's iterables depending on whether --bold_only is @@ -38,6 +38,18 @@ def prep_bids_iter(layout, bold_only=False): raise ValueError( "No functional file with the suffix 'bold' were found among the BIDS directory.") + # filter inclusion/exclusion lists + from rabies.utils import filter_scan_inclusion + boldname_list=[pathlib.Path(bold.filename).name.rsplit(".nii")[0] for bold in bold_bids] + updated_split_name = filter_scan_inclusion(inclusion_list, boldname_list) + + filtered_bold_bids=[] + for name in updated_split_name: + for bold in bold_bids: + if name in bold.filename: + filtered_bold_bids.append(bold) + bold_bids = filtered_bold_bids + bold_dict = {} for bold in bold_bids: sub = bold.get_entities()['subject'] diff --git a/rabies/utils.py b/rabies/utils.py index d14dd4a..74539b1 100644 --- a/rabies/utils.py +++ b/rabies/utils.py @@ -389,6 +389,38 @@ def flatten_list(l): return l +def filter_scan_inclusion(inclusion_list, split_name): + # the function will update the list of scan IDs in split_name to correspond to inclusion/exclusion list + + # inclusion_list: the input provided by the user + # split_name: a list of all scan IDs that were found + + import numpy as np + import pandas as pd + if os.path.isfile(os.path.abspath(inclusion_list[0])): + updated_split_name=[] + if '.nii' in pathlib.Path(inclusion_list[0]).name: + for scan in inclusion_list: + updated_split_name.append(find_split(scan, split_name)) + else: + # read the file as a .txt + inclusion_list = np.array(pd.read_csv(os.path.abspath(inclusion_list[0]), header=None)).flatten() + for scan in inclusion_list: + updated_split_name.append(find_split(scan, split_name)) + elif inclusion_list[0]=='all': + updated_split_name = split_name + else: + raise ValueError(f"The --inclusion_ids {inclusion_list} input had improper format. It must the full path to a .txt or .nii files, or 'all' to keep all scans.") + return updated_split_name + + +def find_split(scan, split_name): + for split in split_name: + if split in scan: + return split + raise ValueError(f"No previous file name is matching {scan}") + + ###################### #FUNCTIONS TO READ WORKFLOW GRAPH ###################### From 32f3461f2a3bdcafcc7f3af255c8c853cb1cf699 Mon Sep 17 00:00:00 2001 From: Gab-D-G Date: Mon, 25 Sep 2023 17:44:24 -0400 Subject: [PATCH 6/7] Implemented an option for scan exclusion. --- rabies/analysis_pkg/main_wf.py | 3 ++- rabies/confound_correction_pkg/main_wf.py | 3 ++- rabies/parser.py | 11 ++++++++ rabies/preprocess_pkg/main_wf.py | 2 +- rabies/preprocess_pkg/utils.py | 5 ++-- rabies/run_main.py | 7 +++++ rabies/utils.py | 33 +++++++++++++++++++++++ 7 files changed, 59 insertions(+), 5 deletions(-) diff --git a/rabies/analysis_pkg/main_wf.py b/rabies/analysis_pkg/main_wf.py index 898f35e..ea4d555 100644 --- a/rabies/analysis_pkg/main_wf.py +++ b/rabies/analysis_pkg/main_wf.py @@ -26,8 +26,9 @@ def init_main_analysis_wf(preprocess_opts, cr_opts, analysis_opts): """) # filter inclusion/exclusion lists - from rabies.utils import filter_scan_inclusion + from rabies.utils import filter_scan_inclusion, filter_scan_exclusion split_name_list = filter_scan_inclusion(analysis_opts.inclusion_ids, split_name_list) + split_name_list = filter_scan_exclusion(analysis_opts.exclusion_ids, split_name_list) # setting up iterables from the BOLD scan splits main_split = pe.Node(niu.IdentityInterface(fields=['split_name']), diff --git a/rabies/confound_correction_pkg/main_wf.py b/rabies/confound_correction_pkg/main_wf.py index ace0536..78608bc 100644 --- a/rabies/confound_correction_pkg/main_wf.py +++ b/rabies/confound_correction_pkg/main_wf.py @@ -24,8 +24,9 @@ def init_main_confound_correction_wf(preprocess_opts, cr_opts): split_dict, split_name, target_list = read_preproc_workflow(preproc_output, nativespace=cr_opts.nativespace_analysis) # filter inclusion/exclusion lists - from rabies.utils import filter_scan_inclusion + from rabies.utils import filter_scan_inclusion, filter_scan_exclusion split_name = filter_scan_inclusion(cr_opts.inclusion_ids, split_name) + split_name = filter_scan_exclusion(cr_opts.exclusion_ids, split_name) # setting up iterables from the BOLD scan splits main_split = pe.Node(niu.IdentityInterface(fields=['split_name']), diff --git a/rabies/parser.py b/rabies/parser.py index ef99a3d..c24088e 100644 --- a/rabies/parser.py +++ b/rabies/parser.py @@ -96,6 +96,17 @@ def get_parser(): "(default: %(default)s)\n" "\n" ) + g_execution.add_argument( + '--exclusion_ids', type=str, + nargs="*", # 0 or more values expected => creates a list + default=['none'], + help= + "Instead of providing a list of scans to include, this argument provides a list of scans to exclude (while \n" + "keeping all other scans). This argument follows the same syntax rules as --includion_ids. --exclusion_ids \n" + "and --inclusion_ids cannot be used simultaneously. \n" + "(default: %(default)s)\n" + "\n" + ) g_execution.add_argument( "-p", "--plugin", default='Linear', choices=['Linear', 'MultiProc', 'SGE', 'SGEGraph', diff --git a/rabies/preprocess_pkg/main_wf.py b/rabies/preprocess_pkg/main_wf.py index 4ef2e18..3891dcc 100644 --- a/rabies/preprocess_pkg/main_wf.py +++ b/rabies/preprocess_pkg/main_wf.py @@ -135,7 +135,7 @@ def init_main_wf(data_dir_path, output_folder, opts, name='main_wf'): bids.config.set_option('extension_initial_dot', True) layout = bids.layout.BIDSLayout(data_dir_path, validate=False) split_name, scan_info, run_iter, scan_list, bold_scan_list = prep_bids_iter( - layout, opts.bold_only, inclusion_list=opts.inclusion_ids) + layout, opts.bold_only, inclusion_list=opts.inclusion_ids, exclusion_list=opts.exclusion_ids) # setting up all iterables main_split = pe.Node(niu.IdentityInterface(fields=['split_name', 'scan_info']), diff --git a/rabies/preprocess_pkg/utils.py b/rabies/preprocess_pkg/utils.py index 03f2e4d..c4b4d8f 100644 --- a/rabies/preprocess_pkg/utils.py +++ b/rabies/preprocess_pkg/utils.py @@ -8,7 +8,7 @@ ) from rabies.utils import run_command -def prep_bids_iter(layout, bold_only=False, inclusion_list=['all']): +def prep_bids_iter(layout, bold_only=False, inclusion_list=['all'], exclusion_list=['none']): ''' This function takes as input a BIDSLayout, and generates iteration lists for managing the workflow's iterables depending on whether --bold_only is @@ -39,9 +39,10 @@ def prep_bids_iter(layout, bold_only=False, inclusion_list=['all']): "No functional file with the suffix 'bold' were found among the BIDS directory.") # filter inclusion/exclusion lists - from rabies.utils import filter_scan_inclusion + from rabies.utils import filter_scan_inclusion, filter_scan_exclusion boldname_list=[pathlib.Path(bold.filename).name.rsplit(".nii")[0] for bold in bold_bids] updated_split_name = filter_scan_inclusion(inclusion_list, boldname_list) + updated_split_name = filter_scan_exclusion(exclusion_list, updated_split_name) filtered_bold_bids=[] for name in updated_split_name: diff --git a/rabies/run_main.py b/rabies/run_main.py index 0503557..505aed7 100644 --- a/rabies/run_main.py +++ b/rabies/run_main.py @@ -40,6 +40,13 @@ def execute_workflow(args=None): args += input log.info(args) + # inclusion/exclusion list are incompatible parameters + if (not opts.inclusion_ids[0]=='all') and (not opts.exclusion_ids[0]=='none'): + raise ValueError(f""" + Either an inclusion list (--inclusion_ids) or exclusion list (--exclusion_ids) + can be provided, not both. + """) + if opts.rabies_stage == 'preprocess': workflow = preprocess(opts, log) elif opts.rabies_stage == 'confound_correction': diff --git a/rabies/utils.py b/rabies/utils.py index 74539b1..5190829 100644 --- a/rabies/utils.py +++ b/rabies/utils.py @@ -389,6 +389,39 @@ def flatten_list(l): return l +def filter_scan_exclusion(exclusion_list, split_name): + # the function removes a list of scan IDs from split_name + + # exclusion_list: the input provided by the user + # split_name: a list of all scan IDs that were found + + import numpy as np + import pandas as pd + if os.path.isfile(os.path.abspath(exclusion_list[0])): + updated_split_name=[] + if not '.nii' in pathlib.Path(exclusion_list[0]).name: + # read the file as a .txt + exclusion_list = np.array(pd.read_csv(os.path.abspath(exclusion_list[0]), header=None)).flatten() + for split in split_name: + exclude = False + for scan in exclusion_list: + if split in scan: + exclude = True + if not exclude: + updated_split_name.append(split) + elif exclusion_list[0]=='none': + updated_split_name = split_name + else: + raise ValueError(f"The --exclusion_ids {exclusion_list} input had improper format. It must the full path to a .txt or .nii files.") + + if len(updated_split_name)==0: + raise ValueError(f""" + No scans are left after scan exclusion! + """) + + return updated_split_name + + def filter_scan_inclusion(inclusion_list, split_name): # the function will update the list of scan IDs in split_name to correspond to inclusion/exclusion list From a7262d76254977c000f08cd3c7c04a4a490c5e10 Mon Sep 17 00:00:00 2001 From: Gab-D-G Date: Mon, 25 Sep 2023 18:17:34 -0400 Subject: [PATCH 7/7] Implemented a --force option to automatically ignore previous RABIES outputs. --- rabies/parser.py | 8 ++++++++ rabies/run_main.py | 7 ++++--- scripts/debug_workflow.py | 31 ++++++++++++++++++++++++++++--- 3 files changed, 40 insertions(+), 6 deletions(-) diff --git a/rabies/parser.py b/rabies/parser.py index c24088e..d080b4b 100644 --- a/rabies/parser.py +++ b/rabies/parser.py @@ -156,6 +156,14 @@ def get_parser(): "(default: %(default)s)\n" "\n" ) + g_execution.add_argument( + "-f", "--force", dest='force', action='store_true', + help= + "The pipeline will not stop if previous outputs are encountered. \n" + "Previous outputs will be overwritten.\n" + "(default: %(default)s)\n" + "\n" + ) ####Preprocessing diff --git a/rabies/run_main.py b/rabies/run_main.py index 505aed7..7c83b78 100644 --- a/rabies/run_main.py +++ b/rabies/run_main.py @@ -79,12 +79,13 @@ def execute_workflow(args=None): def prep_logging(opts, output_folder): cli_file = f'{output_folder}/rabies_{opts.rabies_stage}.pkl' - if os.path.isfile(cli_file): + if os.path.isfile(cli_file) and not opts.force: raise ValueError(f""" A previous run was indicated by the presence of {cli_file}. This can lead to inconsistencies between previous outputs and the log files. - To prevent this, you are required to manually remove {cli_file}, and we - recommend also removing previous datasinks from the {opts.rabies_stage} RABIES step. + To prevent this, we recommend removing previous datasinks from the {opts.rabies_stage} + RABIES stage. To continue with your execution, the {cli_file} file must be + removed (use --force to automatically do so). """) # remove old versions of the log if already existing diff --git a/scripts/debug_workflow.py b/scripts/debug_workflow.py index 24431c4..4cbc3dd 100644 --- a/scripts/debug_workflow.py +++ b/scripts/debug_workflow.py @@ -1,24 +1,27 @@ #! /usr/bin/env python from rabies.utils import generate_token_data +from rabies.run_main import execute_workflow import tempfile tmppath = tempfile.mkdtemp() #### increase the number of scans generated to 3 if running group analysis -generate_token_data(tmppath, number_scans=1) +generate_token_data(tmppath, number_scans=3) output_folder = f'{tmppath}/outputs' #### HERE ARE SET THE DESIRED PARAMETERS FOR PREPROCESSING args = [ + f'--exclusion_ids',f'{tmppath}/inputs/sub-token1_bold.nii.gz', + '-f', #'--debug', 'preprocess', f'{tmppath}/inputs', output_folder, '--anat_inho_cor', 'method=disable,otsu_thresh=2,multiotsu=false', '--bold_inho_cor', 'method=disable,otsu_thresh=2,multiotsu=false', '--bold2anat_coreg', 'registration=no_reg,masking=false,brain_extraction=false', '--commonspace_reg', 'masking=false,brain_extraction=false,fast_commonspace=true,template_registration=no_reg', - '--data_type', 'int16', '--bold_only', + '--data_type', 'int16', '--anat_template', f'{tmppath}/inputs/sub-token1_T1w.nii.gz', '--brain_mask', f'{tmppath}/inputs/token_mask.nii.gz', '--WM_mask', f'{tmppath}/inputs/token_mask.nii.gz', @@ -27,5 +30,27 @@ '--labels', f'{tmppath}/inputs/token_mask.nii.gz', ] -from rabies.run_main import execute_workflow execute_workflow(args=args) + + + +''' + +args = [ + f'--exclusion_ids',f'{tmppath}/inputs/sub-token1_bold.nii.gz',f'{tmppath}/inputs/sub-token2_bold.nii.gz', + '-f', + 'confound_correction', output_folder, output_folder, + '--nativespace_analysis', + ] +execute_workflow(args=args) + + +args = [ + f'--exclusion_ids',f'{tmppath}/inputs/sub-token3_bold.nii.gz', + '-f', + 'analysis', output_folder, output_folder, + '--data_diagnosis' + ] +execute_workflow(args=args) + +'''