# FeatureCheck.py
import glob
import os

import alive_progress as ap
import matplotlib.backends.backend_pdf
import matplotlib.pyplot as plt
import nibabel as nib
import nibabel as nii
import numpy as np
import pandas as pd

import pv_conv2Nifti as pr
import pv_parser as par
from QC import *
#%% Feature calculation of the pipeline. Core Unit of the Pipeline
  14. def CheckingRawFeatures(Path):
  15. #Path=r"C:\Users\Erfan\Downloads\Compressed\proc_data\P5"
  16. Abook = []
  17. Names =[]
  18. for file in glob.glob(os.path.join(Path, '*addreses*.csv')) :
  19. if "anat" in file :
  20. t2w_path= file
  21. t2w_addreses= pd.read_csv(t2w_path)
  22. Abook.append(t2w_addreses)
  23. Names.append("anat")
  24. elif "diff" in file:
  25. dti_path= file
  26. dti_addreses= pd.read_csv(dti_path)
  27. Abook.append(dti_addreses)
  28. Names.append("diff")
  29. elif "func" in file :
  30. fmri_path= file
  31. fmri_addreses= pd.read_csv(fmri_path)
  32. Abook.append(fmri_addreses)
  33. Names.append("func")
  34. ErorrList = []
  35. saving_path = Path
  36. C = np.array([not Check.empty for Check in Abook])
  37. Names = np.array(Names)[C].tolist()
  38. Names.append('ErrorData')
  39. Abook2 = [a.values.tolist() for a in Abook]
  40. #% Calculate all the SNR for all the data that was found
  41. # in the last step and saving it into a vector
  42. # Load Bruker data from each address
  43. kk =0
  44. for ii,N in enumerate(Names):
  45. if N != 'ErrorData':
  46. if kk > 0:
  47. print(str(kk) + ' 1 faulty file(s) were found. Note: these files will be listed in CanNotProcessTheseFiles.csv \n')
  48. print(N+' processing... \n')
  49. text_files0 = Abook2[ii]
  50. text_files = [i[0] for i in text_files0]
  51. dd = 1
  52. snrCh_vec =[]
  53. tsnr_vec = []
  54. snr_normal_vec = []
  55. SpatRes_vec = []
  56. MI_vec_all = []
  57. LMV_all = []
  58. GMV_all = []
  59. Max_mov_between_all = []
  60. text_files_new = []
  61. img_names_new = []
  62. keys = []
  63. GMetric_vec = []
  64. kk = 0
  65. i=1
  66. with ap.alive_bar(len(text_files),spinner='wait') as bar:
  67. for tf in text_files:
  68. tf = str(tf)
  69. tf = os.path.normpath(tf)
  70. path_split = tf.split(os.sep)
  71. procno = str(1)
  72. expno =path_split[-1]
  73. study = path_split[-2]
  74. raw_folder = os.sep.join(path_split[:-2])
  75. proc_folder = os.path.join(raw_folder,'proc_data') #Here still adjustment is needed
  76. pv = pr.Bruker2Nifti(study, expno, procno, raw_folder, proc_folder, ftype='NIFTI_GZ')
  77. CP_v = os.path.join(tf ,'pdata','1','visu_pars') # Check Parameter: Visu_pars
  78. CP_a = os.path.join(tf , 'acqp') # Check Parameter: acqp
  79. if os.path.isfile(CP_v) and os.path.isfile(CP_a):
  80. try:
  81. pv.read_2dseq(map_raw=False, pv6=False)
  82. input_file = nii.squeeze_image(pv.nim)
  83. except ValueError:
  84. ErorrList.append(tf+"_Value Error")
  85. print(tf)
  86. print("Value Error: catched")
  87. continue
  88. except SystemError:
  89. ErorrList.append(tf+"_System Error")
  90. print(tf)
  91. print("System Error: catched")
  92. continue
  93. except KeyError:
  94. ErorrList.append(tf+"_KeyError")
  95. print(tf)
  96. print("KeyError: catched")
  97. continue
  98. except FileNotFoundError:
  99. ErorrList.append(tf+"_FileNotFoundError")
  100. print(tf)
  101. print("System Error: catched")
  102. continue
  103. else:
  104. ErorrList.append(tf+"No_Visu_pars_file")
  105. print("No Visu_pars file found")
  106. kk = kk+1
  107. continue
  108. # determine sequence name
  109. NameTemp = par.read_param_file(CP_a)
  110. MN = NameTemp[1]["ACQ_method"].upper() #Here we check what the name of the sequence is
  111. MN2 = NameTemp[1]["ACQ_protocol_name"].upper()
  112. KEY = MN + MN2
  113. keys.append(KEY)
  114. # =============================================================================
  115. # Size = ((input_file.get_fdata()).nbytes/(1024*1024))
  116. # if Size < 3:
  117. # ErorrList.append(tf)
  118. # continue
  119. # =============================================================================
  120. ########### Slice extraction
  121. selected_img = Image_Selection(input_file)
  122. qc_path = os.path.join(saving_path,"manual_slice_inspection")
  123. if not os.path.isdir(qc_path):
  124. os.mkdir(qc_path)
  125. img_name = str.split(tf,os.sep)[-2]
  126. full_img_name = str(N)+"_" + img_name+"_"+ str(dd)+".png".replace(".nii","").replace(".gz","")
  127. img_names_new.append(full_img_name)
  128. #plt.figure()
  129. plt.axis('off')
  130. plt.imshow(selected_img,cmap='gray')
  131. #svg_path = os.path.join(qc_path,+ img_name+".png").replace(".nii","").replace(".gz","")
  132. svg_path = os.path.join(qc_path,str(N)+"_"+ img_name+"_"+ str(dd)+".png").replace(".nii","").replace(".gz","")
  133. dd = dd +1
  134. plt.savefig(svg_path)
  135. ########### Slice extraction
  136. # other Features
  137. SpatRes = ResCalculator(input_file)
  138. GMetric = GoastCheck(input_file)
  139. if N == 'anat':
  140. # Signal 2 noise ratio
  141. snrCh = snrCalclualtor_chang(input_file)
  142. snr_normal = snrCalclualtor_normal(input_file)
  143. LMV_all = np.nan
  144. GMV_all = np.nan
  145. Max_mov_between_all = np.nan
  146. snr_normal_vec.append(snr_normal)
  147. snrCh_vec.append(snrCh)
  148. elif N == 'diff':
  149. # Signal 2 noise ratio
  150. #print(tf)
  151. snrCh = snrCalclualtor_chang(input_file)
  152. snr_normal = snrCalclualtor_normal(input_file)
  153. Final,Max_mov_between,GMV,LMV = Ismotion(input_file)
  154. GMV_all.append(GMV)
  155. LMV_all.append(LMV)
  156. MI_vec_all.append(Final)
  157. Max_mov_between_all.append(Max_mov_between)
  158. snr_normal_vec.append(snr_normal)
  159. snrCh_vec.append(snrCh)
  160. elif N == 'func':
  161. #temporal signal 2 noise ratio
  162. #print(tf)
  163. tSNR = TsnrCalclualtor(input_file)
  164. Final,Max_mov_between,GMV,LMV = Ismotion(input_file)
  165. Max_mov_between_all.append(Max_mov_between)
  166. GMV_all.append(GMV)
  167. LMV_all.append(LMV)
  168. MI_vec_all.append(Final)
  169. Max_mov_between_all.append(Max_mov_between)
  170. tsnr_vec.append(tSNR)
  171. i=i+1
  172. bar()
  173. text_files_new.append(tf)
  174. SpatRes_vec.append(SpatRes)
  175. GMetric_vec.append(GMetric)
  176. df = pd.DataFrame()
  177. df['FileAddress'] = text_files_new
  178. df['sequence name'] = keys
  179. df["corresponding_img"] = img_names_new
  180. df['SpatRx'] = np.array(SpatRes_vec)[:,0]
  181. df['SpatRy'] = np.array(SpatRes_vec)[:,1]
  182. df['Slicethick'] = np.array(SpatRes_vec)[:,2]
  183. df['Goasting'] = np.array(GMetric_vec)
  184. if N == 'anat':
  185. df['SNR Chang'] = np.array(snrCh_vec)
  186. df['SNR Normal'] = np.array(snr_normal_vec)
  187. elif N == 'diff':
  188. df['SNR Chang'] = np.array(snrCh_vec)
  189. df['SNR Normal'] = np.array(snr_normal_vec)
  190. df['Displacement factor (std of Mutual information)']=np.array(LMV_all)
  191. #df['Maximal displacement']=AR[4]
  192. elif N == "func":
  193. df['tSNR (Averaged Brain ROI)'] = np.array(tsnr_vec)
  194. df['Displacement factor (std of Mutual information)']=np.array(LMV_all)
  195. #df['Maximal displacement']=AR[4]
  196. if N=="anat":
  197. t2w_result= os.path.join(Path,"caculated_features_anat.csv")
  198. df.to_csv( t2w_result)
  199. elif N=="diff":
  200. dti_result= os.path.join(Path,"caculated_features_diff.csv")
  201. df.to_csv( dti_result)
  202. elif N=="func":
  203. fmri_result= os.path.join(Path,"caculated_features_func.csv")
  204. df.to_csv(fmri_result)
  205. if ErorrList:
  206. dfNewError = pd.DataFrame(ErorrList)
  207. new_file_path = os.path.join(saving_path, "CanNotProcessTheseFiles.csv")
  208. dfNewError.to_csv(new_file_path)
  209. print('\n\noutput files were created:' + str(Path))
  210. print('\n\n%%%%%%%%%%%%% End of the stage 2 %%%%%%%%%%%%%%%\n\n'.upper())
  211. #%% exact above function but this time for nifti format
  212. def CheckingNiftiFeatures(Path):
  213. Abook = []
  214. Names =[]
  215. for file in glob.glob(os.path.join(Path, '*addreses*.csv')) :
  216. if "anat" in file :
  217. t2w_path= file
  218. t2w_addreses= pd.read_csv(t2w_path)
  219. Abook.append(t2w_addreses)
  220. Names.append("anat")
  221. elif "diff" in file:
  222. dti_path= file
  223. dti_addreses= pd.read_csv(dti_path)
  224. Abook.append(dti_addreses)
  225. Names.append("diff")
  226. elif "func" in file :
  227. fmri_path= file
  228. fmri_addreses= pd.read_csv(fmri_path)
  229. Abook.append(fmri_addreses)
  230. Names.append("func")
  231. ErorrList = []
  232. saving_path = os.path.dirname(Path)
  233. C = np.array([not Check.empty for Check in Abook])
  234. Names = np.array(Names)[C].tolist()
  235. Names.append('ErrorData')
  236. Abook2 = [a.values.tolist() for a in Abook]
  237. #% Calculate all the SNR for all the data that was found
  238. # in the last step and saving it into a vector
  239. # Load Bruker data from each address
  240. kk =0
  241. for ii,N in enumerate(Names):
  242. if N != 'ErrorData':
  243. if kk > 0:
  244. print(str(kk) + 'faulty files were found: All faulty files are available in the Errorlist tab in the Excel outputs\n')
  245. print(N+' processing... \n')
  246. text_files0 = Abook2[ii]
  247. text_files = [i[0] for i in text_files0]
  248. dd = 1
  249. snrCh_vec =[]
  250. tsnr_vec = []
  251. snr_normal_vec = []
  252. SpatRes_vec = []
  253. MI_vec_all = []
  254. LMV_all = []
  255. GMV_all = []
  256. Max_mov_between_all = []
  257. text_files_new = []
  258. img_names_new = []
  259. GMetric_vec = []
  260. kk = 0
  261. i=1
  262. with ap.alive_bar(len(text_files),spinner='wait') as bar:
  263. for tf in text_files:
  264. tf = str(tf)
  265. print(tf)
  266. """
  267. if "DTI".upper() in tf.upper() :
  268. N= "DTI"
  269. if "T2w".upper() in tf.upper():
  270. N="T2w"
  271. if "fMRI".upper() in tf.upper():
  272. N="rsfMRI"
  273. """
  274. tf = os.path.normpath(tf)
  275. try:
  276. input_file= nib.load(tf)
  277. except nib.loadsave.ImageFileError:
  278. print("could not load the following file (check the size of the file):")
  279. print(tf)
  280. ErorrList.append(tf)
  281. continue
  282. ########### Slice extraction
  283. selected_img = Image_Selection(input_file)
  284. qc_path = os.path.join(Path,"manual_slice_inspection")
  285. if not os.path.isdir(qc_path):
  286. os.mkdir(qc_path)
  287. img_name = str.split(tf,os.sep)[-1]
  288. folder_name = str.split(tf,os.sep)[-2]
  289. full_img_name = (str(N)+"_"+folder_name+"_"+img_name+"_"+str(dd)+".png").replace(".nii","").replace(".gz","")
  290. img_names_new.append(full_img_name)
  291. #plt.figure()
  292. plt.axis('off')
  293. plt.imshow(selected_img,cmap='gray')
  294. svg_path = os.path.join(qc_path,str(N)+"_"+folder_name+"_"+img_name+"_"+str(dd)+".png").replace(".nii","").replace(".gz","")
  295. dd = dd +1
  296. plt.savefig(svg_path)
  297. ########### Slice extraction
  298. # other Features
  299. SpatRes = ResCalculator(input_file)
  300. GMetric = GoastCheck(input_file)
  301. if N == "anat":
  302. # Signal 2 noise ratio
  303. snrCh = snrCalclualtor_chang(input_file)
  304. snr_normal = snrCalclualtor_normal(input_file)
  305. LMV_all = np.nan
  306. GMV_all = np.nan
  307. Max_mov_between_all = np.nan
  308. snr_normal_vec.append(snr_normal)
  309. snrCh_vec.append(snrCh)
  310. elif N == "diff":
  311. # Signal 2 noise ratio
  312. snrCh = snrCalclualtor_chang(input_file)
  313. snr_normal = snrCalclualtor_normal(input_file)
  314. Final,Max_mov_between,GMV,LMV = Ismotion(input_file)
  315. GMV_all.append(GMV)
  316. LMV_all.append(LMV)
  317. MI_vec_all.append(Final)
  318. Max_mov_between_all.append(Max_mov_between)
  319. snr_normal_vec.append(snr_normal)
  320. snrCh_vec.append(snrCh)
  321. elif N == "func":
  322. #temporal signal 2 noise ratio
  323. tSNR = TsnrCalclualtor(input_file)
  324. Final,Max_mov_between,GMV,LMV = Ismotion(input_file)
  325. Max_mov_between_all.append(Max_mov_between)
  326. GMV_all.append(GMV)
  327. LMV_all.append(LMV)
  328. MI_vec_all.append(Final)
  329. Max_mov_between_all.append(Max_mov_between)
  330. tsnr_vec.append(tSNR)
  331. i=i+1
  332. bar()
  333. text_files_new.append(tf)
  334. SpatRes_vec.append(SpatRes)
  335. GMetric_vec.append(GMetric)
  336. # Saving parsed files to excel sheets
  337. #AR = [text_files_new,np.array(SpatRes_vec),np.array(snrCh_vec),np.array(LMV_all),np.array(GMV_all),np.array(snr_normal_vec)]
  338. # using the savetxt
  339. # from the numpy module
  340. df = pd.DataFrame()
  341. df['FileAddress'] = text_files_new
  342. df["corresponding_img"] = img_names_new
  343. df['SpatRx'] = np.array(SpatRes_vec)[:,0]
  344. df['SpatRy'] = np.array(SpatRes_vec)[:,1]
  345. df['Slicethick'] = np.array(SpatRes_vec)[:,2]
  346. df['Goasting'] = np.array(GMetric_vec)
  347. if N == "anat":
  348. df['SNR Chang'] = np.array(snrCh_vec)
  349. df['SNR Normal'] = np.array(snr_normal_vec)
  350. elif N == "diff":
  351. df['SNR Chang'] = np.array(snrCh_vec)
  352. df['SNR Normal'] = np.array(snr_normal_vec)
  353. df['Displacement factor (std of Mutual information)']=np.array(LMV_all)
  354. #df['Maximal displacement']=AR[4]
  355. elif N == "func":
  356. df['tSNR (Averaged Brain ROI)'] = np.array(tsnr_vec)
  357. df['Displacement factor (std of Mutual information)']=np.array(LMV_all)
  358. #df['Maximal displacement']=AR[4]
  359. if N=="anat":
  360. t2w_result= os.path.join(Path,"caculated_features_anat.csv")
  361. df.to_csv( t2w_result)
  362. elif N=="diff":
  363. dti_result= os.path.join(Path,"caculated_features_diff.csv")
  364. df.to_csv( dti_result)
  365. elif N=="func":
  366. fmri_result= os.path.join(Path,"caculated_features_func.csv")
  367. df.to_csv(fmri_result)
  368. if ErorrList:
  369. dfNewError = pd.DataFrame(ErorrList)
  370. new_file_path = os.path.join(saving_path, "CanNotProcessTheseFiles.csv")
  371. dfNewError.to_csv(new_file_path)
  372. print('\n\noutput file was created:' + str(Path))
  373. print('\n\n%%%%%%%%%%%%% End of the stage 2 %%%%%%%%%%%%%%%\n\n'.upper())
  374. #%%