浏览代码

modified grid2csv.py

Martin Frébourg 2 年之前
父节点
当前提交
34bc9b8856
共有 3 个文件被更改，包括 5 次插入和 2 次删除
  1. 4 1
      code/grid2csv.py
  2. 0 1
      outputs/grid2csv_output/BN.csv
  3. 1 0
      outputs/grid2csv_output/BN32_010007-aligned.csv.csv

+ 4 - 1
code/grid2csv.py

@@ -57,6 +57,9 @@ for file in files:
         for interval in tier.get_all_intervals():
             
             if not interval[2]: continue
+            if interval[2] == "sil" : 
+                continue
+
             #populates dataframe
             temp_dict = {'speaker_id': tier.name, 'segment_onset': (interval[0]*1000 + audio_onset),
                 'segment_offset': (interval[1]*1000 + audio_onset), 'transcription': interval[2]}
@@ -82,5 +85,5 @@ df = pd.concat([df, orig_df_subset])
 df.sort_values(by='segment_onset', inplace= True)
 
 #exports to csv
-df.to_csv("{0}/BN.csv".format(output_path), mode = "x", na_rep= "NA", index= False)
+df.to_csv("{0}/BN32_010007-aligned.csv.csv".format(output_path), mode = "x", na_rep= "NA", index= False)
 print("----------------SAVED!-----------------")

+ 0 - 1
outputs/grid2csv_output/BN.csv

@@ -1 +0,0 @@
-../../.git/annex/objects/vx/Wp/MD5E-s7745478--90d300849f4aa887ed1c4e6845b69878.csv/MD5E-s7745478--90d300849f4aa887ed1c4e6845b69878.csv

+ 1 - 0
outputs/grid2csv_output/BN32_010007-aligned.csv.csv

@@ -0,0 +1 @@
+../../.git/annex/objects/xZ/ZQ/MD5E-s7705400--ed44f3c5b73a0f1ba209b780aba62b3d.csv.csv/MD5E-s7705400--ed44f3c5b73a0f1ba209b780aba62b3d.csv.csv