|
@@ -57,6 +57,9 @@ for file in files:
|
|
|
for interval in tier.get_all_intervals():
|
|
|
|
|
|
if not interval[2]: continue
|
|
|
+ if interval[2] == "sil" :
|
|
|
+ continue
|
|
|
+
|
|
|
#populates dataframe
|
|
|
temp_dict = {'speaker_id': tier.name, 'segment_onset': (interval[0]*1000 + audio_onset),
|
|
|
'segment_offset': (interval[1]*1000 + audio_onset), 'transcription': interval[2]}
|
|
@@ -82,5 +85,5 @@ df = pd.concat([df, orig_df_subset])
|
|
|
df.sort_values(by='segment_onset', inplace= True)
|
|
|
|
|
|
#exports to csv
|
|
|
-df.to_csv("{0}/BN.csv".format(output_path), mode = "x", na_rep= "NA", index= False)
|
|
|
+df.to_csv("{0}/BN32_010007-aligned.csv.csv".format(output_path), mode = "x", na_rep= "NA", index= False)
|
|
|
print("----------------SAVED!-----------------")
|