|
@@ -54,7 +54,7 @@ class DownloadChildCorpora :
|
|
|
chat,
|
|
|
participants_to_consider: List[str],
|
|
|
phonemize_child: bool,
|
|
|
- ) -> Generator[str, str, float, List[str]]:
|
|
|
+ ) -> Generator:
|
|
|
"""
|
|
|
Get the data for each participant. Here, the data for each participant\
|
|
|
is the set of utterances produced by this participant at all child ages.
|
|
@@ -201,7 +201,8 @@ class DownloadChildCorpora :
|
|
|
participant,
|
|
|
backend,
|
|
|
phonemize_child=phonemize_child) :
|
|
|
- utterance = self.utterances_cleaner.clean(utterance)
|
|
|
+ # utterance = " ".join(phon for word in utterance.split("@") for phon in word.split("$") if phon)
|
|
|
+ # utterance = self.utterances_cleaner.clean(utterance)
|
|
|
utterance = self.utterances_cleaner.remove_multiple_spaces(utterance)
|
|
|
if not utterance :
|
|
|
continue
|