Browse Source

re-downloaded childes data

yaya-sy 1 year ago
parent
commit
9ad6226668

+ 0 - 3
code/download_childes_corpora.py

@@ -201,9 +201,6 @@ class DownloadChildCorpora :
                                                                     participant,
                                                                     backend,
                                                                     phonemize_child=phonemize_child) :
-                        # utterance = " ".join(phon for word in utterance.split("@") for phon in word.split("$") if phon)
-                        # utterance = self.utterances_cleaner.clean(utterance)
-                        utterance = self.utterances_cleaner.remove_multiple_spaces(utterance)
                         if not utterance :
                             continue
                         family_name = "_".join((corpus, family))

+ 1 - 1
datasets/childes_json_corpora/da.json

@@ -1 +1 @@
-../../.git/annex/objects/wM/J4/MD5E-s2940316--a8934de46f3d6e2096f15f7f096e92b0.json/MD5E-s2940316--a8934de46f3d6e2096f15f7f096e92b0.json
+../../.git/annex/objects/4W/Xg/MD5E-s2940316--507efe8e52bf5ce75f8df711d87d1f38.json/MD5E-s2940316--507efe8e52bf5ce75f8df711d87d1f38.json

+ 1 - 1
datasets/childes_json_corpora/de.json

@@ -1 +1 @@
-../../.git/annex/objects/gx/kK/MD5E-s46328318--41a6db192dc968c831890df8073f4797.json/MD5E-s46328318--41a6db192dc968c831890df8073f4797.json
+../../.git/annex/objects/Qk/zP/MD5E-s46328318--e1731bf1fa906c3d80fb05dd5d3d6f5a.json/MD5E-s46328318--e1731bf1fa906c3d80fb05dd5d3d6f5a.json

+ 1 - 1
datasets/childes_json_corpora/en.json

@@ -1 +1 @@
-../../.git/annex/objects/7V/1j/MD5E-s32520507--e5ba1e7c1bfa0ed106862bef65784026.json/MD5E-s32520507--e5ba1e7c1bfa0ed106862bef65784026.json
+../../.git/annex/objects/x6/Pz/MD5E-s32520507--791da7dcf5989c304d57ec99633ecb44.json/MD5E-s32520507--791da7dcf5989c304d57ec99633ecb44.json

+ 1 - 1
datasets/childes_json_corpora/et.json

@@ -1 +1 @@
-../../.git/annex/objects/k8/vv/MD5E-s8521517--d3661c988b3c4298fca6c6bf53a1e50c.json/MD5E-s8521517--d3661c988b3c4298fca6c6bf53a1e50c.json
+../../.git/annex/objects/Mm/k6/MD5E-s8521517--5ef935cd91ae29f412dc7c120ca40935.json/MD5E-s8521517--5ef935cd91ae29f412dc7c120ca40935.json

+ 1 - 1
datasets/childes_json_corpora/eu.json

@@ -1 +1 @@
-../../.git/annex/objects/43/3v/MD5E-s1472846--a18f0bbd772ee30982d7a6698dce2107.json/MD5E-s1472846--a18f0bbd772ee30982d7a6698dce2107.json
+../../.git/annex/objects/ww/Z9/MD5E-s1472846--a667b8b79f2e6776432563587ce07e5f.json/MD5E-s1472846--a667b8b79f2e6776432563587ce07e5f.json

+ 1 - 1
datasets/childes_json_corpora/pl.json

@@ -1 +1 @@
-../../.git/annex/objects/v0/qZ/MD5E-s17536902--3ae284fc8e315cdb5ff45ea0f68f5732.json/MD5E-s17536902--3ae284fc8e315cdb5ff45ea0f68f5732.json
+../../.git/annex/objects/fF/vZ/MD5E-s17536902--3ffc596ee76e6cc85c4f7d6ca8b3296d.json/MD5E-s17536902--3ffc596ee76e6cc85c4f7d6ca8b3296d.json

+ 1 - 1
datasets/childes_json_corpora/pt.json

@@ -1 +1 @@
-../../.git/annex/objects/6k/0G/MD5E-s6191044--0998067d5cdac6b67d219afaa092d48c.json/MD5E-s6191044--0998067d5cdac6b67d219afaa092d48c.json
+../../.git/annex/objects/Jp/Vg/MD5E-s6191044--27633d407e17573a948c99aaa1a3b697.json/MD5E-s6191044--27633d407e17573a948c99aaa1a3b697.json

+ 1 - 1
datasets/childes_json_corpora/sr.json

@@ -1 +1 @@
-../../.git/annex/objects/7J/1p/MD5E-s8135600--6a80c3fbc662975ad3c67a668ce7e062.json/MD5E-s8135600--6a80c3fbc662975ad3c67a668ce7e062.json
+../../.git/annex/objects/ww/Jw/MD5E-s8135600--6edc4ae6a907ab4d710bc1b8fe2b60ed.json/MD5E-s8135600--6edc4ae6a907ab4d710bc1b8fe2b60ed.json