|
@@ -69,6 +69,25 @@ def _get_children(children_path):
|
|
|
return data
|
|
|
|
|
|
|
|
|
+#ac2pl
|
|
|
def _get_correspondance(correspondance_path):
    """
    Load the table of correspondances across child IDs (phone numbers).

    Returns the content of `correspondance.csv` as a DataFrame, or an empty
    DataFrame with the columns `number` and `original` when the file is
    missing, unreadable, empty or cannot be parsed as CSV.

    :param correspondance_path: Path to the `correspondance.csv` metadata file
    :type correspondance_path: str
    :return: dataframe of correspondances across child ID (phone numbers) or empty dataframe
    :rtype: pandas.DataFrame
    """
    try:
        data = pd.read_csv(correspondance_path)
        # TODO: check that data has the wanted columns?
    except (OSError, pd.errors.EmptyDataError, pd.errors.ParserError):
        # Only file/CSV problems fall back to an empty table; anything else
        # (KeyboardInterrupt, programming errors, ...) must propagate instead
        # of being silently hidden by a bare ``except``.
        data = pd.DataFrame(columns=['number', 'original'])
    return data
|
|
|
+
|
|
|
+
|
|
|
def _build_recording_metadata(recordings_path, recording, experiment, recording_device_type):
|
|
|
"""
|
|
|
Return the metadata corresponding to a given file (date, time, duration, etc.)
|
|
@@ -156,15 +175,20 @@ def import_children(project_path, experiment):
|
|
|
"""
|
|
|
recordings_metadata_path = os.path.join(project_path, 'metadata', 'recordings.csv')
|
|
|
children_metadata_path = os.path.join(project_path, 'metadata', 'children.csv')
|
|
|
+ correspondance_metadata_path = os.path.join(project_path, 'metadata', 'correspondance.csv') #ac2lp
|
|
|
|
|
|
recordings = _get_recordings(recordings_metadata_path)
|
|
|
children = _get_children(children_metadata_path)
|
|
|
children_count = len(children)
|
|
|
+ children = _get_correspondance(correspondance_metadata_path) #ac2pl
|
|
|
|
|
|
child_id_recordings = set(recordings['child_id'])
|
|
|
missing_children = child_id_recordings - set(children['child_id'])
|
|
|
|
|
|
+
|
|
|
for child_id in missing_children:
|
|
|
+ # ac2lp check if children may not correspond to another telephone number
|
|
|
+ # add: if child_id in correspondance['original'] then redefine child_id as the right cell in correspondance['original'] else what follows
|
|
|
child_metadata = {
|
|
|
'experiment': experiment,
|
|
|
'child_id': child_id,
|