"""Match classifications with extracted chunks.

Command-line script: reads a classifications CSV and one or more chunk
CSVs, joins them, and writes the joined table to an output CSV.

Usage:
    script.py CLASSIFICATIONS OUTPUT --chunks CHUNKS [CHUNKS ...]
"""
import argparse

import pandas as pd


def main(argv=None):
    """Merge a classifications file with the listed chunk files.

    The chunk files are concatenated into a single table, which is then
    merged with the classifications on
    ``classifications.subject_id == chunks.zooniverse_id``. The merge uses
    pandas' default join type (inner), so only rows with a match on both
    sides reach the output. The result is written without the index column.

    Args:
        argv: Argument list to parse. ``None`` (the default) makes argparse
            read ``sys.argv[1:]``, which is what happens when the file is
            run as a script.

    Raises:
        SystemExit: Raised by argparse when the arguments are invalid.
        KeyError: Raised by pandas when a merge key column is missing.
    """
    parser = argparse.ArgumentParser(
        description='match classifications with extracted chunks'
    )
    parser.add_argument('classifications', help='classifications file')
    parser.add_argument('output', help='output')
    parser.add_argument(
        '--chunks', help='list of chunks', nargs='+', required=True
    )
    args = parser.parse_args(argv)

    classifications = pd.read_csv(args.classifications)

    # Stack every chunk file into one table before joining.
    chunks = pd.concat([pd.read_csv(path) for path in args.chunks])

    merged = classifications.merge(
        chunks,
        left_on='subject_id',
        right_on='zooniverse_id',
    )
    merged.to_csv(args.output, index=False)


if __name__ == '__main__':
    main()