import glob
import json
import os
from sys import argv
# Write one manifest per dataset split to json/<split>.json. Each manifest is
# a one-element list holding the shard paths found under shard/<split>/ plus
# fixed metadata (source_lang, weight, name).

# open(..., 'w') does not create missing parent directories, so make sure the
# output directory exists before writing into it.
os.makedirs('json', exist_ok=True)

for split in ['train', 'valid']:
    # glob.glob returns matches in arbitrary order; sort them so the manifest
    # is identical from run to run and from machine to machine.
    shards = sorted(glob.glob(f'shard/{split}/*'))
    data = [{'source': shards, 'source_lang': 'en', 'weight': 1.0, 'name': '16gb-en'}]
    # Build the payload before opening the file so the previous manifest is
    # only truncated once there is something complete to write.
    with open(f'json/{split}.json', 'w', encoding='utf-8') as f:
        json.dump(data, f, indent=4)