in atis.py [0:0]
def sample_data(args):
    """Write a uniformly sampled subset of each language's training file.

    For every language code in the comma-separated ``args['languages']``,
    this reads ``matis_{lang}_train_squad.json`` from the output directory,
    draws ``args['ex_uniform']`` paragraphs without replacement from the
    first entry of its ``data`` list, and writes the result to
    ``matis_{lang}_train_squad_sample_{ex_uniform}.json`` in the same
    directory. The ``version`` field and the first entry's ``title`` are
    copied over unchanged; any further entries in ``data`` are not included.

    Sampling uses the module-level ``random`` generator, so seed it
    beforehand for reproducible output.

    Args:
        args: Options object supporting ``args[name]`` lookup. Reads
            ``ex_per_slot`` (must be -1), ``languages``, ``ex_uniform`` and
            ``output_dir``. ``output_dir`` may be exposed either as an
            attribute or as a key.

    Raises:
        AssertionError: If ``args['ex_per_slot']`` is not -1.
        ValueError: From ``random.sample`` when ``ex_uniform`` is negative
            or larger than the number of available paragraphs.
    """
    # NOTE(review): presumably -1 means "per-slot sampling disabled" -- confirm
    # against the argument parser.
    assert args['ex_per_slot'] == -1, 'ex_per_slot must be -1'

    # Accept output_dir as an attribute or as a key so that both plain dicts
    # and attribute-style option objects work. Attribute access is tried
    # first so objects that already expose it behave exactly as before.
    try:
        output_dir = args.output_dir
    except AttributeError:
        output_dir = args['output_dir']

    for lang in args['languages'].split(','):
        sample_size = args['ex_uniform']
        source_path = os.path.join(output_dir, f'matis_{lang}_train_squad.json')
        target_path = os.path.join(
            output_dir,
            f'matis_{lang}_train_squad_sample_{sample_size}.json',
        )

        with open(source_path, 'r', encoding='utf-8') as data_f:
            data = json.load(data_f)

        sampled = {
            'version': data['version'],
            'data': [{
                'title': data['data'][0]['title'],
                'paragraphs': random.sample(
                    data['data'][0]['paragraphs'], sample_size
                ),
            }],
        }

        # Open the output only once the sample exists, so a failure while
        # reading or sampling does not leave an empty file behind.
        with open(target_path, 'w', encoding='utf-8') as out_f:
            json.dump(sampled, out_f, indent=4)