Spaces:
Sleeping
Sleeping
File size: 542 Bytes
1b58092 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 |
import argparse
import json
def convert_json_to_jsonl(path):
    """Convert a JSON array file into a JSON Lines file written next to it.

    The input file must contain a JSON array of objects, each with a
    'conversations' list. For every object:

    * if the first conversation turn has ``'from' == 'system'``, that turn
      is dropped;
    * the object's 'id' is set to its zero-based position in the array;
    * the object is written as one line of JSON (non-ASCII kept verbatim).

    Args:
        path: Path of the input file; must end with '.json'.

    Returns:
        The path of the '.jsonl' file that was written.

    Raises:
        ValueError: If ``path`` does not end with '.json'.
    """
    suffix = '.json'
    if not path.endswith(suffix):
        raise ValueError(
            "expected a path ending in '.json', got {!r}".format(path)
        )
    # Swap only the trailing extension. str.replace would also rewrite any
    # earlier '.json' that happens to appear in a directory or file name.
    output_path = path[:-len(suffix)] + '.jsonl'

    # Explicit UTF-8 on both sides: ensure_ascii=False emits raw non-ASCII
    # characters, which a locale-dependent default encoding may not accept.
    with open(path, encoding='utf-8') as reader:
        data = json.load(reader)

    with open(output_path, 'w', encoding='utf-8') as writer:
        for idx, item in enumerate(data):
            conversations = item['conversations']
            # Guard against an empty conversation list before peeking at
            # the first turn.
            if conversations and conversations[0]['from'] == 'system':
                item['conversations'] = conversations[1:]
            item['id'] = idx
            writer.write(json.dumps(item, ensure_ascii=False) + '\n')
    return output_path


def main():
    """Parse the command line and convert the given '.json' file."""
    # Named `parser` so the `argparse` module itself is not shadowed.
    parser = argparse.ArgumentParser()
    parser.add_argument('path', type=str)
    args = parser.parse_args()
    # Validate explicitly instead of with `assert`, which is removed when
    # Python runs with -O.
    if not args.path.endswith('.json'):
        parser.error("path must end with '.json'")
    convert_json_to_jsonl(args.path)


if __name__ == '__main__':
    main()
|