import argparse import json argparse = argparse.ArgumentParser() argparse.add_argument('path', type=str) args = argparse.parse_args() assert args.path.endswith('.json') data = json.load(open(args.path)) writer = open(args.path.replace('.json', '.jsonl'), 'w') for idx, item in enumerate(data): conversations = item['conversations'] if conversations[0]['from'] == 'system': item['conversations'] = item['conversations'][1:] item['id'] = idx writer.write(json.dumps(item, ensure_ascii=False) + '\n') writer.close()