# Uploaded by bingqin111 using huggingface_hub (commit 677cc91, verified).
import json
# Hard-coded dataset locations used when this file is run as a script.
INPUT_PATH = '/home/hsichen/LLaMA-Factory/data/chaiting/pk_2087.json'
OUTPUT_PATH = '/home/hsichen/LLaMA-Factory/data/chaiting/sft_2087.json'

# Exceptions that indicate a record does not have the expected structure
# (missing key, too few turns, a non-dict / non-string where one is needed).
MALFORMED_RECORD_ERRORS = (KeyError, IndexError, TypeError, AttributeError)


def build_sft_record(item):
    """Return one converted record built from *item*.

    The text before the first ':' in the third conversation turn
    (``item['conversations'][2]['value']``) is taken as the bot name and
    prepended, as ``"<name>: "``, to the ``'value'`` of ``item['chosen']``.
    The prefixed chosen turn is then appended to the conversation turns.

    The input record is not modified; a copy of the chosen turn is used.

    Raises:
        KeyError, IndexError, TypeError, AttributeError: if *item* does not
            have the structure described above.
    """
    conversations = item['conversations']
    bot_name = conversations[2]['value'].split(':')[0]
    chosen = item['chosen']
    # Copy instead of assigning into item['chosen'] so the loaded data stays
    # untouched; key order of the chosen turn is preserved.
    prefixed_chosen = {**chosen, 'value': bot_name + ': ' + chosen['value']}
    return {'conversations': conversations + [prefixed_chosen]}


def convert_records(records):
    """Convert every well-formed record in *records*, skipping the rest.

    Malformed records are reported on stdout (their conversations followed
    by a separator line) and left out of the result.

    Returns:
        A list of ``{'conversations': [...]}`` dicts, in input order.
    """
    converted = []
    for item in records:
        try:
            converted.append(build_sft_record(item))
        except MALFORMED_RECORD_ERRORS:
            # The record may be malformed precisely because 'conversations'
            # is missing, so the report itself must not index into it.
            if isinstance(item, dict):
                print(item.get('conversations'))
            else:
                print(item)
            print('###############\n\n')
    return converted


def main():
    """Load INPUT_PATH, convert its records and write them to OUTPUT_PATH."""
    # Explicit UTF-8: the output is written with ensure_ascii=False, so the
    # platform default encoding must not be relied upon.
    with open(INPUT_PATH, 'r', encoding='utf-8') as f:
        data = json.load(f)

    converted_data = convert_records(data)

    with open(OUTPUT_PATH, 'w', encoding='utf-8') as f:
        json.dump(converted_data, f, ensure_ascii=False)
    print(f"Converted data saved to {OUTPUT_PATH}, length: {len(converted_data)}")


if __name__ == '__main__':
    main()