initial commit

This commit is contained in:
wea_ondara
2024-04-17 18:58:50 +02:00
commit 41d5b4f591
22 changed files with 1611 additions and 0 deletions

12
utils/download_dataset.py Normal file
View File

@@ -0,0 +1,12 @@
import pickle
from conversation import mkdir
from datasets import load_dataset
# Identifier of the dataset passed to `datasets.load_dataset`.
dataset_id = 'OpenAssistant/oasst2'

# Create the very directory the pickle is written into. The script used to
# create '../datasets' while writing to './datasets/', so open() failed with
# FileNotFoundError unless './datasets' happened to exist already.
# NOTE(review): assumes `conversation.mkdir` creates the directory when it is
# missing and tolerates an existing one -- confirm against its definition.
dataset_dir = './datasets'
mkdir(dataset_dir)

# The id contains '/', which would otherwise be read as a path separator, so
# it is flattened to '_' to form a single file name.
pickle_filename = dataset_dir + '/' + dataset_id.replace('/', '_') + '.pickle'

# Fetch the dataset and serialize the returned object as-is.
dataset = load_dataset(dataset_id)
with open(pickle_filename, 'wb') as file:
    pickle.dump(dataset, file)
print('Saved as pickle to ' + pickle_filename)