|
@@ -75,7 +75,7 @@ from modelscope.msdatasets import MsDataset
|
|
|
def get_gsm8k_questions(split="train") -> Dataset:
|
|
|
# data = load_dataset('openai/gsm8k', 'main')[split]
|
|
|
data = MsDataset.load('openai-mirror/gsm8k', subset_name='main', split=split)
|
|
|
- os.makedirs(f'../data/temp/',exist_ok=False)
|
|
|
+ os.makedirs(f'../data/temp/',exist_ok=True)
|
|
|
# Save original datasets to JSONL
|
|
|
with open(f'../data/temp/gsm8k_original_{split}.jsonl', 'w') as f:
|
|
|
for item in data:
|