瀏覽代碼

换用github jwjohns/unsloth-GRPO-qwen2.5 验证GRPO训练模型

zhouyang.xie 2 月之前
父節點
當前提交
5f6552665d
共有 1 個文件被更改,包括 1 次插入和 1 次删除
  1. 1 1
      src/train_model_github_jwjohns.py

+ 1 - 1
src/train_model_github_jwjohns.py

@@ -75,7 +75,7 @@ from modelscope.msdatasets import MsDataset
 def get_gsm8k_questions(split="train") -> Dataset:
 def get_gsm8k_questions(split="train") -> Dataset:
     # data = load_dataset('openai/gsm8k', 'main')[split]
     # data = load_dataset('openai/gsm8k', 'main')[split]
     data =  MsDataset.load('openai-mirror/gsm8k', subset_name='main', split=split)
     data =  MsDataset.load('openai-mirror/gsm8k', subset_name='main', split=split)
-    os.makedirs(f'../data/temp/',exist_ok=False)
+    os.makedirs(f'../data/temp/',exist_ok=True)
     # Save original datasets to JSONL
     # Save original datasets to JSONL
     with open(f'../data/temp/gsm8k_original_{split}.jsonl', 'w') as f:
     with open(f'../data/temp/gsm8k_original_{split}.jsonl', 'w') as f:
         for item in data:
         for item in data: