|
@@ -171,8 +171,8 @@ class ModelTrainer:
|
|
|
# train_dataset, batch_size=1, shuffle=True, pin_memory=True
|
|
|
# )
|
|
|
|
|
|
- # 释放未使用的显存
|
|
|
- torch.cuda.empty_cache()
|
|
|
+ # # 释放未使用的显存
|
|
|
+ # torch.cuda.empty_cache()
|
|
|
|
|
|
training_args = GRPOConfig(
|
|
|
use_vllm = False, # use vLLM for fast inference!
|