Prechádzať zdrojové kódy

遵循面向对象思想重构train_model_grpo.py

zhouyang.xie pred 3 mesiacmi
rodič
commit
c7b5cc14c5
1 zmenený súbor s 1 pridaním a 1 odobraním
  1. 1 1
      src/train_model_grpo_v1.1.py

+ 1 - 1
src/train_model_grpo_v1.1.py

@@ -29,7 +29,7 @@ class ModelTrainer:
         self.gpu_memory_utilization = config.gpu_memory_utilization
         # 初始化 BERT 模型和分词器
         self.tokenizer = LongformerTokenizer.from_pretrained(f'../models/allenai/longformer-base-4096')
-        self.bert_model = LongformerModel.from_pretrained(f'../models/allenai/longformer-base-4096')
+        self.longformer_model = LongformerModel.from_pretrained(f'../models/allenai/longformer-base-4096')
 
     def load_model(self):
         """