|
@@ -24,10 +24,27 @@ class DataGenerator:
|
|
|
# print("case_data[2] ->",case_data[2])
|
|
|
# print("case_data[3] ->",case_data[3])
|
|
|
# print("case_data[4] ->",case_data[4])
|
|
|
- processed_data.append({
|
|
|
- "text": f"<human>: {case_data[1]}\n<bot>: {case_data[2]}\n{case_data[3]}\n{case_data[4]}",
|
|
|
- "metadata": {"source": f"wind_turbine_fault_cases {case_data[0]}"}
|
|
|
- })
|
|
|
+ # processed_data.append({
|
|
|
+ # "text": f"<human>: {case_data[1]}\n<bot>: {case_data[2]}\n{case_data[3]}\n{case_data[4]}",
|
|
|
+ # "metadata": {"source": f"wind_turbine_fault_cases {case_data[0]}"}
|
|
|
+ # })
|
|
|
+
|
|
|
+ # Once both the human and bot parts have been extracted, assemble a new JSON object
|
|
|
+ target_data = {
|
|
|
+ "question": case_data[1]+" 请予以故障诊断?",
|
|
|
+ "answer": "".join([case_data[2],"\n",case_data[3],"\n",case_data[4]]),
|
|
|
+ "prompt": [
|
|
|
+ {
|
|
|
+ "content": "\nRespond in the following format:\n<reasoning>\n...\n</reasoning>\n<answer>\n...\n</answer>\n",
|
|
|
+ "role": "system"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "content": case_data[1]+" 请予以故障诊断?",
|
|
|
+ "role": "user"
|
|
|
+ }
|
|
|
+ ]
|
|
|
+ }
|
|
|
+ processed_data.append(target_data)
|
|
|
return processed_data
|
|
|
|
|
|
def split_data(self, data):
|