BaseDataTrans.py 5.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116
  1. import datetime
  2. import traceback
  3. from etl.common.ClearData import ClearData
  4. from etl.common.PathsAndTable import PathsAndTable
  5. from etl.common.SaveToDb import SaveToDb
  6. from etl.common.UnzipAndRemove import UnzipAndRemove
  7. from service.plt_service import get_all_wind, update_trans_status_success, update_trans_status_error, \
  8. update_trans_status_running
  9. from utils.file.trans_methods import read_excel_files
  10. from utils.log.trans_log import trans_print, set_trance_id
  11. class BaseDataTrans(object):
  12. def __init__(self, data: dict = None, save_db=True, step=0, end=4):
  13. self.batch_no = data['batch_code']
  14. self.batch_name = data['batch_name']
  15. self.read_type = data['transfer_type']
  16. self.read_path = data['transfer_addr']
  17. self.field_code = data['field_code']
  18. self.field_name = data['field_name']
  19. self.save_zip = False
  20. self.step = step
  21. self.end = end
  22. self.wind_col_trans, self.rated_power_and_cutout_speed_map = get_all_wind(self.field_code)
  23. self.batch_count = 100000
  24. self.save_db = save_db
  25. self.filed_conf = self.get_filed_conf()
  26. self.pathsAndTable = PathsAndTable(self.batch_no, self.batch_name, self.read_path, self.field_name,
  27. self.read_type, save_db, self.save_zip)
  28. def get_filed_conf(self):
  29. raise NotImplementedError("需要实现 获取点检表 方法")
  30. # 第一步 清理数据
  31. def clean_file_and_db(self):
  32. clean_data = ClearData(self.pathsAndTable)
  33. clean_data.run()
  34. # 第二步 解压 移动到临时文件
  35. def unzip_or_remove_to_tmp_dir(self):
  36. # 解压并删除
  37. unzip_and_remove = UnzipAndRemove(self.pathsAndTable)
  38. unzip_and_remove.run()
  39. # 第三步 读取 并 保存到临时文件
  40. def read_and_save_tmp_file(self):
  41. raise NotImplementedError("第三步未做实现")
  42. # 第四步 统计 并 保存到正式文件
  43. def statistics_and_save_to_file(self):
  44. raise NotImplementedError("第四步未做实现")
  45. # 第五步 保存到数据库
  46. def save_to_db(self):
  47. save_to_db = SaveToDb(self.pathsAndTable, self.batch_count)
  48. save_to_db.run()
  49. # 最后更新执行程度
  50. def update_exec_progress(self):
  51. update_trans_status_success(self.batch_no, self.read_type,
  52. len(read_excel_files(self.pathsAndTable.get_save_path())),
  53. None, None, None, None, self.save_db)
  54. def run(self):
  55. total_begin = datetime.datetime.now()
  56. try:
  57. trance_id = '-'.join([self.batch_no, self.field_name, self.read_type])
  58. set_trance_id(trance_id)
  59. update_trans_status_running(self.batch_no, self.read_type, self.save_db)
  60. if self.step <= 0 and self.end >= 0:
  61. begin = datetime.datetime.now()
  62. trans_print("开始清理数据,临时文件夹:", self.pathsAndTable.get_tmp_path())
  63. self.clean_file_and_db()
  64. trans_print("清理数据结束,耗时:", datetime.datetime.now() - begin, "总耗时:", datetime.datetime.now() - begin)
  65. if self.step <= 1 and self.end >= 1:
  66. begin = datetime.datetime.now()
  67. trans_print("开始解压移动文件")
  68. self.unzip_or_remove_to_tmp_dir()
  69. trans_print("解压移动文件结束:耗时:", datetime.datetime.now() - begin, "总耗时:", datetime.datetime.now() - begin)
  70. if self.step <= 2 and self.end >= 2:
  71. begin = datetime.datetime.now()
  72. trans_print("开始保存数据到临时文件")
  73. self.read_and_save_tmp_file()
  74. trans_print("保存数据到临时文件结束,耗时:", datetime.datetime.now() - begin, "总耗时:", datetime.datetime.now() - begin)
  75. if self.step <= 3 and self.end >= 3:
  76. begin = datetime.datetime.now()
  77. trans_print("开始保存数据到正式文件")
  78. self.statistics_and_save_to_file()
  79. trans_print("保存数据到正式文件结束,耗时:", datetime.datetime.now() - begin, "总耗时:", datetime.datetime.now() - begin)
  80. if self.step <= 4 and self.end >= 4:
  81. begin = datetime.datetime.now()
  82. trans_print("开始保存到数据库,是否存库:", self.pathsAndTable.save_db)
  83. self.save_to_db()
  84. trans_print("保存到数据结束,耗时:", datetime.datetime.now() - begin, "总耗时:", datetime.datetime.now() - begin)
  85. self.update_exec_progress()
  86. except Exception as e:
  87. trans_print(traceback.format_exc())
  88. update_trans_status_error(self.batch_no, self.read_type, str(e), self.save_db)
  89. raise e
  90. finally:
  91. # self.pathsAndTable.delete_tmp_files()
  92. trans_print("执行结束,总耗时:", str(datetime.datetime.now() - total_begin))
  93. if __name__ == '__main__':
  94. test = BaseDataTrans(save_db=False, batch_no="WOF053600062-WOB000010", read_type="fault")
  95. test.run()