tf_cnn_train.py 5.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123
  1. #!/usr/bin/env python
  2. # -*- coding: utf-8 -*-
  3. # time: 2024/5/6 13:25
  4. # file: tf_cnn_train.py
  5. # author: David
  6. # company: shenyang JY
  7. import json, copy
  8. import numpy as np
  9. from flask import Flask, request, g
  10. import traceback
  11. import logging, argparse
  12. from data_processing.data_operation.data_handler import DataHandler
  13. import time, yaml
  14. from copy import deepcopy
  15. from models_processing.model_tf.tf_cnn import CNNHandler
  16. from common.database_dml_koi import *
  17. import matplotlib.pyplot as plt
  18. from common.logs import Log
  19. from common.data_utils import deep_update
  20. # logger = logging.getLogger()
  21. logger = Log('tf_cnn').logger
  22. np.random.seed(42) # NumPy随机种子
  23. app = Flask('tf_cnn_train——service')
  24. current_dir = os.path.dirname(os.path.abspath(__file__))
  25. with open(os.path.join(current_dir, 'cnn.yaml'), 'r', encoding='utf-8') as f:
  26. global_config = yaml.safe_load(f) # 只读的全局配置
  27. @app.before_request
  28. def update_config():
  29. # ------------ 整理参数,整合请求参数 ------------
  30. # 深拷贝全局配置 + 合并请求参数
  31. current_config = deepcopy(global_config)
  32. request_args = request.values.to_dict()
  33. # features参数规则:1.有传入,解析,覆盖 2. 无传入,不覆盖,原始值
  34. request_args['features'] = request_args['features'].split(',') if 'features' in request_args else current_config['features']
  35. current_config = deep_update(current_config, request_args)
  36. # 存储到请求上下文
  37. g.opt = argparse.Namespace(**current_config)
  38. g.dh = DataHandler(logger, current_config) # 每个请求独立实例
  39. g.cnn = CNNHandler(logger, current_config)
  40. @app.route('/tf_cnn_training', methods=['POST'])
  41. def model_training_cnn():
  42. # 获取程序开始时间
  43. start_time = time.time()
  44. result = {}
  45. success = 0
  46. dh = g.dh
  47. cnn = g.cnn
  48. args = deepcopy(g.opt.__dict__)
  49. logger.info("Program starts execution!")
  50. try:
  51. # ------------ 获取数据,预处理训练数据 ------------
  52. train_data = get_data_from_mongo(args)
  53. train_x, train_y, valid_x, valid_y, scaled_train_bytes, scaled_target_bytes, scaled_cap = dh.train_data_handler(train_data)
  54. cnn.opt.Model['input_size'] = len(dh.opt.features)
  55. cnn.opt.cap = round(scaled_cap, 2)
  56. # ------------ 训练模型,保存模型 ------------
  57. # 1. 如果是加强训练模式,先加载预训练模型特征参数,再预处理训练数据
  58. # 2. 如果是普通模式,先预处理训练数据,再根据训练数据特征加载模型
  59. logger.info("---------cap归一化:{}".format(cnn.opt.cap))
  60. model = cnn.train_init() if cnn.opt.Model['add_train'] else cnn.get_keras_model(cnn.opt)
  61. if cnn.opt.Model['add_train']:
  62. if model:
  63. feas = json.loads(cnn.model_params)['features']
  64. if set(feas).issubset(set(dh.opt.features)):
  65. dh.opt.features = list(feas)
  66. train_x, train_y, valid_x, valid_y, scaled_train_bytes, scaled_target_bytes, scaled_cap = dh.train_data_handler(train_data)
  67. else:
  68. model = cnn.get_keras_model(cnn.opt)
  69. logger.info("训练数据特征,不满足,加强训练模型特征")
  70. else:
  71. model = cnn.get_keras_model(cnn.opt)
  72. bp_model = cnn.training(model, [train_x, train_y, valid_x, valid_y])
  73. args['Model']['features'] = ','.join(dh.opt.features)
  74. args['params'] = json.dumps(args)
  75. args['descr'] = '测试'
  76. args['gen_time'] = time.strftime('%Y-%m-%d %H:%M:%S', time.localtime(time.time()))
  77. insert_trained_model_into_mongo(bp_model, args)
  78. insert_scaler_model_into_mongo(scaled_train_bytes, scaled_target_bytes, args)
  79. success = 1
  80. except Exception as e:
  81. my_exception = traceback.format_exc()
  82. my_exception.replace("\n", "\t")
  83. result['msg'] = my_exception
  84. end_time = time.time()
  85. result['success'] = success
  86. result['args'] = args
  87. result['start_time'] = time.strftime('%Y-%m-%d %H:%M:%S', time.localtime(start_time))
  88. result['end_time'] = time.strftime('%Y-%m-%d %H:%M:%S', time.localtime(end_time))
  89. print("Program execution ends!")
  90. return result
  91. if __name__ == "__main__":
  92. print("Program starts execution!")
  93. from waitress import serve
  94. serve(app, host="0.0.0.0", port=10113,
  95. threads=8, # 指定线程数(默认4,根据硬件调整)
  96. channel_timeout=600 # 连接超时时间(秒)
  97. )
  98. # print("server start!")
  99. # args_dict = {"mongodb_database": 'david_test', 'scaler_table': 'j00083_scaler', 'model_name': 'bp1.0.test',
  100. # 'model_table': 'j00083_model', 'mongodb_read_table': 'j00083', 'col_time': 'dateTime',
  101. # 'features': 'speed10,direction10,speed30,direction30,speed50,direction50,speed70,direction70,speed90,direction90,speed110,direction110,speed150,direction150,speed170,direction170'}
  102. # args_dict['features'] = args_dict['features'].split(',')
  103. # arguments.update(args_dict)
  104. # dh = DataHandler(logger, arguments)
  105. # cnn = CNNHandler(logger)
  106. # opt = argparse.Namespace(**arguments)
  107. # opt.Model['input_size'] = len(opt.features)
  108. # train_data = get_data_from_mongo(args_dict)
  109. # train_x, valid_x, train_y, valid_y, scaled_train_bytes, scaled_target_bytes = dh.train_data_handler(train_data, opt)
  110. # cnn_model = cnn.training(opt, [train_x, train_y, valid_x, valid_y])
  111. #
  112. # args_dict['gen_time'] = time.strftime('%Y-%m-%d %H:%M:%S', time.localtime(time.time()))
  113. # args_dict['params'] = arguments
  114. # args_dict['descr'] = '测试'
  115. # insert_trained_model_into_mongo(cnn_model, args_dict)
  116. # insert_scaler_model_into_mongo(scaled_train_bytes, scaled_target_bytes, args_dict)