6 months ago · e30d503239
--- a/common/database_dml.py
+++ b/common/database_dml.py
@@ -0,0 +1,214 @@
 
															+from pymongo import MongoClient, UpdateOne
														
 
															+import pandas as pd
														
 
															+from sqlalchemy import create_engine
														
 
															+import pickle
														
 
															+from io import BytesIO
														
 
															+import joblib
														
 
															+import h5py
														
 
															+import tensorflow as tf
														
 
															+
														
 
															+def get_data_from_mongo(args):
														
 
															+    mongodb_connection = "mongodb://root:sdhjfREWFWEF23e@192.168.1.43:30000/"
														
 
															+    mongodb_database = args['mongodb_database']
														
 
															+    mongodb_read_table = args['mongodb_read_table']
														
 
															+    query_dict = {}
														
 
															+    if 'timeBegin' in args.keys():
														
 
															+        timeBegin = args['timeBegin']
														
 
															+        query_dict.update({"$gte": timeBegin})
														
 
															+    if 'timeEnd' in args.keys():
														
 
															+        timeEnd = args['timeEnd']
														
 
															+        query_dict.update({"$lte": timeEnd})
														
 
															+
														
 
															+    client = MongoClient(mongodb_connection)
														
 
															+    # 选择数据库（如果数据库不存在，MongoDB 会自动创建）
														
 
															+    db = client[mongodb_database]
														
 
															+    collection = db[mongodb_read_table]  # 集合名称
														
 
															+    if len(query_dict) != 0:
														
 
															+        query = {"dateTime": query_dict}
														
 
															+        cursor = collection.find(query)
														
 
															+    else:
														
 
															+        cursor = collection.find()
														
 
															+    data = list(cursor)
														
 
															+    df = pd.DataFrame(data)
														
 
															+    # 4. 删除 _id 字段（可选）
														
 
															+    if '_id' in df.columns:
														
 
															+        df = df.drop(columns=['_id'])
														
 
															+    client.close()
														
 
															+    return df
														
 
															+
														
 
															+
														
 
															+def get_df_list_from_mongo(args):
														
 
															+    mongodb_connection,mongodb_database,mongodb_read_table = "mongodb://root:sdhjfREWFWEF23e@192.168.1.43:30000/",args['mongodb_database'],args['mongodb_read_table'].split(',')
														
 
															+    df_list = []
														
 
															+    client = MongoClient(mongodb_connection)
														
 
															+    # 选择数据库（如果数据库不存在，MongoDB 会自动创建）
														
 
															+    db = client[mongodb_database]
														
 
															+    for table in mongodb_read_table:
														
 
															+        collection = db[table]  # 集合名称
														
 
															+        data_from_db = collection.find()  # 这会返回一个游标（cursor）
														
 
															+        # 将游标转换为列表，并创建 pandas DataFrame
														
 
															+        df = pd.DataFrame(list(data_from_db))
														
 
															+        if '_id' in df.columns:
														
 
															+            df = df.drop(columns=['_id'])
														
 
															+        df_list.append(df)
														
 
															+    client.close()
														
 
															+    return df_list
														
 
															+
														
 
															+def insert_data_into_mongo(res_df, args):
														
 
															+    """
														
 
															+    插入数据到 MongoDB 集合中，可以选择覆盖、追加或按指定的 key 进行更新插入。
														
 
															+
														
 
															+    参数:
														
 
															+    - res_df: 要插入的 DataFrame 数据
														
 
															+    - args: 包含 MongoDB 数据库和集合名称的字典
														
 
															+    - overwrite: 布尔值，True 表示覆盖，False 表示追加
														
 
															+    - update_keys: 列表，指定用于匹配的 key 列，如果存在则更新，否则插入 'col1','col2'
														
 
															+    """
														
 
															+    mongodb_connection = "mongodb://root:sdhjfREWFWEF23e@192.168.1.43:30000/"
														
 
															+    mongodb_database = args['mongodb_database']
														
 
															+    mongodb_write_table = args['mongodb_write_table']
														
 
															+    overwrite = 1
														
 
															+    update_keys = None
														
 
															+    if 'overwrite' in args.keys():
														
 
															+        overwrite = int(args['overwrite'])
														
 
															+    if 'update_keys' in args.keys():
														
 
															+        update_keys = args['update_keys'].split(',')
														
 
															+
														
 
															+    client = MongoClient(mongodb_connection)
														
 
															+    db = client[mongodb_database]
														
 
															+    collection = db[mongodb_write_table]
														
 
															+
														
 
															+    # 覆盖模式：删除现有集合
														
 
															+    if overwrite:
														
 
															+        if mongodb_write_table in db.list_collection_names():
														
 
															+            collection.drop()
														
 
															+            print(f"Collection '{mongodb_write_table}' already exists, deleted successfully!")
														
 
															+
														
 
															+    # 将 DataFrame 转为字典格式
														
 
															+    data_dict = res_df.to_dict("records")  # 每一行作为一个字典
														
 
															+
														
 
															+    # 如果没有数据，直接返回
														
 
															+    if not data_dict:
														
 
															+        print("No data to insert.")
														
 
															+        return
														
 
															+
														
 
															+    # 如果指定了 update_keys，则执行 upsert（更新或插入）
														
 
															+    if update_keys and not overwrite:
														
 
															+        operations = []
														
 
															+        for record in data_dict:
														
 
															+            # 构建查询条件，用于匹配要更新的文档
														
 
															+            query = {key: record[key] for key in update_keys}
														
 
															+            operations.append(UpdateOne(query, {'$set': record}, upsert=True))
														
 
															+
														
 
															+        # 批量执行更新/插入操作
														
 
															+        if operations:
														
 
															+            result = collection.bulk_write(operations)
														
 
															+            print(f"Matched: {result.matched_count}, Upserts: {result.upserted_count}")
														
 
															+    else:
														
 
															+        # 追加模式：直接插入新数据
														
 
															+        collection.insert_many(data_dict)
														
 
															+        print("Data inserted successfully!")
														
 
															+
														
 
															+
														
 
															+def get_data_fromMysql(params):
														
 
															+    mysql_conn = params['mysql_conn']
														
 
															+    query_sql = params['query_sql']
														
 
															+    #数据库读取实测气象
														
 
															+    engine = create_engine(f"mysql+pymysql://{mysql_conn}")
														
 
															+    # 定义SQL查询
														
 
															+    env_df = pd.read_sql_query(query_sql, engine)
														
 
															+    return env_df
														
 
															+
														
 
															+
														
 
															+def insert_pickle_model_into_mongo(model, args):
														
 
															+    mongodb_connection, mongodb_database, mongodb_write_table, model_name = "mongodb://root:sdhjfREWFWEF23e@192.168.1.43:30000/", \
														
 
															+    args['mongodb_database'], args['mongodb_write_table'], args['model_name']
														
 
															+    client = MongoClient(mongodb_connection)
														
 
															+    db = client[mongodb_database]
														
 
															+    # 序列化模型
														
 
															+    model_bytes = pickle.dumps(model)
														
 
															+    model_data = {
														
 
															+        'model_name': model_name,
														
 
															+        'model': model_bytes,  # 将模型字节流存入数据库
														
 
															+    }
														
 
															+    print('Training completed!')
														
 
															+
														
 
															+    if mongodb_write_table in db.list_collection_names():
														
 
															+        db[mongodb_write_table].drop()
														
 
															+        print(f"Collection '{mongodb_write_table} already exist, deleted successfully!")
														
 
															+    collection = db[mongodb_write_table]  # 集合名称
														
 
															+    collection.insert_one(model_data)
														
 
															+    print("model inserted successfully!")
														
 
															+
														
 
															+
														
 
															+def insert_h5_model_into_mongo(model,feature_scaler_bytes,target_scaler_bytes ,args):
														
 
															+    mongodb_connection,mongodb_database,scaler_table,model_table,model_name = ("mongodb://root:sdhjfREWFWEF23e@192.168.1.43:30000/",
														
 
															+                                args['mongodb_database'],args['scaler_table'],args['model_table'],args['model_name'])
														
 
															+    client = MongoClient(mongodb_connection)
														
 
															+    db = client[mongodb_database]
														
 
															+    collection = db[scaler_table]  # 集合名称
														
 
															+    # Save the scalers in MongoDB as binary data
														
 
															+    collection.insert_one({
														
 
															+        "feature_scaler": feature_scaler_bytes.read(),
														
 
															+        "target_scaler": target_scaler_bytes.read()
														
 
															+    })
														
 
															+    print("model inserted successfully!")
														
 
															+    model_table = db[model_table]
														
 
															+    # 创建 BytesIO 缓冲区
														
 
															+    model_buffer = BytesIO()
														
 
															+    # 将模型保存为 HDF5 格式到内存 (BytesIO)
														
 
															+    model.save(model_buffer, save_format='h5')
														
 
															+    # 将指针移到缓冲区的起始位置
														
 
															+    model_buffer.seek(0)
														
 
															+    # 获取模型的二进制数据
														
 
															+    model_data = model_buffer.read()
														
 
															+    # 将模型保存到 MongoDB
														
 
															+    model_table.insert_one({
														
 
															+        "model_name": model_name,
														
 
															+        "model_data": model_data
														
 
															+    })
														
 
															+    print("模型成功保存到 MongoDB！")
														
 
															+
														
 
															+
														
 
															+def get_h5_model_from_mongo(args):
														
 
															+    mongodb_connection,mongodb_database,model_table,model_name = "mongodb://root:sdhjfREWFWEF23e@192.168.1.43:30000/",args['mongodb_database'],args['model_table'],args['model_name']
														
 
															+    client = MongoClient(mongodb_connection)
														
 
															+    # 选择数据库（如果数据库不存在，MongoDB 会自动创建）
														
 
															+    db = client[mongodb_database]
														
 
															+    collection = db[model_table]  # 集合名称
														
 
															+
														
 
															+     # 查询 MongoDB 获取模型数据
														
 
															+    model_doc = collection.find_one({"model_name": model_name})
														
 
															+    if model_doc:
														
 
															+        model_data = model_doc['model_data']  # 获取模型的二进制数据
														
 
															+        # 将二进制数据加载到 BytesIO 缓冲区
														
 
															+        model_buffer = BytesIO(model_data)
														
 
															+        # 从缓冲区加载模型
														
 
															+         # 使用 h5py 和 BytesIO 从内存中加载模型
														
 
															+        with h5py.File(model_buffer, 'r') as f:
														
 
															+            model = tf.keras.models.load_model(f)
														
 
															+        print(f"{model_name}模型成功从 MongoDB 加载！")
														
 
															+        client.close()
														
 
															+        return model
														
 
															+    else:
														
 
															+        print(f"未找到model_name为 {model_name} 的模型。")
														
 
															+        client.close()
														
 
															+        return None
														
 
															+
														
 
															+
														
 
															+def get_scaler_model_from_mongo(args):
														
 
															+    mongodb_connection, mongodb_database, scaler_table, = ("mongodb://root:sdhjfREWFWEF23e@192.168.1.43:30000/",
														
 
															+                                                           args['mongodb_database'], args['scaler_table'])
														
 
															+    client = MongoClient(mongodb_connection)
														
 
															+    # 选择数据库（如果数据库不存在，MongoDB 会自动创建）
														
 
															+    db = client[mongodb_database]
														
 
															+    collection = db[scaler_table]  # 集合名称
														
 
															+    # Retrieve the scalers from MongoDB
														
 
															+    scaler_doc = collection.find_one()
														
 
															+    # Deserialize the scalers
														
 
															+
														
 
															+    feature_scaler_bytes = BytesIO(scaler_doc["feature_scaler"])
														
 
															+    feature_scaler = joblib.load(feature_scaler_bytes)
														
 
															+    target_scaler_bytes = BytesIO(scaler_doc["target_scaler"])
														
 
															+    target_scaler = joblib.load(target_scaler_bytes)
														
 
															+    return feature_scaler,target_scaler
														
--- a/data_processing/data_operation/data_join.py
+++ b/data_processing/data_operation/data_join.py
@@ -1,10 +1,10 @@
 
															 import pandas as pd
														
 
															-from pymongo import MongoClient
														
 
															 from flask import Flask,request,jsonify
														
 
															 import time
														
 
															 import logging
														
 
															 import traceback
														
 
															 from functools import reduce
														
 
															+from common.database_dml import get_df_list_from_mongo,insert_data_into_mongo
														
 
															 app = Flask('data_join——service')
														
@@ -13,36 +13,6 @@ app = Flask('data_join——service')
 
															 def hello():
														
 
															     return jsonify(message='Hello, World!')
														
 
															-def get_data_from_mongo(args):
														
 
															-    mongodb_connection,mongodb_database,mongodb_read_table = "mongodb://root:sdhjfREWFWEF23e@192.168.1.43:30000/",args['mongodb_database'],args['mongodb_read_table'].split(',')
														
 
															-    df_list = []
														
 
															-    client = MongoClient(mongodb_connection)
														
 
															-    # 选择数据库（如果数据库不存在，MongoDB 会自动创建）
														
 
															-    db = client[mongodb_database]
														
 
															-    for table in mongodb_read_table:
														
 
															-        collection = db[table]  # 集合名称
														
 
															-        data_from_db = collection.find()  # 这会返回一个游标（cursor）
														
 
															-        # 将游标转换为列表，并创建 pandas DataFrame
														
 
															-        df = pd.DataFrame(list(data_from_db))
														
 
															-        df_list.append(df)
														
 
															-    client.close()
														
 
															-    return df_list
														
 
															-
														
 
															-
														
 
															-def insert_data_into_mongo(res_df,args):
														
 
															-    mongodb_connection,mongodb_database,mongodb_write_table = "mongodb://root:sdhjfREWFWEF23e@192.168.1.43:30000/",args['mongodb_database'],args['mongodb_write_table']
														
 
															-    client = MongoClient(mongodb_connection)
														
 
															-    db = client[mongodb_database]
														
 
															-    if mongodb_write_table in db.list_collection_names():
														
 
															-        db[mongodb_write_table].drop()
														
 
															-        print(f"Collection '{mongodb_write_table} already exist, deleted successfully!")
														
 
															-    collection = db[mongodb_write_table]  # 集合名称
														
 
															-    # 将 DataFrame 转为字典格式
														
 
															-    data_dict = res_df.to_dict("records")  # 每一行作为一个字典
														
 
															-    # 插入到 MongoDB
														
 
															-    collection.insert_many(data_dict)
														
 
															-    print("data inserted successfully!")
														
 
															-
														
 
															 #1.AGC/AVC信号判断限电（有的场站准 有的不准） 1种方法  数据库数据有问题 暂时用不了
														
 
															 def  data_merge(df_list, args):
														
@@ -62,7 +32,7 @@ def data_join():
 
															         args = request.values.to_dict()
														
 
															         print('args',args)
														
 
															         logger.info(args)
														
 
															-        df_list = get_data_from_mongo(args)
														
 
															+        df_list = get_df_list_from_mongo(args)
														
 
															         res_df = data_merge(df_list,args)
														
 
															         insert_data_into_mongo(res_df,args)
														
 
															         success = 1
														
--- a/data_processing/data_operation/mysql_to_mongo.py
+++ b/data_processing/data_operation/mysql_to_mongo.py
@@ -1,11 +1,8 @@
 
															-import pandas as pd
														
 
															-from pymongo import MongoClient
														
 
															-from sqlalchemy import create_engine
														
 
															 from flask import Flask,request,jsonify
														
 
															 import time
														
 
															 import logging
														
 
															 import traceback
														
 
															-
														
 
															+from common.database_dml import insert_data_into_mongo,get_data_fromMysql
														
 
															 app = Flask('mysql_to_mongo——service')
														
@@ -13,30 +10,6 @@ app = Flask('mysql_to_mongo——service')
 
															 def hello():
														
 
															     return jsonify(message='Hello, World!')
														
 
															-def get_data_fromMysql(params):
														
 
															-    mysql_conn = params['mysql_conn']
														
 
															-    query_sql = params['query_sql']
														
 
															-    #数据库读取实测气象
														
 
															-    engine = create_engine(f"mysql+pymysql://{mysql_conn}")
														
 
															-    # 定义SQL查询
														
 
															-    env_df = pd.read_sql_query(query_sql, engine)
														
 
															-    return env_df
														
 
															-
														
 
															-
														
 
															-def insert_data_into_mongo(res_df,args):
														
 
															-    mongodb_connection,mongodb_database,mongodb_write_table = "mongodb://root:sdhjfREWFWEF23e@192.168.1.43:30000/",args['mongodb_database'],args['mongodb_write_table']
														
 
															-    client = MongoClient(mongodb_connection)
														
 
															-    db = client[mongodb_database]
														
 
															-    if mongodb_write_table in db.list_collection_names():
														
 
															-        db[mongodb_write_table].drop()
														
 
															-        print(f"Collection '{mongodb_write_table} already exist, deleted successfully!")
														
 
															-    collection = db[mongodb_write_table]  # 集合名称
														
 
															-    # 将 DataFrame 转为字典格式
														
 
															-    data_dict = res_df.to_dict("records")  # 每一行作为一个字典
														
 
															-    # 插入到 MongoDB
														
 
															-    collection.insert_many(data_dict)
														
 
															-    print("data inserted successfully!")
														
 
															-
														
 
															 @app.route('/mysql_to_mongo', methods=['POST'])
														
 
															 def data_join():
														
--- a/data_processing/processing_limit_power/processing_limit_power_by_agcavc.py
+++ b/data_processing/processing_limit_power/processing_limit_power_by_agcavc.py
@@ -5,6 +5,7 @@ from flask import Flask,request,jsonify
 
															 import time
														
 
															 import logging
														
 
															 import traceback
														
 
															+from common.database_dml import get_data_from_mongo,insert_data_into_mongo
														
 
															 app = Flask('processing_limit_power_by_agcavc——service')
														
@@ -13,34 +14,6 @@ def hello():
 
															     return jsonify(message='Hello, World!')
														
 
															-def get_data_from_mongo(args):
														
 
															-    mongodb_connection,mongodb_database,mongodb_read_table = "mongodb://root:sdhjfREWFWEF23e@192.168.1.43:30000/",args['mongodb_database'],args['mongodb_read_table']
														
 
															-    client = MongoClient(mongodb_connection)
														
 
															-    # 选择数据库（如果数据库不存在，MongoDB 会自动创建）
														
 
															-    db = client[mongodb_database]
														
 
															-    collection = db[mongodb_read_table]  # 集合名称
														
 
															-    data_from_db = collection.find()  # 这会返回一个游标（cursor）
														
 
															-    # 将游标转换为列表，并创建 pandas DataFrame
														
 
															-    df = pd.DataFrame(list(data_from_db))
														
 
															-    client.close()
														
 
															-    return df
														
 
															-
														
 
															-
														
 
															-def insert_data_into_mongo(res_df,args):
														
 
															-    mongodb_connection,mongodb_database,mongodb_write_table = "mongodb://root:sdhjfREWFWEF23e@192.168.1.43:30000/",args['mongodb_database'],args['mongodb_write_table']
														
 
															-    client = MongoClient(mongodb_connection)
														
 
															-    db = client[mongodb_database]
														
 
															-    if mongodb_write_table in db.list_collection_names():
														
 
															-        db[mongodb_write_table].drop()
														
 
															-        print(f"Collection '{mongodb_write_table} already exist, deleted successfully!")
														
 
															-    collection = db[mongodb_write_table]  # 集合名称
														
 
															-    # 将 DataFrame 转为字典格式
														
 
															-    data_dict = res_df.to_dict("records")  # 每一行作为一个字典
														
 
															-    # 插入到 MongoDB
														
 
															-    collection.insert_many(data_dict)
														
 
															-    print("data inserted successfully!")
														
 
															-
														
 
															-
														
 
															 #1.AGC/AVC信号判断限电（有的场站准 有的不准） 1种方法  数据库数据有问题 暂时用不了
														
 
															 def  agc_avc_judgement(power_df,args):
														
 
															     timeBegin,timeEnd,col_time,mysql_connection,avc_table = args['timeBegin'], args['timeEnd'],args['col_time'],args['mysql_connection'],args['agc_avc_table']
														
--- a/data_processing/processing_limit_power/processing_limit_power_by_machines.py
+++ b/data_processing/processing_limit_power/processing_limit_power_by_machines.py
@@ -6,38 +6,9 @@ from flask import Flask, request
 
															 import time
														
 
															 import logging
														
 
															 import traceback
														
 
															-
														
 
															+from common.database_dml import get_data_from_mongo,insert_data_into_mongo
														
 
															 app = Flask('processing_limit_power_by_machines——service')
														
 
															-
														
 
															-def get_data_from_mongo(args):
														
 
															-    mongodb_connection,mongodb_database,mongodb_read_table = args['mongodb_connection'],args['mongodb_database'],args['mongodb_read_table']
														
 
															-    client = MongoClient(mongodb_connection)
														
 
															-    # 选择数据库（如果数据库不存在，MongoDB 会自动创建）
														
 
															-    db = client[mongodb_database]
														
 
															-    collection = db[mongodb_read_table]  # 集合名称
														
 
															-    data_from_db = collection.find()  # 这会返回一个游标（cursor）
														
 
															-    # 将游标转换为列表，并创建 pandas DataFrame
														
 
															-    df = pd.DataFrame(list(data_from_db))
														
 
															-    client.close()
														
 
															-    return df
														
 
															-    
														
 
															-
														
 
															-def insert_data_into_mongo(res_df,args):
														
 
															-    mongodb_connection,mongodb_database,mongodb_write_table = args['mongodb_connection'],args['mongodb_database'],args['mongodb_write_table']
														
 
															-    client = MongoClient(mongodb_connection)
														
 
															-    db = client[mongodb_database]
														
 
															-    if mongodb_write_table in db.list_collection_names():
														
 
															-        db[mongodb_write_table].drop()
														
 
															-        print(f"Collection '{mongodb_write_table} already exist, deleted successfully!")
														
 
															-    collection = db[mongodb_write_table]  # 集合名称
														
 
															-    # 将 DataFrame 转为字典格式
														
 
															-    data_dict = res_df.to_dict("records")  # 每一行作为一个字典
														
 
															-    # 插入到 MongoDB
														
 
															-    collection.insert_many(data_dict)
														
 
															-    print("data inserted successfully!")
														
 
															-    
														
 
															-
														
 
															 #样板机法
														
 
															 def windLight_machine_judgment(power,args):
														
 
															     col_rp,col_tp = args['col_rp'],args['col_tp']
														
--- a/data_processing/processing_limit_power/processing_limit_power_by_records.py
+++ b/data_processing/processing_limit_power/processing_limit_power_by_records.py
@@ -5,35 +5,8 @@ from flask import Flask,request
 
															 import time
														
 
															 import logging
														
 
															 import traceback
														
 
															+from common.database_dml import get_data_from_mongo,insert_data_into_mongo
														
 
															 app = Flask('processing_limit_power_by_records——service')
														
 
															-
														
 
															-
														
 
															-def get_data_from_mongo(args):
														
 
															-    mongodb_connection,mongodb_database,mongodb_read_table = "mongodb://root:sdhjfREWFWEF23e@192.168.1.43:30000/",args['mongodb_database'],args['mongodb_read_table']
														
 
															-    client = MongoClient(mongodb_connection)
														
 
															-    # 选择数据库（如果数据库不存在，MongoDB 会自动创建）
														
 
															-    db = client[mongodb_database]
														
 
															-    collection = db[mongodb_read_table]  # 集合名称
														
 
															-    data_from_db = collection.find()  # 这会返回一个游标（cursor）
														
 
															-    # 将游标转换为列表，并创建 pandas DataFrame
														
 
															-    df = pd.DataFrame(list(data_from_db))
														
 
															-    client.close()
														
 
															-    return df
														
 
															-    
														
 
															-
														
 
															-def insert_data_into_mongo(res_df,args):
														
 
															-    mongodb_connection,mongodb_database,mongodb_write_table = "mongodb://root:sdhjfREWFWEF23e@192.168.1.43:30000/",args['mongodb_database'],args['mongodb_write_table']
														
 
															-    client = MongoClient(mongodb_connection)
														
 
															-    db = client[mongodb_database]
														
 
															-    if mongodb_write_table in db.list_collection_names():
														
 
															-        db[mongodb_write_table].drop()
														
 
															-        print(f"Collection '{mongodb_write_table} already exist, deleted successfully!")
														
 
															-    collection = db[mongodb_write_table]  # 集合名称
														
 
															-    # 将 DataFrame 转为字典格式
														
 
															-    data_dict = res_df.to_dict("records")  # 每一行作为一个字典
														
 
															-    # 插入到 MongoDB
														
 
															-    collection.insert_many(data_dict)
														
 
															-    print("data inserted successfully!")
														
 
															 def limit_record_judgement(power,args):
														
--- a/data_processing/processing_limit_power/processing_limit_power_by_statistics_light.py
+++ b/data_processing/processing_limit_power/processing_limit_power_by_statistics_light.py
@@ -8,6 +8,7 @@ from sklearn.linear_model import LinearRegression
 
															 import numpy as np
														
 
															 from bson.decimal128 import Decimal128
														
 
															 import numbers
														
 
															+from common.database_dml import get_data_from_mongo,insert_data_into_mongo
														
 
															 app = Flask('processing_limit_power_by_statistics_light——service')
														
@@ -16,34 +17,6 @@ def hello():
 
															     return jsonify(message='Hello, World!')
														
 
															-def get_data_from_mongo(args):
														
 
															-    mongodb_connection,mongodb_database,mongodb_read_table = "mongodb://root:sdhjfREWFWEF23e@192.168.1.43:30000/",args['mongodb_database'],args['mongodb_read_table']
														
 
															-    client = MongoClient(mongodb_connection)
														
 
															-    # 选择数据库（如果数据库不存在，MongoDB 会自动创建）
														
 
															-    db = client[mongodb_database]
														
 
															-    collection = db[mongodb_read_table]  # 集合名称
														
 
															-    data_from_db = collection.find()  # 这会返回一个游标（cursor）
														
 
															-    # 将游标转换为列表，并创建 pandas DataFrame
														
 
															-    df = pd.DataFrame(list(data_from_db))
														
 
															-    client.close()
														
 
															-    return df
														
 
															-
														
 
															-
														
 
															-def insert_data_into_mongo(res_df,args):
														
 
															-    mongodb_connection,mongodb_database,mongodb_write_table = "mongodb://root:sdhjfREWFWEF23e@192.168.1.43:30000/",args['mongodb_database'],args['mongodb_write_table']
														
 
															-    client = MongoClient(mongodb_connection)
														
 
															-    db = client[mongodb_database]
														
 
															-    if mongodb_write_table in db.list_collection_names():
														
 
															-        db[mongodb_write_table].drop()
														
 
															-        print(f"Collection '{mongodb_write_table} already exist, deleted successfully!")
														
 
															-    collection = db[mongodb_write_table]  # 集合名称
														
 
															-    # 将 DataFrame 转为字典格式
														
 
															-    data_dict = res_df.to_dict("records")  # 每一行作为一个字典
														
 
															-    # 插入到 MongoDB
														
 
															-    collection.insert_many(data_dict)
														
 
															-    print("data inserted successfully!")
														
 
															-
														
 
															-
														
 
															 def light_statistics_judgement(df_power,args):
														
 
															     """
														
 
															     原理：基于实测辐照度与实际功率相关性强正相关，呈严格线性关系为假设前提，
														
--- a/data_processing/processing_limit_power/processing_limit_power_by_statistics_wind.py
+++ b/data_processing/processing_limit_power/processing_limit_power_by_statistics_wind.py
@@ -9,7 +9,7 @@ from sklearn.preprocessing import StandardScaler
 
															 from sklearn.cluster import DBSCAN
														
 
															 import numbers
														
 
															 from bson.decimal128 import Decimal128
														
 
															-
														
 
															+from common.database_dml import get_data_from_mongo,insert_data_into_mongo
														
 
															 app = Flask('processing_limit_power_by_statistics_wind——service')
														
@@ -18,34 +18,6 @@ def hello():
 
															     return jsonify(message='Hello, World!')
														
 
															-def get_data_from_mongo(args):
														
 
															-    mongodb_connection,mongodb_database,mongodb_read_table = "mongodb://root:sdhjfREWFWEF23e@192.168.1.43:30000/",args['mongodb_database'],args['mongodb_read_table']
														
 
															-    client = MongoClient(mongodb_connection)
														
 
															-    # 选择数据库（如果数据库不存在，MongoDB 会自动创建）
														
 
															-    db = client[mongodb_database]
														
 
															-    collection = db[mongodb_read_table]  # 集合名称
														
 
															-    data_from_db = collection.find()  # 这会返回一个游标（cursor）
														
 
															-    # 将游标转换为列表，并创建 pandas DataFrame
														
 
															-    df = pd.DataFrame(list(data_from_db))
														
 
															-    client.close()
														
 
															-    return df
														
 
															-
														
 
															-
														
 
															-def insert_data_into_mongo(res_df,args):
														
 
															-    mongodb_connection,mongodb_database,mongodb_write_table = "mongodb://root:sdhjfREWFWEF23e@192.168.1.43:30000/",args['mongodb_database'],args['mongodb_write_table']
														
 
															-    client = MongoClient(mongodb_connection)
														
 
															-    db = client[mongodb_database]
														
 
															-    if mongodb_write_table in db.list_collection_names():
														
 
															-        db[mongodb_write_table].drop()
														
 
															-        print(f"Collection '{mongodb_write_table} already exist, deleted successfully!")
														
 
															-    collection = db[mongodb_write_table]  # 集合名称
														
 
															-    # 将 DataFrame 转为字典格式
														
 
															-    data_dict = res_df.to_dict("records")  # 每一行作为一个字典
														
 
															-    # 插入到 MongoDB
														
 
															-    collection.insert_many(data_dict)
														
 
															-    print("data inserted successfully!")
														
 
															-
														
 
															-
														
 
															 def wind_statistics_judgement(df_power,args):
														
 
															     """
														
 
															     原理：基于实测辐照度与实际功率相关性强正相关，呈严格线性关系为假设前提，
														
--- a/evaluation_processing/analysis.py
+++ b/evaluation_processing/analysis.py
@@ -1,247 +1,247 @@
 
															-# -*- coding: utf-8 -*-
														
 
															-import pandas as pd
														
 
															-import matplotlib.pyplot as plt
														
 
															-from pymongo import MongoClient
														
 
															-import pickle
														
 
															-import numpy as np
														
 
															-import plotly.express as px
														
 
															-from plotly.subplots import make_subplots
														
 
															-import plotly.graph_objects as go
														
 
															-from flask import Flask,request,jsonify
														
 
															-from waitress import serve
														
 
															-import time
														
 
															-import random
														
 
															-import argparse
														
 
															-import logging
														
 
															-import traceback
														
 
															-import os
														
 
															-import lightgbm as lgb
														
 
															-
														
 
															-app = Flask('analysis_report——service')
														
 
															-def get_data_from_mongo(args):
														
 
															-    # 1.读数据 
														
 
															-    mongodb_connection,mongodb_database,all_table,accuracy_table,model_table,model_name = "mongodb://root:sdhjfREWFWEF23e@192.168.1.43:30000/",args['mongodb_database'],args['train_table'],args['accuracy_table'],args['model_table'],args['model_name']
														
 
															-    client = MongoClient(mongodb_connection)
														
 
															-    # 选择数据库（如果数据库不存在，MongoDB 会自动创建）
														
 
															-    db = client[mongodb_database]
														
 
															-    # 将游标转换为列表，并创建 pandas DataFrame
														
 
															-    df_all = pd.DataFrame(db[all_table].find({}, {'_id': 0}))
														
 
															-    
														
 
															-    df_accuracy = pd.DataFrame(db[accuracy_table].find({}, {'_id': 0}))
														
 
															-    
														
 
															-    model_data = db[model_table].find_one({"model_name": model_name})
														
 
															-    if model_data is not None:
														
 
															-        model_binary = model_data['model']  # 确保这个字段是存储模型的二进制数据
														
 
															-        # 反序列化模型 
														
 
															-        model = pickle.loads(model_binary)
														
 
															-    client.close()
														
 
															-    return df_all,df_accuracy,model
														
 
															-
														
 
															-
														
 
															-def draw_info(df_all,df_accuracy,model,features,args):
														
 
															-    #1.数据描述 数据描述：
														
 
															-    col_time = args['col_time']
														
 
															-    label = args['label']
														
 
															-    df_accuracy_beginTime = df_accuracy[col_time].min()
														
 
															-    df_accuracy_endTime = df_accuracy[col_time].max()
														
 
															-    df_train = df_all[df_all[col_time]<df_accuracy_beginTime][features+[col_time,label]]
														
 
															-    df_train_beginTime = df_train[col_time].min()
														
 
															-    df_train_endTime = df_train[col_time].max()
														
 
															-    text_content = f"训练数据时间范围：{df_train_beginTime} 至 {df_train_endTime}，共{df_train.shape[0]}条记录，测试集数据时间范围：{df_accuracy_beginTime} 至 {df_accuracy_endTime}。<br>lightgbm模型参数：{model.params}"
														
 
															-    return text_content
														
 
															-    
														
 
															-
														
 
															-
														
 
															-def draw_global_scatter(df,args):
														
 
															-    # --- 1. 实际功率和辐照度的散点图 ---
														
 
															-    col_x = args['scatter_col_x']
														
 
															-    col_y = args['label']
														
 
															-    scatter_fig = px.scatter(
														
 
															-        df,
														
 
															-        x=col_x,
														
 
															-        y=col_y,
														
 
															-        title=f"{col_x}和{col_y}的散点图",
														
 
															-        labels={"辐照度": "辐照度 (W/m²)", "实际功率": "实际功率 (kW)"}
														
 
															-    )
														
 
															-    return scatter_fig
														
 
															-    
														
 
															-    
														
 
															-
														
 
															-def draw_corr(df,features,args):
														
 
															-
														
 
															-    # --- 2. 相关性热力图 ---
														
 
															-    # 计算相关性矩阵
														
 
															-    label = args['label']
														
 
															-    features_coor = features+[label]
														
 
															-    corr_matrix = df[features_coor].corr()
														
 
															-    # 使用 Plotly Express 绘制热力图
														
 
															-    heatmap_fig = px.imshow(corr_matrix, 
														
 
															-                    text_auto=True,  # 显示数值
														
 
															-                    color_continuous_scale='RdBu',  # 配色方案
														
 
															-                    title="Correlation Heatmap")
														
 
															-    heatmap_fig.update_coloraxes(showscale=False)
														
 
															-
														
 
															-    return heatmap_fig
														
 
															-
														
 
															-def draw_feature_importance(model,features):
														
 
															-    # --- 3. 特征重要性排名 ---
														
 
															-    # 获取特征重要性
														
 
															-    importance = model.feature_importance()  # 'split' 或 'gain'，根据需求选择
														
 
															-    
														
 
															-    # 转换为 DataFrame 方便绘图
														
 
															-    feature_importance_df = pd.DataFrame({
														
 
															-        'Feature': features,
														
 
															-        'Importance': importance
														
 
															-    })
														
 
															-    feature_importance_df = feature_importance_df.sort_values(by='Importance', ascending=False)
														
 
															-    
														
 
															-    # 使用 Plotly Express 绘制条形图
														
 
															-    importance_fig = px.bar(feature_importance_df, x='Feature', y='Importance', 
														
 
															-                 title="特征重要性排名", 
														
 
															-                 labels={'Feature': '特征', 'Importance': '重要性'}, 
														
 
															-                 color='Importance', 
														
 
															-                 color_continuous_scale='Viridis')
														
 
															-    # 更新每个 trace，确保没有图例
														
 
															-    
														
 
															-    importance_fig.update_layout(title="模型特征重要性排名", 
														
 
															-                                 showlegend=False  # 移除图例
														
 
															-                                )
														
 
															-    importance_fig.update_coloraxes(showscale=False)
														
 
															-    return importance_fig
														
 
															-
														
 
															-
														
 
															-def draw_data_info_table(content):
														
 
															-    # --- 4. 创建数据说明的表格 ---
														
 
															-    # 转换为表格格式：1行1列，且填充文字说明
														
 
															-    # 转换为表格格式  
														
 
															-    # 创建一个空的图
														
 
															-    table_fig = go.Figure()
														
 
															-
														
 
															-    # 第一部分: 显示文字说明
														
 
															-    table_fig.add_trace(go.Table(
														
 
															-        header=dict(
														
 
															-            values=["说明"],  # 表格只有一列：说明
														
 
															-            fill_color="paleturquoise",
														
 
															-            align="center"
														
 
															-        ),
														
 
															-        cells=dict(
														
 
															-            values=[[content]] ,  # 第一行填入文本说明
														
 
															-            fill_color="lavender",
														
 
															-            align="center"
														
 
															-        )
														
 
															-    ))
														
 
															-
														
 
															-   
														
 
															-    return table_fig
														
 
															-    
														
 
															-
														
 
															-
														
 
															-def draw_accuracy_table(df,content):
														
 
															-    
														
 
															-    # --- 4. 每日的准确率表格 ---
														
 
															-    # 转换为表格格式  
														
 
															-    table_fig = go.Figure(
														
 
															-        data=[
														
 
															-            go.Table(
														
 
															-                header=dict(
														
 
															-                    values=list(df.columns),
														
 
															-                    fill_color="paleturquoise",
														
 
															-                    align="center"
														
 
															-                ),
														
 
															-                cells=dict(
														
 
															-                    values=[df[col] for col in df.columns],
														
 
															-                    fill_color="lavender",
														
 
															-                    align="center"
														
 
															-                )
														
 
															-            )
														
 
															-        ]
														
 
															-    )
														
 
															-    table_fig.update_layout(title="准确率表", showlegend=False)
														
 
															-    return table_fig
														
 
															-
														
 
															-
														
 
															-@app.route('/analysis_report', methods=['POST'])
														
 
															-def analysis_report():
														
 
															-    start_time = time.time()  
														
 
															-    result = {}
														
 
															-    success = 0
														
 
															-    path = ""
														
 
															-    print("Program starts execution!")
														
 
															-    try:
														
 
															-        args = request.values.to_dict()
														
 
															-        print('args',args)
														
 
															-        logger.info(args)
														
 
															-        #获取数据
														
 
															-        df_all, df_accuracy, model = get_data_from_mongo(args)
														
 
															-        features = model.feature_name()
														
 
															-        text_content = draw_info(df_all,df_accuracy,model,features,args)
														
 
															-        text_fig,scatter_fig,heatmap_fig,importance_fig,table_fig=draw_data_info_table(text_content),draw_global_scatter(df_all,args),draw_corr(df_all,features,args),draw_feature_importance(model,features),\
														
 
															-        draw_accuracy_table(df_accuracy,text_content)
														
 
															-        # --- 合并图表并保存到一个 HTML 文件 ---
														
 
															-        # 创建子图布局
														
 
															-        combined_fig = make_subplots(
														
 
															-            rows=5, cols=1,
														
 
															-            subplot_titles=["数据-模型概览","辐照度和实际功率的散点图", "相关性","特征重要性排名", "准确率表"],
														
 
															-            row_heights=[0.3, 0.6, 0.6, 0.6, 0.4],
														
 
															-            specs=[[{"type": "table"}], [{"type": "xy"}], [{"type": "heatmap"}], [{"type": "xy"}],[{"type": "table"}]]  # 指定每个子图类型
														
 
															-        )
														
 
															-        # 添加文本信息到子图（第一行）
														
 
															-        # 添加文字说明
														
 
															-        for trace in text_fig.data:
														
 
															-            combined_fig.add_trace(trace, row=1, col=1)
														
 
															-            
														
 
															-        # 添加散点图
														
 
															-        for trace in scatter_fig.data:
														
 
															-            combined_fig.add_trace(trace, row=2, col=1)
														
 
															-        
														
 
															-        # 添加相关性热力图
														
 
															-        for trace in heatmap_fig.data:
														
 
															-            combined_fig.add_trace(trace, row=3, col=1)
														
 
															-            
														
 
															-        # 添加特征重要性排名图
														
 
															-        for trace in importance_fig.data:
														
 
															-            combined_fig.add_trace(trace, row=4, col=1)
														
 
															-        
														
 
															-        # 添加表格
														
 
															-        for trace in table_fig.data:
														
 
															-            combined_fig.add_trace(trace, row=5, col=1)
														
 
															-    
														
 
															-        # 更新布局
														
 
															-        combined_fig.update_layout(
														
 
															-        height=1500,
														
 
															-        title_text="分析结果汇总",  # 添加换行符以适应文本内容
														
 
															-        title_x=0.5,  # 中心对齐标题
														
 
															-        showlegend=False,
														
 
															-        )
														
 
															-        combined_fig.update_coloraxes(showscale=False)
														
 
															-        filename = f"{int(time.time() * 1000)}_{random.randint(1000, 9999)}.html"
														
 
															-        # 保存为 HTML
														
 
															-        directory = '/usr/share/nginx/html'
														
 
															-        if not os.path.exists(directory):
														
 
															-            os.makedirs(directory)
														
 
															-        file_path = os.path.join(directory, filename)
														
 
															-        # combined_fig.write_html(f"D://usr//{filename}")
														
 
															-        combined_fig.write_html(file_path)
														
 
															-        path = f"http://ds2:10093/{filename}"
														
 
															-        success = 1
														
 
															-    except Exception as e:
														
 
															-        my_exception = traceback.format_exc()
														
 
															-        my_exception.replace("\n","\t")
														
 
															-        result['msg'] = my_exception
														
 
															-    end_time = time.time() 
														
 
															-    result['success'] = success
														
 
															-    result['args'] = args
														
 
															-    result['start_time'] = time.strftime('%Y-%m-%d %H:%M:%S', time.localtime(start_time))
														
 
															-    result['end_time'] = time.strftime('%Y-%m-%d %H:%M:%S', time.localtime(end_time))
														
 
															-    result['file_path'] = path
														
 
															-    print("Program execution ends!")
														
 
															-    return result
														
 
															-
														
 
															-
														
 
															-if __name__=="__main__":  
														
 
															-    print("Program starts execution!")
														
 
															-    logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(name)s - %(levelname)s - %(message)s')
														
 
															-    logger = logging.getLogger("analysis_report log")
														
 
															-    from waitress import serve
														
 
															-    serve(app, host="0.0.0.0", port=10092)
														
 
															-    print("server start!")
														
 
															+# # -*- coding: utf-8 -*-
														
 
															+# import pandas as pd
														
 
															+# import matplotlib.pyplot as plt
														
 
															+# from pymongo import MongoClient
														
 
															+# import pickle
														
 
															+# import numpy as np
														
 
															+# import plotly.express as px
														
 
															+# from plotly.subplots import make_subplots
														
 
															+# import plotly.graph_objects as go
														
 
															+# from flask import Flask,request,jsonify
														
 
															+# from waitress import serve
														
 
															+# import time
														
 
															+# import random
														
 
															+# import argparse
														
 
															+# import logging
														
 
															+# import traceback
														
 
															+# import os
														
 
															+# import lightgbm as lgb
														
 
															+#
														
 
															+# app = Flask('analysis_report——service')
														
 
															+# def get_data_from_mongo(args):
														
 
															+#     # 1.读数据
														
 
															+#     mongodb_connection,mongodb_database,all_table,accuracy_table,model_table,model_name = "mongodb://root:sdhjfREWFWEF23e@192.168.1.43:30000/",args['mongodb_database'],args['train_table'],args['accuracy_table'],args['model_table'],args['model_name']
														
 
															+#     client = MongoClient(mongodb_connection)
														
 
															+#     # 选择数据库（如果数据库不存在，MongoDB 会自动创建）
														
 
															+#     db = client[mongodb_database]
														
 
															+#     # 将游标转换为列表，并创建 pandas DataFrame
														
 
															+#     df_all = pd.DataFrame(db[all_table].find({}, {'_id': 0}))
														
 
															+#
														
 
															+#     df_accuracy = pd.DataFrame(db[accuracy_table].find({}, {'_id': 0}))
														
 
															+#
														
 
															+#     model_data = db[model_table].find_one({"model_name": model_name})
														
 
															+#     if model_data is not None:
														
 
															+#         model_binary = model_data['model']  # 确保这个字段是存储模型的二进制数据
														
 
															+#         # 反序列化模型
														
 
															+#         model = pickle.loads(model_binary)
														
 
															+#     client.close()
														
 
															+#     return df_all,df_accuracy,model
														
 
															+#
														
 
															+#
														
 
															+# def draw_info(df_all,df_accuracy,model,features,args):
														
 
															+#     #1.数据描述 数据描述：
														
 
															+#     col_time = args['col_time']
														
 
															+#     label = args['label']
														
 
															+#     df_accuracy_beginTime = df_accuracy[col_time].min()
														
 
															+#     df_accuracy_endTime = df_accuracy[col_time].max()
														
 
															+#     df_train = df_all[df_all[col_time]<df_accuracy_beginTime][features+[col_time,label]]
														
 
															+#     df_train_beginTime = df_train[col_time].min()
														
 
															+#     df_train_endTime = df_train[col_time].max()
														
 
															+#     text_content = f"训练数据时间范围：{df_train_beginTime} 至 {df_train_endTime}，共{df_train.shape[0]}条记录，测试集数据时间范围：{df_accuracy_beginTime} 至 {df_accuracy_endTime}。<br>lightgbm模型参数：{model.params}"
														
 
															+#     return text_content
														
 
															+#
														
 
															+#
														
 
															+#
														
 
															+# def draw_global_scatter(df,args):
														
 
															+#     # --- 1. 实际功率和辐照度的散点图 ---
														
 
															+#     col_x = args['scatter_col_x']
														
 
															+#     col_y = args['label']
														
 
															+#     scatter_fig = px.scatter(
														
 
															+#         df,
														
 
															+#         x=col_x,
														
 
															+#         y=col_y,
														
 
															+#         title=f"{col_x}和{col_y}的散点图",
														
 
															+#         labels={"辐照度": "辐照度 (W/m²)", "实际功率": "实际功率 (kW)"}
														
 
															+#     )
														
 
															+#     return scatter_fig
														
 
															+#
														
 
															+#
														
 
															+#
														
 
															+# def draw_corr(df,features,args):
														
 
															+#
														
 
															+#     # --- 2. 相关性热力图 ---
														
 
															+#     # 计算相关性矩阵
														
 
															+#     label = args['label']
														
 
															+#     features_coor = features+[label]
														
 
															+#     corr_matrix = df[features_coor].corr()
														
 
															+#     # 使用 Plotly Express 绘制热力图
														
 
															+#     heatmap_fig = px.imshow(corr_matrix,
														
 
															+#                     text_auto=True,  # 显示数值
														
 
															+#                     color_continuous_scale='RdBu',  # 配色方案
														
 
															+#                     title="Correlation Heatmap")
														
 
															+#     heatmap_fig.update_coloraxes(showscale=False)
														
 
															+#
														
 
															+#     return heatmap_fig
														
 
															+#
														
 
															+# def draw_feature_importance(model,features):
														
 
															+#     # --- 3. 特征重要性排名 ---
														
 
															+#     # 获取特征重要性
														
 
															+#     importance = model.feature_importance()  # 'split' 或 'gain'，根据需求选择
														
 
															+#
														
 
															+#     # 转换为 DataFrame 方便绘图
														
 
															+#     feature_importance_df = pd.DataFrame({
														
 
															+#         'Feature': features,
														
 
															+#         'Importance': importance
														
 
															+#     })
														
 
															+#     feature_importance_df = feature_importance_df.sort_values(by='Importance', ascending=False)
														
 
															+#
														
 
															+#     # 使用 Plotly Express 绘制条形图
														
 
															+#     importance_fig = px.bar(feature_importance_df, x='Feature', y='Importance',
														
 
															+#                  title="特征重要性排名",
														
 
															+#                  labels={'Feature': '特征', 'Importance': '重要性'},
														
 
															+#                  color='Importance',
														
 
															+#                  color_continuous_scale='Viridis')
														
 
															+#     # 更新每个 trace，确保没有图例
														
 
															+#
														
 
															+#     importance_fig.update_layout(title="模型特征重要性排名",
														
 
															+#                                  showlegend=False  # 移除图例
														
 
															+#                                 )
														
 
															+#     importance_fig.update_coloraxes(showscale=False)
														
 
															+#     return importance_fig
														
 
															+#
														
 
															+#
														
 
															+# def draw_data_info_table(content):
														
 
															+#     # --- 4. 创建数据说明的表格 ---
														
 
															+#     # 转换为表格格式：1行1列，且填充文字说明
														
 
															+#     # 转换为表格格式
														
 
															+#     # 创建一个空的图
														
 
															+#     table_fig = go.Figure()
														
 
															+#
														
 
															+#     # 第一部分: 显示文字说明
														
 
															+#     table_fig.add_trace(go.Table(
														
 
															+#         header=dict(
														
 
															+#             values=["说明"],  # 表格只有一列：说明
														
 
															+#             fill_color="paleturquoise",
														
 
															+#             align="center"
														
 
															+#         ),
														
 
															+#         cells=dict(
														
 
															+#             values=[[content]] ,  # 第一行填入文本说明
														
 
															+#             fill_color="lavender",
														
 
															+#             align="center"
														
 
															+#         )
														
 
															+#     ))
														
 
															+#
														
 
															+#
														
 
															+#     return table_fig
														
 
															+#
														
 
															+#
														
 
															+#
														
 
															+# def draw_accuracy_table(df,content):
														
 
															+#
														
 
															+#     # --- 4. 每日的准确率表格 ---
														
 
															+#     # 转换为表格格式
														
 
															+#     table_fig = go.Figure(
														
 
															+#         data=[
														
 
															+#             go.Table(
														
 
															+#                 header=dict(
														
 
															+#                     values=list(df.columns),
														
 
															+#                     fill_color="paleturquoise",
														
 
															+#                     align="center"
														
 
															+#                 ),
														
 
															+#                 cells=dict(
														
 
															+#                     values=[df[col] for col in df.columns],
														
 
															+#                     fill_color="lavender",
														
 
															+#                     align="center"
														
 
															+#                 )
														
 
															+#             )
														
 
															+#         ]
														
 
															+#     )
														
 
															+#     table_fig.update_layout(title="准确率表", showlegend=False)
														
 
															+#     return table_fig
														
 
															+#
														
 
															+#
														
 
															+# @app.route('/analysis_report', methods=['POST'])
														
 
															+# def analysis_report():
														
 
															+#     start_time = time.time()
														
 
															+#     result = {}
														
 
															+#     success = 0
														
 
															+#     path = ""
														
 
															+#     print("Program starts execution!")
														
 
															+#     try:
														
 
															+#         args = request.values.to_dict()
														
 
															+#         print('args',args)
														
 
															+#         logger.info(args)
														
 
															+#         #获取数据
														
 
															+#         df_all, df_accuracy, model = get_data_from_mongo(args)
														
 
															+#         features = model.feature_name()
														
 
															+#         text_content = draw_info(df_all,df_accuracy,model,features,args)
														
 
															+#         text_fig,scatter_fig,heatmap_fig,importance_fig,table_fig=draw_data_info_table(text_content),draw_global_scatter(df_all,args),draw_corr(df_all,features,args),draw_feature_importance(model,features),\
														
 
															+#         draw_accuracy_table(df_accuracy,text_content)
														
 
															+#         # --- 合并图表并保存到一个 HTML 文件 ---
														
 
															+#         # 创建子图布局
														
 
															+#         combined_fig = make_subplots(
														
 
															+#             rows=5, cols=1,
														
 
															+#             subplot_titles=["数据-模型概览","辐照度和实际功率的散点图", "相关性","特征重要性排名", "准确率表"],
														
 
															+#             row_heights=[0.3, 0.6, 0.6, 0.6, 0.4],
														
 
															+#             specs=[[{"type": "table"}], [{"type": "xy"}], [{"type": "heatmap"}], [{"type": "xy"}],[{"type": "table"}]]  # 指定每个子图类型
														
 
															+#         )
														
 
															+#         # 添加文本信息到子图（第一行）
														
 
															+#         # 添加文字说明
														
 
															+#         for trace in text_fig.data:
														
 
															+#             combined_fig.add_trace(trace, row=1, col=1)
														
 
															+#
														
 
															+#         # 添加散点图
														
 
															+#         for trace in scatter_fig.data:
														
 
															+#             combined_fig.add_trace(trace, row=2, col=1)
														
 
															+#
														
 
															+#         # 添加相关性热力图
														
 
															+#         for trace in heatmap_fig.data:
														
 
															+#             combined_fig.add_trace(trace, row=3, col=1)
														
 
															+#
														
 
															+#         # 添加特征重要性排名图
														
 
															+#         for trace in importance_fig.data:
														
 
															+#             combined_fig.add_trace(trace, row=4, col=1)
														
 
															+#
														
 
															+#         # 添加表格
														
 
															+#         for trace in table_fig.data:
														
 
															+#             combined_fig.add_trace(trace, row=5, col=1)
														
 
															+#
														
 
															+#         # 更新布局
														
 
															+#         combined_fig.update_layout(
														
 
															+#         height=1500,
														
 
															+#         title_text="分析结果汇总",  # 添加换行符以适应文本内容
														
 
															+#         title_x=0.5,  # 中心对齐标题
														
 
															+#         showlegend=False,
														
 
															+#         )
														
 
															+#         combined_fig.update_coloraxes(showscale=False)
														
 
															+#         filename = f"{int(time.time() * 1000)}_{random.randint(1000, 9999)}.html"
														
 
															+#         # 保存为 HTML
														
 
															+#         directory = '/usr/share/nginx/html'
														
 
															+#         if not os.path.exists(directory):
														
 
															+#             os.makedirs(directory)
														
 
															+#         file_path = os.path.join(directory, filename)
														
 
															+#         # combined_fig.write_html(f"D://usr//{filename}")
														
 
															+#         combined_fig.write_html(file_path)
														
 
															+#         path = f"http://ds2:10093/{filename}"
														
 
															+#         success = 1
														
 
															+#     except Exception as e:
														
 
															+#         my_exception = traceback.format_exc()
														
 
															+#         my_exception.replace("\n","\t")
														
 
															+#         result['msg'] = my_exception
														
 
															+#     end_time = time.time()
														
 
															+#     result['success'] = success
														
 
															+#     result['args'] = args
														
 
															+#     result['start_time'] = time.strftime('%Y-%m-%d %H:%M:%S', time.localtime(start_time))
														
 
															+#     result['end_time'] = time.strftime('%Y-%m-%d %H:%M:%S', time.localtime(end_time))
														
 
															+#     result['file_path'] = path
														
 
															+#     print("Program execution ends!")
														
 
															+#     return result
														
 
															+#
														
 
															+#
														
 
															+# if __name__=="__main__":
														
 
															+#     # print("Program starts execution!")
														
 
															+#     # logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(name)s - %(levelname)s - %(message)s')
														
 
															+#     # logger = logging.getLogger("analysis_report log")
														
 
															+#     # from waitress import serve
														
 
															+#     # serve(app, host="0.0.0.0", port=10092)
														
 
															+#     # print("server start!")
														
--- a/evaluation_processing/analysis_report.py
+++ b/evaluation_processing/analysis_report.py
@@ -0,0 +1,303 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+from plotly.subplots import make_subplots
														
 
															+from flask import Flask,request
														
 
															+import time
														
 
															+import random
														
 
															+import logging
														
 
															+import traceback
														
 
															+import os
														
 
															+from common.database_dml import get_df_list_from_mongo,insert_data_into_mongo
														
 
															+import plotly.express as px
														
 
															+import plotly.graph_objects as go
														
 
															+import pandas as pd
														
 
															+import plotly.io as pio
														
 
															+
														
 
															+app = Flask('analysis_report——service')
														
 
															+
														
 
															+def put_analysis_report_to_html(args,df_clean,df_accuracy):
														
 
															+    col_time = args['col_time']
														
 
															+    col_x_env = args['col_x_env']
														
 
															+    col_x_pre = args['col_x_pre']
														
 
															+    label = args['label']
														
 
															+    label_pre = args['label_pre']
														
 
															+    farmId =  args['farmId']
														
 
															+    df_overview = pd.DataFrame(
														
 
															+        {'数据开始时间': [df_clean[col_time].min()], '数据结束时间': [df_clean[col_time].max()], '数据总记录数': [df_clean.shape[0]]})
														
 
															+    overview_html = df_overview.to_html(classes='table table-bordered table-striped', index=False)
														
 
															+
														
 
															+    # -------------------- 数据描述 --------------------
														
 
															+    describe_html = df_clean.describe().reset_index().rename(columns={'index': '统计量'}).to_html(
														
 
															+        classes='table table-bordered table-striped', index=False)
														
 
															+
														
 
															+    # -------------------- 实测气象与实际功率散点图--------------------
														
 
															+
														
 
															+    # 生成实际功率与辐照度的散点图
														
 
															+    fig_scatter = px.scatter(df_clean, x=col_x_env, y=label)
														
 
															+
														
 
															+    # 自定义散点图布局
														
 
															+    fig_scatter.update_layout(
														
 
															+        template='seaborn',
														
 
															+        plot_bgcolor='rgba(255, 255, 255, 0.8)',  # 背景色
														
 
															+        xaxis=dict(
														
 
															+            showgrid=True,
														
 
															+            gridcolor='rgba(200, 200, 200, 0.5)',
														
 
															+            title=col_x_env
														
 
															+        ),
														
 
															+        yaxis=dict(
														
 
															+            showgrid=True,
														
 
															+            gridcolor='rgba(200, 200, 200, 0.5)',
														
 
															+            title=label
														
 
															+        ),
														
 
															+        legend=dict(x=0.01, y=0.99, bgcolor='rgba(255, 255, 255, 0.7)', bordercolor='black', borderwidth=1)
														
 
															+    )
														
 
															+
														
 
															+    # 将散点图保存为 HTML 片段
														
 
															+    scatter_html = pio.to_html(fig_scatter, full_html=False)
														
 
															+
														
 
															+    # -------------------- 生成相关性热力图 --------------------
														
 
															+
														
 
															+    # 计算相关矩阵
														
 
															+    correlation_matrix = df_clean.corr()
														
 
															+
														
 
															+    # 生成热力图，带数值标签和新配色
														
 
															+    fig_heatmap = go.Figure(data=go.Heatmap(
														
 
															+        z=correlation_matrix.values,
														
 
															+        x=correlation_matrix.columns,
														
 
															+        y=correlation_matrix.columns,
														
 
															+        colorscale='RdBu',  # 使用红蓝配色：正相关为蓝色，负相关为红色
														
 
															+        text=correlation_matrix.round(2).astype(str),  # 将相关性值保留两位小数并转换为字符串
														
 
															+        texttemplate="%{text}",  # 显示数值标签
														
 
															+        colorbar=dict(title='Correlation'),
														
 
															+        zmin=-1, zmax=1  # 设置颜色映射的范围
														
 
															+    ))
														
 
															+
														
 
															+    # 自定义热力图布局
														
 
															+    fig_heatmap.update_layout(
														
 
															+        # title='Correlation Matrix Heatmap',
														
 
															+        xaxis=dict(tickangle=45),
														
 
															+        yaxis=dict(autorange='reversed'),
														
 
															+        template='seaborn'
														
 
															+    )
														
 
															+
														
 
															+    # 将热力图保存为 HTML 片段
														
 
															+    corr_html = pio.to_html(fig_heatmap, full_html=False)
														
 
															+
														
 
															+    # -------------------- 实测气象与预测气象趋势曲线 --------------------
														
 
															+
														
 
															+    # 生成折线图（以 C_GLOBALR 和 NWP预测总辐射 为例）
														
 
															+    fig_line = px.line(df_clean, x=col_time, y=[col_x_env, col_x_pre], markers=True)
														
 
															+
														
 
															+    # 自定义趋势图布局
														
 
															+    fig_line.update_layout(
														
 
															+        template='seaborn',
														
 
															+        # title=dict(text=f"{col_x_env}与{col_x_pre}趋势曲线",
														
 
															+        # x=0.5, font=dict(size=24, color='darkblue')),
														
 
															+        plot_bgcolor='rgba(255, 255, 255, 0.8)',  # 改为白色背景
														
 
															+        xaxis=dict(
														
 
															+            showgrid=True,
														
 
															+            gridcolor='rgba(200, 200, 200, 0.5)',  # 网格线颜色
														
 
															+            rangeslider=dict(visible=True),  # 显示滚动条
														
 
															+            rangeselector=dict(visible=True)  # 显示预设的时间范围选择器
														
 
															+        ),
														
 
															+        yaxis=dict(showgrid=True, gridcolor='rgba(200, 200, 200, 0.5)'),
														
 
															+        legend=dict(x=0.01, y=0.99, bgcolor='rgba(255, 255, 255, 0.7)', bordercolor='black', borderwidth=1)
														
 
															+    )
														
 
															+
														
 
															+    # 将折线图保存为 HTML 片段
														
 
															+    env_pre_html = pio.to_html(fig_line, full_html=False)
														
 
															+
														
 
															+    # -------------------- 实测气象与预测气象偏差密度曲线 --------------------
														
 
															+
														
 
															+    df_clean['deviation'] = df_clean[col_x_pre] - df_clean[col_x_env]
														
 
															+    # 生成预测与实测辐照度偏差的密度曲线图
														
 
															+    # 生成偏差的密度图
														
 
															+    fig_density = px.histogram(df_clean, x='deviation', nbins=30, marginal='rug', opacity=0.75,
														
 
															+                               histnorm='density')
														
 
															+
														
 
															+    # 自定义密度曲线图布局
														
 
															+    fig_density.update_layout(
														
 
															+        template='seaborn',
														
 
															+        # # title=dict(text=f"{col_x_pre}与{col_x_env}偏差密度曲线",
														
 
															+        # x=0.5, font=dict(size=24, color='darkred')),
														
 
															+        plot_bgcolor='rgba(255, 255, 255, 0.8)',
														
 
															+        xaxis=dict(
														
 
															+            showgrid=True,
														
 
															+            gridcolor='rgba(200, 200, 200, 0.5)',
														
 
															+            title='偏差'
														
 
															+        ),
														
 
															+        yaxis=dict(
														
 
															+            showgrid=True,
														
 
															+            gridcolor='rgba(200, 200, 200, 0.5)',
														
 
															+            title='Density'
														
 
															+        ),
														
 
															+        legend=dict(x=0.01, y=0.99, bgcolor='rgba(255, 255, 255, 0.7)', bordercolor='black', borderwidth=1)
														
 
															+    )
														
 
															+
														
 
															+    # 将密度曲线图保存为 HTML 片段
														
 
															+    density_html = pio.to_html(fig_density, full_html=False)
														
 
															+
														
 
															+    # -------------------- 预测功率与实际功率曲线 --------------------
														
 
															+
														
 
															+    # 生成折线图（以 C_GLOBALR 和 NWP预测总辐射 为例）
														
 
															+    fig_line = px.line(df_clean, x='dateTime', y=[label, label_pre], markers=True)
														
 
															+
														
 
															+    # 自定义趋势图布局
														
 
															+    fig_line.update_layout(
														
 
															+        template='seaborn',
														
 
															+        # title=dict(text=f"{label_pre}与{label}曲线",
														
 
															+        # x=0.5, font=dict(size=24, color='darkblue')),
														
 
															+        plot_bgcolor='rgba(255, 255, 255, 0.8)',  # 改为白色背景
														
 
															+        xaxis=dict(
														
 
															+            showgrid=True,
														
 
															+            gridcolor='rgba(200, 200, 200, 0.5)',  # 网格线颜色
														
 
															+            rangeslider=dict(visible=True),  # 显示滚动条
														
 
															+            rangeselector=dict(visible=True)  # 显示预设的时间范围选择器
														
 
															+        ),
														
 
															+        yaxis=dict(showgrid=True, gridcolor='rgba(200, 200, 200, 0.5)'),
														
 
															+        legend=dict(x=0.01, y=0.99, bgcolor='rgba(255, 255, 255, 0.7)', bordercolor='black', borderwidth=1)
														
 
															+    )
														
 
															+
														
 
															+    # 将折线图保存为 HTML 片段
														
 
															+    power_html = pio.to_html(fig_line, full_html=False)
														
 
															+
														
 
															+    # -------------------- 准确率表展示--------------------
														
 
															+    acc_html = df_accuracy.to_html(classes='table table-bordered table-striped', index=False)
														
 
															+    # -------------------- 生成完整 HTML 页面 --------------------
														
 
															+
														
 
															+    html_content = f"""
														
 
															+    <!DOCTYPE html>
														
 
															+    <html lang="en">
														
 
															+    <head>
														
 
															+        <meta charset="UTF-8">
														
 
															+        <meta name="viewport" content="width=device-width, initial-scale=1.0">
														
 
															+        <title>Data Analysis Report</title>
														
 
															+        <!-- 引入 Bootstrap CSS -->
														
 
															+        <link href="https://cdn.jsdelivr.net/npm/bootstrap@5.3.0/dist/css/bootstrap.min.css" rel="stylesheet">
														
 
															+        <style>
														
 
															+            body {{
														
 
															+                background-color: #f4f4f9;
														
 
															+                font-family: Arial, sans-serif;
														
 
															+                padding: 20px;
														
 
															+            }}
														
 
															+            .container {{
														
 
															+                background-color: #fff;
														
 
															+                padding: 20px;
														
 
															+                border-radius: 10px;
														
 
															+                box-shadow: 0 4px 8px rgba(0, 0, 0, 0.1);
														
 
															+                margin-bottom: 30px;
														
 
															+            }}
														
 
															+           h1 {{
														
 
															+                text-align: center;
														
 
															+                color: #333;
														
 
															+                margin-bottom: 20px;
														
 
															+            }}
														
 
															+            .plot-container {{
														
 
															+                margin: 20px 0;
														
 
															+                max-height: 500px;  /* 限制高度 */
														
 
															+                overflow-y: auto;   /* 显示垂直滚动条 */
														
 
															+            }}
														
 
															+            .table-container {{
														
 
															+                margin-top: 30px;
														
 
															+                overflow-x: auto;   /* 水平滚动条 */
														
 
															+                max-width: 100%;     /* 限制宽度 */
														
 
															+                white-space: nowrap; /* 防止内容换行 */
														
 
															+            }}
														
 
															+            table {{
														
 
															+                width: 100%;
														
 
															+                font-size: 12px;  /* 设置字体大小为12px */
														
 
															+            }}
														
 
															+            th, td {{
														
 
															+                text-align: center;  /* 表头和单元格文字居中 */
														
 
															+            }}
														
 
															+        </style>
														
 
															+    </head>
														
 
															+    <body>
														
 
															+        <div class="container">
														
 
															+            <h1>分析报告</h1>
														
 
															+            <!-- Pandas DataFrame 表格 -->
														
 
															+            <div class="table-container">
														
 
															+                <h2>1. 数据总览</h2>
														
 
															+                {overview_html}
														
 
															+            </div>
														
 
															+            <!-- Pandas DataFrame 表格 -->
														
 
															+            <div class="table-container">
														
 
															+                <h2>2. 数据描述</h2>
														
 
															+                {describe_html}
														
 
															+            </div>
														
 
															+            <div class="plot-container">
														
 
															+                <h2>3. 数据清洗后实测气象与实际功率散点图</h2>
														
 
															+                {scatter_html}
														
 
															+            </div>
														
 
															+            <div class="plot-container">
														
 
															+                <h2>4. 相关性分析</h2>
														
 
															+                {corr_html}
														
 
															+            </div>
														
 
															+            <div class="plot-container">
														
 
															+                <h2>5. 实测气象与预测气象曲线趋势</h2>
														
 
															+                {env_pre_html}
														
 
															+            </div>
														
 
															+            <div class="plot-container">
														
 
															+                <h2>6. 预测气象与实测气象偏差曲线</h2>
														
 
															+                {density_html}
														
 
															+            </div>
														
 
															+            <div class="plot-container">
														
 
															+                <h2>7. 预测功率与实际功率曲线对比</h2>
														
 
															+                {power_html}
														
 
															+            </div>
														
 
															+            <!-- Pandas DataFrame 表格 -->
														
 
															+            <div class="table-container">
														
 
															+                <h2>8. 准确率对比</h2>
														
 
															+                {acc_html}
														
 
															+            </div>
														
 
															+        </div>
														
 
															+    </body>
														
 
															+    </html>
														
 
															+    """
														
 
															+    filename = f"{farmId}_{int(time.time() * 1000)}_{random.randint(1000, 9999)}.html"
														
 
															+    # 保存为 HTML
														
 
															+    directory = '/data/html'
														
 
															+    if not os.path.exists(directory):
														
 
															+        os.makedirs(directory)
														
 
															+    file_path = os.path.join(directory, filename)
														
 
															+    path = f"http://ds3:10010/{filename}"
														
 
															+    # 将 HTML 内容写入文件
														
 
															+    with open(file_path, "w", encoding="utf-8") as f:
														
 
															+        f.write(html_content)
														
 
															+    print("HTML report generated successfully!")
														
 
															+    return path
														
 
															+@app.route('/analysis_report', methods=['POST'])
														
 
															+def analysis_report():
														
 
															+    start_time = time.time()  
														
 
															+    result = {}
														
 
															+    success = 0
														
 
															+    path = ""
														
 
															+    print("Program starts execution!")
														
 
															+    try:
														
 
															+        args = request.values.to_dict()
														
 
															+        print('args',args)
														
 
															+        logger.info(args)
														
 
															+        #获取数据
														
 
															+        df_clean, df_accuracy = get_df_list_from_mongo(args)[0], get_df_list_from_mongo(args)[1]
														
 
															+        path = put_analysis_report_to_html(args, df_clean, df_accuracy)
														
 
															+        success = 1
														
 
															+    except Exception as e:
														
 
															+        my_exception = traceback.format_exc()
														
 
															+        my_exception.replace("\n","\t")
														
 
															+        result['msg'] = my_exception
														
 
															+    end_time = time.time() 
														
 
															+    result['success'] = success
														
 
															+    result['args'] = args
														
 
															+    result['start_time'] = time.strftime('%Y-%m-%d %H:%M:%S', time.localtime(start_time))
														
 
															+    result['end_time'] = time.strftime('%Y-%m-%d %H:%M:%S', time.localtime(end_time))
														
 
															+    result['file_path'] = path
														
 
															+    print("Program execution ends!")
														
 
															+    return result
														
 
															+
														
 
															+
														
 
															+if __name__=="__main__":  
														
 
															+    print("Program starts execution!")
														
 
															+    logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(name)s - %(levelname)s - %(message)s')
														
 
															+    logger = logging.getLogger("analysis_report log")
														
 
															+    from waitress import serve
														
 
															+    serve(app, host="0.0.0.0", port=10092)
														
 
															+    print("server start!")
														
--- a/models_processing/model_predict/model_prediction_lightgbm.py
+++ b/models_processing/model_predict/model_prediction_lightgbm.py
@@ -5,40 +5,8 @@ from flask import Flask,request
 
															 import time
														
 
															 import logging
														
 
															 import traceback
														
 
															-
														
 
															+from common.database_dml import get_data_from_mongo,insert_data_into_mongo
														
 
															 app = Flask('model_prediction_lightgbm——service')
														
 
															-
														
 
															-
														
 
															-def get_data_from_mongo(args):
														
 
															-    mongodb_connection,mongodb_database,mongodb_read_table,timeBegin,timeEnd = "mongodb://root:sdhjfREWFWEF23e@192.168.1.43:30000/",args['mongodb_database'],args['mongodb_read_table'],args['timeBegin'],args['timeEnd']
														
 
															-    client = MongoClient(mongodb_connection)
														
 
															-    # 选择数据库（如果数据库不存在，MongoDB 会自动创建）
														
 
															-    db = client[mongodb_database]
														
 
															-    collection = db[mongodb_read_table]  # 集合名称
														
 
															-    query = {"dateTime": {"$gte": timeBegin, "$lte": timeEnd}}
														
 
															-    cursor = collection.find(query)
														
 
															-    data = list(cursor)
														
 
															-    df = pd.DataFrame(data)
														
 
															-    # 4. 删除 _id 字段（可选）
														
 
															-    if '_id' in df.columns:
														
 
															-        df = df.drop(columns=['_id'])
														
 
															-    client.close()
														
 
															-    return df
														
 
															-    
														
 
															-
														
 
															-def insert_data_into_mongo(res_df,args):
														
 
															-    mongodb_connection,mongodb_database,mongodb_write_table = "mongodb://root:sdhjfREWFWEF23e@192.168.1.43:30000/",args['mongodb_database'],args['mongodb_write_table']
														
 
															-    client = MongoClient(mongodb_connection)
														
 
															-    db = client[mongodb_database]
														
 
															-    if mongodb_write_table in db.list_collection_names():
														
 
															-        db[mongodb_write_table].drop()
														
 
															-        print(f"Collection '{mongodb_write_table} already exist, deleted successfully!")
														
 
															-    collection = db[mongodb_write_table]  # 集合名称
														
 
															-    # 将 DataFrame 转为字典格式
														
 
															-    data_dict = res_df.to_dict("records")  # 每一行作为一个字典
														
 
															-    # 插入到 MongoDB
														
 
															-    collection.insert_many(data_dict)
														
 
															-    print("data inserted successfully!")
														
 
															 def model_prediction(df,args):
														
--- a/models_processing/model_predict/model_prediction_lstm.py
+++ b/models_processing/model_predict/model_prediction_lstm.py
@@ -1,78 +1,13 @@
 
															-import pandas as pd
														
 
															-from pymongo import MongoClient
														
 
															 from flask import Flask,request
														
 
															 import time
														
 
															 import logging
														
 
															 import traceback
														
 
															-from io import BytesIO
														
 
															-import joblib
														
 
															 import numpy as np
														
 
															-import h5py
														
 
															-import tensorflow as tf
														
 
															 from itertools import chain
														
 
															-
														
 
															-
														
 
															+from common.database_dml import get_data_from_mongo,insert_data_into_mongo,get_h5_model_from_mongo,get_scaler_model_from_mongo
														
 
															 app = Flask('model_prediction_lstm——service')
														
 
															-def get_data_from_mongo(args):
														
 
															-    mongodb_connection,mongodb_database,mongodb_read_table,timeBegin,timeEnd = "mongodb://root:sdhjfREWFWEF23e@192.168.1.43:30000/",args['mongodb_database'],args['mongodb_read_table'],args['timeBegin'],args['timeEnd']
														
 
															-    client = MongoClient(mongodb_connection)
														
 
															-    # 选择数据库（如果数据库不存在，MongoDB 会自动创建）
														
 
															-    db = client[mongodb_database]
														
 
															-    collection = db[mongodb_read_table]  # 集合名称
														
 
															-    query = {"dateTime": {"$gte": timeBegin, "$lte": timeEnd}}
														
 
															-    cursor = collection.find(query)
														
 
															-    data = list(cursor)
														
 
															-    df = pd.DataFrame(data)
														
 
															-    # 4. 删除 _id 字段（可选）
														
 
															-    if '_id' in df.columns:
														
 
															-        df = df.drop(columns=['_id'])
														
 
															-    client.close()
														
 
															-    return df
														
 
															-    
														
 
															-
														
 
															-def insert_data_into_mongo(res_df,args):
														
 
															-    mongodb_connection,mongodb_database,mongodb_write_table = "mongodb://root:sdhjfREWFWEF23e@192.168.1.43:30000/",args['mongodb_database'],args['mongodb_write_table']
														
 
															-    client = MongoClient(mongodb_connection)
														
 
															-    db = client[mongodb_database]
														
 
															-    if mongodb_write_table in db.list_collection_names():
														
 
															-        db[mongodb_write_table].drop()
														
 
															-        print(f"Collection '{mongodb_write_table} already exist, deleted successfully!")
														
 
															-    collection = db[mongodb_write_table]  # 集合名称
														
 
															-    # 将 DataFrame 转为字典格式
														
 
															-    data_dict = res_df.to_dict("records")  # 每一行作为一个字典
														
 
															-    # 插入到 MongoDB
														
 
															-    collection.insert_many(data_dict)
														
 
															-    print("data inserted successfully!")
														
 
															-
														
 
															-
														
 
															-def get_model_from_mongo(args):
														
 
															-    mongodb_connection,mongodb_database,model_table,model_name = "mongodb://root:sdhjfREWFWEF23e@192.168.1.43:30000/",args['mongodb_database'],args['model_table'],args['model_name']
														
 
															-    client = MongoClient(mongodb_connection)
														
 
															-    # 选择数据库（如果数据库不存在，MongoDB 会自动创建）
														
 
															-    db = client[mongodb_database]
														
 
															-    collection = db[model_table]  # 集合名称
														
 
															-
														
 
															-     # 查询 MongoDB 获取模型数据
														
 
															-    model_doc = collection.find_one({"model_name": model_name})
														
 
															-    if model_doc:
														
 
															-        model_data = model_doc['model_data']  # 获取模型的二进制数据
														
 
															-        # 将二进制数据加载到 BytesIO 缓冲区
														
 
															-        model_buffer = BytesIO(model_data)
														
 
															-        # 从缓冲区加载模型
														
 
															-         # 使用 h5py 和 BytesIO 从内存中加载模型
														
 
															-        with h5py.File(model_buffer, 'r') as f:
														
 
															-            model = tf.keras.models.load_model(f)
														
 
															-        print(f"{model_name}模型成功从 MongoDB 加载！")
														
 
															-        client.close()
														
 
															-        return model
														
 
															-    else:
														
 
															-        print(f"未找到model_name为 {model_name} 的模型。")
														
 
															-        client.close()
														
 
															-        return None
														
 
															-
														
 
															-
														
 
															 # 创建时间序列数据
														
 
															 def create_sequences(data_features,data_target,time_steps):
														
 
															     X, y = [], []
														
@@ -86,28 +21,16 @@ def create_sequences(data_features,data_target,time_steps):
 
															                 y.append(data_target[i + time_steps -1])
														
 
															         return np.array(X), np.array(y)
														
 
															-def model_prediction(df,args):
														
 
															-
														
 
															-    mongodb_connection, mongodb_database, scaler_table, features, time_steps, col_time = ("mongodb://root:sdhjfREWFWEF23e@192.168.1.43:30000/",
														
 
															-                                        args['mongodb_database'], args['scaler_table'], str_to_list(args['features']),int(args['time_steps']),args['col_time'])
														
 
															-    client = MongoClient(mongodb_connection)
														
 
															-    # 选择数据库（如果数据库不存在，MongoDB 会自动创建）
														
 
															-    db = client[mongodb_database]
														
 
															-    collection = db[scaler_table]  # 集合名称
														
 
															-    # Retrieve the scalers from MongoDB
														
 
															-    scaler_doc = collection.find_one()
														
 
															-    # Deserialize the scalers
														
 
															-    feature_scaler_bytes = BytesIO(scaler_doc["feature_scaler"])
														
 
															-    feature_scaler = joblib.load(feature_scaler_bytes)
														
 
															-    target_scaler_bytes = BytesIO(scaler_doc["target_scaler"])
														
 
															-    target_scaler = joblib.load(target_scaler_bytes)
														
 
															+def model_prediction(df,args):
														
 
															+    features, time_steps, col_time =  str_to_list(args['features']), int(args['time_steps']),args['col_time']
														
 
															+    feature_scaler,target_scaler = get_scaler_model_from_mongo(args)
														
 
															     df = df.fillna(method='ffill').fillna(method='bfill').sort_values(by=col_time)
														
 
															     scaled_features = feature_scaler.transform(df[features])
														
 
															     X_predict, _ = create_sequences(scaled_features, [], time_steps)
														
 
															     # 加载模型时传入自定义损失函数
														
 
															     # model = load_model(f'{farmId}_model.h5', custom_objects={'rmse': rmse})
														
 
															-    model = get_model_from_mongo(args)
														
 
															+    model = get_h5_model_from_mongo(args)
														
 
															     y_predict = list(chain.from_iterable(target_scaler.inverse_transform([model.predict(X_predict).flatten()])))
														
 
															     result = df[-len(y_predict):]
														
 
															     result['predict'] = y_predict
														
--- a/models_processing/model_train/model_training_lightgbm.py
+++ b/models_processing/model_train/model_training_lightgbm.py
@@ -1,43 +1,13 @@
 
															 import lightgbm as lgb
														
 
															-import pandas as pd 
														
 
															 import numpy as np
														
 
															-from pymongo import MongoClient
														
 
															-import pickle
														
 
															 from sklearn.model_selection import train_test_split
														
 
															 from sklearn.metrics import mean_squared_error,mean_absolute_error
														
 
															 from flask import Flask,request
														
 
															 import time
														
 
															 import traceback
														
 
															 import logging
														
 
															-
														
 
															+from common.database_dml import get_data_from_mongo,insert_pickle_model_into_mongo
														
 
															 app = Flask('model_training_lightgbm——service')
														
 
															-def get_data_from_mongo(args):
														
 
															-    mongodb_connection,mongodb_database,mongodb_read_table,timeBegin,timeEnd = "mongodb://root:sdhjfREWFWEF23e@192.168.1.43:30000/",args['mongodb_database'],args['mongodb_read_table'],args['timeBegin'],args['timeEnd']
														
 
															-    client = MongoClient(mongodb_connection)
														
 
															-    # 选择数据库（如果数据库不存在，MongoDB 会自动创建）
														
 
															-    db = client[mongodb_database]
														
 
															-    collection = db[mongodb_read_table]  # 集合名称
														
 
															-    query = {"dateTime": {"$gte": timeBegin, "$lte": timeEnd}}
														
 
															-    cursor = collection.find(query)
														
 
															-    data = list(cursor)
														
 
															-    df = pd.DataFrame(data)
														
 
															-    # 4. 删除 _id 字段（可选）
														
 
															-    if '_id' in df.columns:
														
 
															-        df = df.drop(columns=['_id'])
														
 
															-    client.close()
														
 
															-    return df
														
 
															-    
														
 
															-
														
 
															-def insert_model_into_mongo(model_data,args):
														
 
															-    mongodb_connection,mongodb_database,mongodb_write_table = "mongodb://root:sdhjfREWFWEF23e@192.168.1.43:30000/",args['mongodb_database'],args['mongodb_write_table']
														
 
															-    client = MongoClient(mongodb_connection)
														
 
															-    db = client[mongodb_database]
														
 
															-    if mongodb_write_table in db.list_collection_names():
														
 
															-        db[mongodb_write_table].drop()
														
 
															-        print(f"Collection '{mongodb_write_table} already exist, deleted successfully!")
														
 
															-    collection = db[mongodb_write_table]  # 集合名称
														
 
															-    collection.insert_one(model_data)
														
 
															-    print("model inserted successfully!")
														
 
															 def build_model(df,args):
														
@@ -75,14 +45,8 @@ def build_model(df,args):
 
															     mae = mean_absolute_error(y_test, y_pred)
														
 
															     print(f'The test rmse is: {rmse},"The test mae is:"{mae}')
														
 
															-    # 序列化模型
														
 
															-    model_bytes = pickle.dumps(gbm)
														
 
															-    model_data = {
														
 
															-                'model_name': model_name,
														
 
															-                'model': model_bytes,     #将模型字节流存入数据库
														
 
															-        }
														
 
															-    print('Training completed!')
														
 
															-    return model_data
														
 
															+
														
 
															+    return gbm
														
 
															 def str_to_list(arg):
														
@@ -105,7 +69,7 @@ def model_training_lightgbm():
 
															         logger.info(args)
														
 
															         power_df = get_data_from_mongo(args)
														
 
															         model = build_model(power_df,args)
														
 
															-        insert_model_into_mongo(model,args)
														
 
															+        insert_pickle_model_into_mongo(model,args)
														
 
															         success = 1
														
 
															     except Exception as e:
														
 
															         my_exception = traceback.format_exc()
														
--- a/models_processing/model_train/model_training_lstm.py
+++ b/models_processing/model_train/model_training_lstm.py
@@ -12,68 +12,22 @@ import joblib
 
															 from tensorflow.keras.models import Sequential
														
 
															 from tensorflow.keras.layers import LSTM, Dense
														
 
															 from tensorflow.keras.callbacks import EarlyStopping, ReduceLROnPlateau
														
 
															-import matplotlib.pyplot as plt
														
 
															+# import matplotlib.pyplot as plt
														
 
															 import tensorflow as tf
														
 
															-
														
 
															+from common.database_dml import get_data_from_mongo,insert_h5_model_into_mongo
														
 
															 app = Flask('model_training_lightgbm——service')
														
 
															-def draw_loss(history):
														
 
															-    #绘制训练集和验证集损失
														
 
															-    plt.figure(figsize=(20, 8))
														
 
															-    plt.plot(history.history['loss'], label='Training Loss')
														
 
															-    plt.plot(history.history['val_loss'], label='Validation Loss')
														
 
															-    plt.title('Loss Curve')
														
 
															-    plt.xlabel('Epochs')
														
 
															-    plt.ylabel('Loss')
														
 
															-    plt.legend()
														
 
															-    plt.show()
														
 
															-
														
 
															-def get_data_from_mongo(args):
														
 
															-    mongodb_connection,mongodb_database,mongodb_read_table,timeBegin,timeEnd = "mongodb://root:sdhjfREWFWEF23e@192.168.1.43:30000/",args['mongodb_database'],args['mongodb_read_table'],args['timeBegin'],args['timeEnd']
														
 
															-    client = MongoClient(mongodb_connection)
														
 
															-    # 选择数据库（如果数据库不存在，MongoDB 会自动创建）
														
 
															-    db = client[mongodb_database]
														
 
															-    collection = db[mongodb_read_table]  # 集合名称
														
 
															-    query = {"dateTime": {"$gte": timeBegin, "$lte": timeEnd}}
														
 
															-    cursor = collection.find(query)
														
 
															-    data = list(cursor)
														
 
															-    df = pd.DataFrame(data)
														
 
															-    # 4. 删除 _id 字段（可选）
														
 
															-    if '_id' in df.columns:
														
 
															-        df = df.drop(columns=['_id'])
														
 
															-    client.close()
														
 
															-    return df
														
 
															-    
														
 
															-
														
 
															-def insert_model_into_mongo(model,feature_scaler_bytes,target_scaler_bytes ,args):
														
 
															-    mongodb_connection,mongodb_database,scaler_table,model_table,model_name = ("mongodb://root:sdhjfREWFWEF23e@192.168.1.43:30000/",
														
 
															-                                args['mongodb_database'],args['scaler_table'],args['model_table'],args['model_name'])
														
 
															-    client = MongoClient(mongodb_connection)
														
 
															-    db = client[mongodb_database]
														
 
															-    collection = db[scaler_table]  # 集合名称
														
 
															-    # Save the scalers in MongoDB as binary data
														
 
															-    collection.insert_one({
														
 
															-        "feature_scaler": feature_scaler_bytes.read(),
														
 
															-        "target_scaler": target_scaler_bytes.read()
														
 
															-    })
														
 
															-    print("model inserted successfully!")
														
 
															-    model_table = db[model_table]
														
 
															-    # 创建 BytesIO 缓冲区
														
 
															-    model_buffer = BytesIO()
														
 
															-    # 将模型保存为 HDF5 格式到内存 (BytesIO)
														
 
															-    model.save(model_buffer, save_format='h5')
														
 
															-    # 将指针移到缓冲区的起始位置
														
 
															-    model_buffer.seek(0)
														
 
															-    # 获取模型的二进制数据
														
 
															-    model_data = model_buffer.read()
														
 
															-    # 将模型保存到 MongoDB
														
 
															-    model_table.insert_one({
														
 
															-        "model_name": model_name,
														
 
															-        "model_data": model_data
														
 
															-    })
														
 
															-    print("模型成功保存到 MongoDB！")
														
 
															-
														
 
															+# def draw_loss(history):
														
 
															+#     #绘制训练集和验证集损失
														
 
															+#     plt.figure(figsize=(20, 8))
														
 
															+#     plt.plot(history.history['loss'], label='Training Loss')
														
 
															+#     plt.plot(history.history['val_loss'], label='Validation Loss')
														
 
															+#     plt.title('Loss Curve')
														
 
															+#     plt.xlabel('Epochs')
														
 
															+#     plt.ylabel('Loss')
														
 
															+#     plt.legend()
														
 
															+#     plt.show()
														
 
															 def rmse(y_true, y_pred):
														
 
															     return tf.math.sqrt(tf.reduce_mean(tf.square(y_true - y_pred)))
														
@@ -130,7 +84,7 @@ def build_model(data, args):
 
															                         validation_data=(X_test, y_test),
														
 
															                         verbose=2,
														
 
															                         callbacks=[early_stopping, reduce_lr])
														
 
															-    draw_loss(history)
														
 
															+    # draw_loss(history)
														
 
															     return model,feature_scaler_bytes,target_scaler_bytes
														
@@ -154,7 +108,7 @@ def model_training_lstm():
 
															         logger.info(args)
														
 
															         power_df = get_data_from_mongo(args)
														
 
															         model,feature_scaler_bytes,target_scaler_bytes = build_model(power_df,args)
														
 
															-        insert_model_into_mongo(model,feature_scaler_bytes,target_scaler_bytes ,args)
														
 
															+        insert_h5_model_into_mongo(model,feature_scaler_bytes,target_scaler_bytes ,args)
														
 
															         success = 1
														
 
															     except Exception as e:
														
 
															         my_exception = traceback.format_exc()
														
--- a/run_all.py
+++ b/run_all.py
@@ -9,7 +9,7 @@ services = [
 
															     ("data_processing/processing_limit_power/processing_limit_power_by_records.py", 10088),
														
 
															     ("data_processing/processing_limit_power/processing_limit_power_by_statistics_light.py", 10085),
														
 
															     ("data_processing/processing_limit_power/processing_limit_power_by_statistics_wind.py", 10093),
														
 
															-    ("evaluation_processing/analysis.py", 10092),
														
 
															+    ("evaluation_processing/analysis_report.py", 10092),
														
 
															     ("evaluation_processing/evaluation_accuracy.py", 10091),
														
 
															     ("models_processing/model_train/model_training_lightgbm.py", 10089),
														
 
															     ("models_processing/model_predict/model_prediction_lightgbm.py", 10090),