anweiguo
/
algorithm_platform


			
				
					
						
						
							123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247
							# # -*- coding: utf-8 -*-
# import pandas as pd
# import matplotlib.pyplot as plt
# from pymongo import MongoClient
# import pickle
# import numpy as np
# import plotly.express as px
# from plotly.subplots import make_subplots
# import plotly.graph_objects as go
# from flask import Flask,request,jsonify
# from waitress import serve
# import time
# import random
# import argparse
# import logging
# import traceback
# import os
# import lightgbm as lgb
#
# app = Flask('analysis_report——service')
# def get_data_from_mongo(args):
#     # 1.读数据
#     mongodb_connection,mongodb_database,all_table,accuracy_table,model_table,model_name = "mongodb://root:sdhjfREWFWEF23e@192.168.1.43:30000/",args['mongodb_database'],args['train_table'],args['accuracy_table'],args['model_table'],args['model_name']
#     client = MongoClient(mongodb_connection)
#     # 选择数据库（如果数据库不存在，MongoDB 会自动创建）
#     db = client[mongodb_database]
#     # 将游标转换为列表，并创建 pandas DataFrame
#     df_all = pd.DataFrame(db[all_table].find({}, {'_id': 0}))
#
#     df_accuracy = pd.DataFrame(db[accuracy_table].find({}, {'_id': 0}))
#
#     model_data = db[model_table].find_one({"model_name": model_name})
#     if model_data is not None:
#         model_binary = model_data['model']  # 确保这个字段是存储模型的二进制数据
#         # 反序列化模型
#         model = pickle.loads(model_binary)
#     client.close()
#     return df_all,df_accuracy,model
#
#
# def draw_info(df_all,df_accuracy,model,features,args):
#     #1.数据描述 数据描述：
#     col_time = args['col_time']
#     label = args['label']
#     df_accuracy_beginTime = df_accuracy[col_time].min()
#     df_accuracy_endTime = df_accuracy[col_time].max()
#     df_train = df_all[df_all[col_time]<df_accuracy_beginTime][features+[col_time,label]]
#     df_train_beginTime = df_train[col_time].min()
#     df_train_endTime = df_train[col_time].max()
#     text_content = f"训练数据时间范围：{df_train_beginTime} 至 {df_train_endTime}，共{df_train.shape[0]}条记录，测试集数据时间范围：{df_accuracy_beginTime} 至 {df_accuracy_endTime}。<br>lightgbm模型参数：{model.params}"
#     return text_content
#
#
#
# def draw_global_scatter(df,args):
#     # --- 1. 实际功率和辐照度的散点图 ---
#     col_x = args['scatter_col_x']
#     col_y = args['label']
#     scatter_fig = px.scatter(
#         df,
#         x=col_x,
#         y=col_y,
#         title=f"{col_x}和{col_y}的散点图",
#         labels={"辐照度": "辐照度 (W/m²)", "实际功率": "实际功率 (kW)"}
#     )
#     return scatter_fig
#
#
#
# def draw_corr(df,features,args):
#
#     # --- 2. 相关性热力图 ---
#     # 计算相关性矩阵
#     label = args['label']
#     features_coor = features+[label]
#     corr_matrix = df[features_coor].corr()
#     # 使用 Plotly Express 绘制热力图
#     heatmap_fig = px.imshow(corr_matrix,
#                     text_auto=True,  # 显示数值
#                     color_continuous_scale='RdBu',  # 配色方案
#                     title="Correlation Heatmap")
#     heatmap_fig.update_coloraxes(showscale=False)
#
#     return heatmap_fig
#
# def draw_feature_importance(model,features):
#     # --- 3. 特征重要性排名 ---
#     # 获取特征重要性
#     importance = model.feature_importance()  # 'split' 或 'gain'，根据需求选择
#
#     # 转换为 DataFrame 方便绘图
#     feature_importance_df = pd.DataFrame({
#         'Feature': features,
#         'Importance': importance
#     })
#     feature_importance_df = feature_importance_df.sort_values(by='Importance', ascending=False)
#
#     # 使用 Plotly Express 绘制条形图
#     importance_fig = px.bar(feature_importance_df, x='Feature', y='Importance',
#                  title="特征重要性排名",
#                  labels={'Feature': '特征', 'Importance': '重要性'},
#                  color='Importance',
#                  color_continuous_scale='Viridis')
#     # 更新每个 trace，确保没有图例
#
#     importance_fig.update_layout(title="模型特征重要性排名",
#                                  showlegend=False  # 移除图例
#                                 )
#     importance_fig.update_coloraxes(showscale=False)
#     return importance_fig
#
#
# def draw_data_info_table(content):
#     # --- 4. 创建数据说明的表格 ---
#     # 转换为表格格式：1行1列，且填充文字说明
#     # 转换为表格格式
#     # 创建一个空的图
#     table_fig = go.Figure()
#
#     # 第一部分: 显示文字说明
#     table_fig.add_trace(go.Table(
#         header=dict(
#             values=["说明"],  # 表格只有一列：说明
#             fill_color="paleturquoise",
#             align="center"
#         ),
#         cells=dict(
#             values=[[content]] ,  # 第一行填入文本说明
#             fill_color="lavender",
#             align="center"
#         )
#     ))
#
#
#     return table_fig
#
#
#
# def draw_accuracy_table(df,content):
#
#     # --- 4. 每日的准确率表格 ---
#     # 转换为表格格式
#     table_fig = go.Figure(
#         data=[
#             go.Table(
#                 header=dict(
#                     values=list(df.columns),
#                     fill_color="paleturquoise",
#                     align="center"
#                 ),
#                 cells=dict(
#                     values=[df[col] for col in df.columns],
#                     fill_color="lavender",
#                     align="center"
#                 )
#             )
#         ]
#     )
#     table_fig.update_layout(title="准确率表", showlegend=False)
#     return table_fig
#
#
# @app.route('/analysis_report', methods=['POST'])
# def analysis_report():
#     start_time = time.time()
#     result = {}
#     success = 0
#     path = ""
#     print("Program starts execution!")
#     try:
#         args = request.values.to_dict()
#         print('args',args)
#         logger.info(args)
#         #获取数据
#         df_all, df_accuracy, model = get_data_from_mongo(args)
#         features = model.feature_name()
#         text_content = draw_info(df_all,df_accuracy,model,features,args)
#         text_fig,scatter_fig,heatmap_fig,importance_fig,table_fig=draw_data_info_table(text_content),draw_global_scatter(df_all,args),draw_corr(df_all,features,args),draw_feature_importance(model,features),\
#         draw_accuracy_table(df_accuracy,text_content)
#         # --- 合并图表并保存到一个 HTML 文件 ---
#         # 创建子图布局
#         combined_fig = make_subplots(
#             rows=5, cols=1,
#             subplot_titles=["数据-模型概览","辐照度和实际功率的散点图", "相关性","特征重要性排名", "准确率表"],
#             row_heights=[0.3, 0.6, 0.6, 0.6, 0.4],
#             specs=[[{"type": "table"}], [{"type": "xy"}], [{"type": "heatmap"}], [{"type": "xy"}],[{"type": "table"}]]  # 指定每个子图类型
#         )
#         # 添加文本信息到子图（第一行）
#         # 添加文字说明
#         for trace in text_fig.data:
#             combined_fig.add_trace(trace, row=1, col=1)
#
#         # 添加散点图
#         for trace in scatter_fig.data:
#             combined_fig.add_trace(trace, row=2, col=1)
#
#         # 添加相关性热力图
#         for trace in heatmap_fig.data:
#             combined_fig.add_trace(trace, row=3, col=1)
#
#         # 添加特征重要性排名图
#         for trace in importance_fig.data:
#             combined_fig.add_trace(trace, row=4, col=1)
#
#         # 添加表格
#         for trace in table_fig.data:
#             combined_fig.add_trace(trace, row=5, col=1)
#
#         # 更新布局
#         combined_fig.update_layout(
#         height=1500,
#         title_text="分析结果汇总",  # 添加换行符以适应文本内容
#         title_x=0.5,  # 中心对齐标题
#         showlegend=False,
#         )
#         combined_fig.update_coloraxes(showscale=False)
#         filename = f"{int(time.time() * 1000)}_{random.randint(1000, 9999)}.html"
#         # 保存为 HTML
#         directory = '/usr/share/nginx/html'
#         if not os.path.exists(directory):
#             os.makedirs(directory)
#         file_path = os.path.join(directory, filename)
#         # combined_fig.write_html(f"D://usr//{filename}")
#         combined_fig.write_html(file_path)
#         path = f"http://ds2:10093/{filename}"
#         success = 1
#     except Exception as e:
#         my_exception = traceback.format_exc()
#         my_exception.replace("\n","\t")
#         result['msg'] = my_exception
#     end_time = time.time()
#     result['success'] = success
#     result['args'] = args
#     result['start_time'] = time.strftime('%Y-%m-%d %H:%M:%S', time.localtime(start_time))
#     result['end_time'] = time.strftime('%Y-%m-%d %H:%M:%S', time.localtime(end_time))
#     result['file_path'] = path
#     print("Program execution ends!")
#     return result
#
#
# if __name__=="__main__":
#     # print("Program starts execution!")
#     # logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(name)s - %(levelname)s - %(message)s')
#     # logger = logging.getLogger("analysis_report log")
#     # from waitress import serve
#     # serve(app, host="0.0.0.0", port=10092)
#     # print("server start!")