# datapro.py

import pandas as pd
import matplotlib.pyplot as plt
  3. def split_test():
  4. # 读取大型数据集
  5. large_dataset = pd.read_csv("../data/Dataset_test/power/power_test.csv")
  6. # 将数据集等分为5个较小的数据集
  7. num_splits = 5
  8. split_size = len(large_dataset) // num_splits
  9. small_datasets = []
  10. for i in range(num_splits):
  11. start = i * split_size
  12. end = (i + 1) * split_size if i < num_splits - 1 else len(large_dataset)
  13. small_datasets.append(large_dataset[start:end])
  14. # 保存5个较小的数据集为.csv文件
  15. for i, small_dataset in enumerate(small_datasets):
  16. small_dataset.to_csv(f"../data/Dataset_test/power/power_dataset_{i + 1}.csv", index=False)
  17. if __name__ == '__main__':
  18. # 读取Excel文件
  19. # df = pd.read_excel("./data/nwp1.xlsx")
  20. #
  21. # # 计算分段数量
  22. # num_windows = df.shape[0] // 16
  23. #
  24. # # 循环每一个分段
  25. # for i in range(num_windows):
  26. # window = df.iloc[i * 16:(i + 1) * 16,2:-2]
  27. # data = window.astype(float)
  28. #
  29. # # 将数据绘制为图像
  30. # plt.imshow(data, cmap="gray")
  31. #
  32. # # 保存图像
  33. # plt.savefig("./wind/window_{}.png".format(i))
  34. split_test()