第十章-家用热水器用户行为分析与事件识别
10.1 数据探索分析
import pandas as pd
import matplotlib.pyplot as plt

# Exploratory step: load the raw records and plot how many rows fall into
# each category of the '有无水流' column ('无' vs. '有').

# NOTE(review): the path below is kept exactly as found; '..demo' looks like
# it may be missing a '/' after '..' -- confirm against the project layout.
inputfile = '..demo/data/original_data.xls'  # input data file
data = pd.read_excel(inputfile)  # load the data

# Inspect the distribution of the '有无水流' column.
# Data extraction: count each category once, then look both values up.
# .get(..., 0) keeps the plot working even if one category never occurs,
# instead of failing with a KeyError.
flow_counts = data['有无水流'].value_counts()
lv_non = flow_counts.get('无', 0)
lv_move = flow_counts.get('有', 0)

# Draw the bar chart.
fig = plt.figure(figsize=(6, 5))  # set the canvas size
plt.rcParams['font.sans-serif'] = 'SimHei'  # font used to render Chinese labels
plt.rcParams['axes.unicode_minus'] = False  # render the minus sign as ASCII '-' so it displays with this font
plt.bar(x=range(2), height=[lv_non, lv_move], width=0.4, alpha=0.8, color='skyblue')
plt.xticks([index for index in range(2)], ['无','