python实训2
import pandas as pd # 餐饮数据 data = pd.read_excel(r"C:\Users\Minori\Desktop\python实训\catering_sale.xls",index_col=u'日期') # 读取数据,指定“日期”列为索引列 print(data) print(data.describe(),data.describe().max()-data.describe().min()) import matplotlib.pyplot as plt # 导入图像库 plt.rcParams['font.sans-serif'] = ['SimHei'] # 用来正常显示中文标签 plt.rcParams['axes.unicode_minus'] = False # 用来正常显示负号 plt.figure() # 建立图像 p = data.boxplot(return_type='dict') # 画箱线图,直接使用DataFrame的方法 x = p['fliers'][0].get_xdata() # 'flies'即为异常值的标签 y = p['fliers'][0].get_ydata() y.sort() # 从小到大排序,该方法直接改变原对象 for i in range(len(x)): if i>0: plt.annotate(y[i], xy = (x[i],y[i]), xytext=(x[i]+0.05 -0.8/(y[i]-y[i-1]),y[i])) else: plt.annotate(y[i], xy = (x[i],y[i]), xytext=(x[i]+0.08,y[i])) plt.title('箱型图3127',fontsize=20) plt.show() # 展示箱线图
import pandas as pd import numpy as np data = pd.read_excel(r"C:\Users\Minori\Desktop\python实训\catering_sale.xls",names=['date','sale']) print(data.describe()) bins = [0,500,1000,1500,2000,2500,3000,3500,4000] labels = ['A_lei','[500,1000)','[1000,1500)','[1500,2000)', '[2000,2500)','[2500,3000)','[3000,3500)','[3500,4000)'] data['sale分层'] = pd.cut(data.sale, bins, labels=labels) print(data) aggResult = data.groupby('sale分层').agg({'sale':'count'}) print(aggResult) pAggResult = round(aggResult/aggResult.sum(), 2, ) import matplotlib.pyplot as plt plt.figure(figsize=(10,6)) # 设置图框大小尺寸 pAggResult['sale'].plot(kind='bar',width=0.8,fontsize=10) # 绘制频率直方图 plt.rcParams['font.sans-serif'] = ['SimHei'] # 用来正常显示中文标签 plt.title('季度销售额频率分布直方图3127',fontsize=20) plt.show()
import pandas as pd import matplotlib.pyplot as plt data = pd.read_excel(r"C:\Users\Minori\Desktop\python实训\catering_dish_profit.xls") # 餐饮数据 x =data['盈利'] labels = data['菜品名'] plt.figure(figsize=(8,6)) plt.pie(x,labels=labels) plt.rcParams['font.sans-serif'] = 'SimHei' plt.title('菜品销售分布(饼图)3127',fontsize=20) plt.axis('equal') plt.show()
import pandas as pd import matplotlib.pyplot as plt data = pd.read_excel(r"C:\Users\Minori\Desktop\python实训\catering_dish_profit.xls") # 餐饮数据 x=data['菜品名'] y=data['盈利'] plt.figure(figsize=(8,4)) plt.bar(x,y) plt.rcParams['font.sans-serif']='SimHei' plt.xlabel('菜品') plt.ylabel('销量') plt.title('菜品销售量分布(条形图)3127',fontsize=20) plt.show()
#部门之间 import pandas as pd import matplotlib.pyplot as plt from pylab import mplmpl.rcParams['font.sans-serif'] = ['SimHei'] data=pd.read_excel(r"C:\Users\Minori\Desktop\python实训\dish_sale.xls") plt.figure(figsize=(8,4)) plt.plot(data['月份'],data['A部门'],color='green',label='A部门',marker='o') plt.plot(data['月份'],data['B部门'],color='red',label='B部门',marker='s') plt.plot(data['月份'],data['C部门'],color='skyblue',label='C部门',marker='x') plt.legend() plt.ylabel('销售额(万元)') plt.title('部门之间销售金额比较3127',fontsize=20) plt.show()
import pandas as pd import matplotlib.pyplot as plt from pylab import mpl mpl.rcParams['font.sans-serif'] = ['SimHei'] data=pd.read_excel(r"C:\Users\Minori\Desktop\python实训\dish_sale_b.xls") plt.figure(figsize=(8,4)) plt.plot(data['月份'],data['2012年'],color='green',label='2012年',marker='o') plt.plot(data['月份'],data['2013年'],color='red',label='2013年',marker='s') plt.plot(data['月份'],data['2014年'],color='blue',label='2014年',marker='x') plt.legend() plt.ylabel('销售额(万元)') plt.title('B部门各年份之间销售金额的比较3104',fontsize=20) plt.show()