在使用 Excel 中,经常会用到数据透视表。所以在 Python 这里,也简单演示下。
1 2 3 4 5
| from pandas import Series,DataFrame import pandas as pd import matplotlib.pyplot as plt %matplotlib inline
|
1 2 3 4 5 6
| tips = sns.load_dataset('tips')
tips.head()
|
data:image/s3,"s3://crabby-images/17f89/17f89fdfb07927b1c0a43d9d0484ac4d04172344" alt="image.png"
数据透视表
1 2 3
| piovt_table = tips.pivot_table(values='tip', index='day') piovt_table
|
data:image/s3,"s3://crabby-images/6b5f7/6b5f75be401b66317eab155d311e33a93eae621e" alt="image.png"
1 2 3
| piovt_table = piovt_table.divide(piovt_table.sum(),axis=1) piovt_table
|
data:image/s3,"s3://crabby-images/7e798/7e798a3ee05729c42dc74096ff3fd2d4803e43e9" alt="image.png"
数据交叉表
1 2 3
| cross_table = pd.crosstab(index=tips['day'],columns=tips['size']) cross_table
|
data:image/s3,"s3://crabby-images/ed1cf/ed1cf1b7d7f2081388c64f04162bccce61c0185d" alt="image.png"
1 2 3
| df = cross_table.div(cross_table.sum(1),axis=0) df
|
data:image/s3,"s3://crabby-images/04161/04161d2ea495f7a1130c8caa576a48b8a930b3c8" alt="image.png"
1 2
| df.plot(kind='bar',stacked=True)
|
data:image/s3,"s3://crabby-images/1a9c3/1a9c37d42a25f12a3e8f2679835f4f63d8e23f53" alt="output_8_1.png"