# Notes
import pandas as pd
import matplotlib.pyplot as plt
# Load the IMDB movie dataset and take a quick look at it.
file_path = './pandas_data/IMDB-Movie-Data.csv'
df = pd.read_csv(file_path)
print(df.head(1))
# DataFrame.info() writes its summary to stdout itself and returns None, so
# wrapping it in print() would only add a stray "None" line.
df.info()

# Goal: look at the distribution of rating / runtime.
# Chart choice: histogram (runtime is plotted below).

# Prepare the data. Missing values are dropped so min/max are well defined.
runtime_data = df["Runtime (Minutes)"].dropna().values
# Convert to plain Python ints so they can be fed to range() below.
# NOTE(review): assumes runtimes are whole minutes -- confirm against the CSV.
max_runtime = int(runtime_data.max())
min_runtime = int(runtime_data.min())

# Build explicit bin edges of a fixed width. Passing only a bin *count* makes
# matplotlib split [min, max] into equal parts whose edges generally do not
# fall on the tick positions; explicit edges keep bins and ticks aligned.
bin_width = 10
bin_edges = list(range(min_runtime, max_runtime + bin_width, bin_width))
# Number of bins implied by the edges (kept under its original name).
num_bin = len(bin_edges) - 1

# Set the figure size.
plt.figure(figsize=(20, 8), dpi=80)
plt.hist(runtime_data, bins=bin_edges)
# Put one tick on every bin edge so each bar's range can be read directly.
plt.xticks(bin_edges)
plt.show()