# coding=utf-8
"""Plot the mean book rating for each original publication year.

Reads ``./books.csv``, averages the ``average_rating`` column per
``original_publication_year`` and displays the result as a line chart.
"""
import pandas as pd
from matplotlib import pyplot as plt

file_path = "./books.csv"
df = pd.read_csv(file_path)

# Rows without a publication year cannot be assigned to a group; drop them.
data1 = df.dropna(subset=["original_publication_year"])

# Mean rating per publication year; the resulting Series is indexed by year.
grouped = data1.groupby("original_publication_year")["average_rating"].mean()
_x = grouped.index
_y = grouped.values

plt.figure(figsize=(20, 8), dpi=80)
# Points are plotted against their position in the grouped result rather than
# against the year value itself, so each year takes one equal horizontal step.
plt.plot(range(len(_x)), _y)
print(len(_x))  # number of distinct publication years
# Label every 10th position with its year, shown as an integer.
plt.xticks(list(range(0, len(_x), 10)), _x[::10].astype(int), rotation=45)
plt.show()