# -*- coding: utf-8 -*-
# author:baoshan

import pandas as pd
import matplotlib.pyplot as plt
# Configure matplotlib once, up front, for Chinese chart text:
#   * 'font.sans-serif' -> SimHei so CJK titles/labels are drawn with a font
#     that has those glyphs;
#   * 'axes.unicode_minus' -> False so negative tick labels use the ASCII
#     hyphen instead of U+2212, which such fonts may not contain.
plt.rcParams.update({
    'font.sans-serif': ['SimHei'],
    'axes.unicode_minus': False,
})


def main():
    """Summarise city AQI data and chart the cities with the best air quality.

    Steps:
      1. Read ``china_city_aqi_teacher.csv`` from the current working
         directory and print its structure plus a preview of the first rows.
      2. Keep only the rows whose ``AQI`` value is greater than zero.
      3. Print the maximum, minimum and mean AQI of the cleaned data.
      4. Select the ``top_n`` rows with the lowest AQI, print them, and draw
         them as a line chart and a bar chart, saved as
         ``top50_aqi_line.png`` and ``top50_aqi_bar.png``.
      5. Display the figures with ``plt.show()``.

    Returns:
        None
    """
    # Single source of truth for how many cities are reported; the message,
    # chart titles and output file names below are all derived from it so
    # they can no longer disagree with the number of rows actually selected.
    top_n = 50

    aqi_data = pd.read_csv('china_city_aqi_teacher.csv')
    print('基本信息:')
    # DataFrame.info() writes its report to stdout itself and returns None,
    # so wrapping it in print() would add a stray "None" line.
    aqi_data.info()
    print('数据预览')
    print(aqi_data.head())

    # Data cleaning: keep only rows with AQI > 0.
    has_valid_aqi = aqi_data['AQI'] > 0
    clean_data = aqi_data[has_valid_aqi]

    # Basic statistics over the cleaned rows.
    print('AQI最大值', clean_data['AQI'].max())
    print('AQI最小值', clean_data['AQI'].min())
    print('AQI均值', clean_data['AQI'].mean())

    # Lowest AQI first, so the head of the sorted frame is the best air quality.
    top50_cities = clean_data.sort_values(by=['AQI'], ascending=True).head(top_n)
    chart_title = '空气质量最好的{}个城市'.format(top_n)
    print(chart_title)
    print(top50_cities)

    # Each DataFrame.plot call creates its own figure, which becomes the
    # current figure, so the savefig right after it saves that chart.
    top50_cities.plot(kind='line', x='City', y='AQI', title=chart_title, figsize=(20, 10))
    plt.savefig('top{}_aqi_line.png'.format(top_n))
    top50_cities.plot(kind='bar', x='City', y='AQI', title=chart_title, figsize=(20, 10))
    plt.savefig('top{}_aqi_bar.png'.format(top_n))
    plt.show()


# Run the analysis only when this file is executed as a script, so that
# importing the module does not trigger file reads or open plot windows.
if __name__ == '__main__':
    main()

 

使用 pandas 内置的绘图接口(DataFrame.plot,底层基于 matplotlib)绘图更简单。

相关文章:

  • 2022-12-23
  • 2022-12-23
  • 2022-02-10
  • 2021-12-06
  • 2021-09-29
  • 2021-11-28
  • 2022-12-23
猜你喜欢
  • 2022-12-23
  • 2021-04-21
  • 2021-07-22
  • 2022-12-23
  • 2022-12-23
  • 2021-05-10
相关资源
相似解决方案