主要数据类型:Series 和 DataFrame

API

  1. import pandas as pd
  2. df = pd.DataFrame([[1,2,3],[4,5,6]],columns=["a", "b", "c"])
  3. # 获取列名字
  4. df.columns.values
  5. # 读取文件
  6. csv = pd.read_csv('../SalesJan2009.csv')
  7. # 获取数据
  8. csv.iloc[1,:]
  9. csv.Transaction_date
  10. # 添加列
  11. csv["Price2"] = csv.Price
  12. # 添加行(注意:DataFrame.append 已在 pandas 2.0 中移除,新版本请改用 pd.concat([csv, csv], ignore_index=True))
  13. csv2 = csv.append(csv, ignore_index=True)
  14. # 复杂查询
  15. # select * from csv where Latitude>30 and Latitude>0(第二个条件是多余的,仅用于演示用 & 组合多个条件)
  16. a = csv.loc[(csv.Latitude>30) & (csv.Latitude>0),:].reset_index()
  17. # select * from csv where Country like 'Aus%'
  18. b = csv.loc[csv.Country.str.startswith('Aus') , :].reset_index()
  19. # 去除空格:去左侧空格用 lstrip,去右侧空格用 rstrip,两侧都去用 strip
  20. csv.Country = csv.Country.str.rstrip()
  21. # order by(sort_values 返回排序后的新 DataFrame,不会修改原数据,需要时请把结果赋值给变量)
  22. csv.sort_values('Price', ascending=False)
  23. # group by(pandas 2.0 起,若存在非数值列,需写成 mean(numeric_only=True),否则会报 TypeError)
  24. f = csv.groupby(csv.Country).mean()
  25. print(f)