#!/usr/bin/env python
# -*- coding: utf-8 -*-
'''
@Author :liuyuqi.gov@msn.cn
@Time :2018/7/5 3:08
@File :test_pandas.py
'''
from io import StringIO

import pandas as pd
  9. def t1():
  10. a = [['a', '1.2', '4.2'], ['b', '70', '0.03'], ['x', '5', '0']]
  11. df = pd.DataFrame(a, columns=list("ABC"))
  12. print(df.dtypes)
  13. print(df)
  14. def t2():
  15. obj = pd.Series(list('cadaabbcc'))
  16. uniques = obj.unique()
  17. print(obj.dtypes)
  18. print(uniques.shape)
  19. def t3():
  20. df = pd.DataFrame()
  21. df2 = pd.read_csv()
  22. df3 = pd.Series()
  23. pd.concat()
  24. pd.to_datetime()
  25. pd.merge()
  26. pd.Timestamp
  27. def t4():
  28. df = pd.DataFrame(columns=list("AB"), data=[[1, 2], [3, 4]])
  29. df["C"] = None
  30. df["C"][1] = 2
  31. print(df)
  32. def t5():
  33. ser1 = pd.Series([1, 2, 3, 4])
  34. ser2 = pd.Series(range(4), index=["a", "b", "c", "d"])
  35. sdata = {'Ohio': 35000, 'Texas': 71000, 'Oregon': 16000, 'Utah': 5000}
  36. ser3 = pd.Series(sdata)
  37. # print(ser1)
  38. print(ser2)
  39. # 访问Series
  40. ser2["a"]
  41. # 所有索引
  42. ser2.index
  43. # 所有值
  44. ser2.values
  45. def t6():
  46. df = pd.DataFrame([{"A": "11", "B": "12"}, {"A": "111", "B": "121"}, {"A": "1111", "B": "1211"}])
  47. print(df)
  48. print(df.columns.size) # 列数 2
  49. h, l = df.shape
  50. print(h, l)
  51. print(df.iloc[:, 0].size) # 行数 3
  52. print(df.ix[[0]].index.values[0]) # 索引值 0
  53. print(df.ix[[0]].values[0][0]) # 第一行第一列的值 11
  54. print(df.ix[[1]].values[0][1]) # 第二行第二列的值 121
  55. t6()