# -*- coding:utf-8 -*-
# @auth ivan
# @time 2018-07-16 11:45:41
# @goal list every file under the configured roots with its size (sorted
#       ascending), so that big files worth cleaning up can be spotted
import os
import pandas as pd

# Directories that are scanned recursively.
root_list = ['/data/project/Temp']


def collect_file_sizes(roots):
    """Return a ``[path, size_in_bytes]`` row for every file under *roots*.

    Each entry of *roots* is walked recursively with ``os.walk`` (use
    ``os.listdir`` instead if only the top level is wanted).  Every file
    path is printed as it is visited.

    Files whose size cannot be read (dangling symlink, file removed while
    the scan is running, permission problem) are reported and skipped
    instead of aborting the whole scan.  Roots that do not exist simply
    contribute no rows, because ``os.walk`` yields nothing for them.

    :param roots: iterable of directory paths to scan.
    :return: list of ``[path, size]`` lists, in traversal order.
    """
    rows = []
    for root in roots:
        for dirpath, _dirnames, filenames in os.walk(root):
            for filename in filenames:
                # os.path.join avoids a doubled separator when dirpath
                # already ends with one (e.g. root given as "/tmp/").
                path = os.path.join(dirpath, filename)
                print(path)
                try:
                    size = os.path.getsize(path)
                except OSError as err:
                    print("Skip %s: %s" % (path, err))
                    continue
                rows.append([path, size])
    return rows


print("Start!")
result = collect_file_sizes(root_list)
print("Finis!")
# Build the frame once from all rows; unlike pd.concat on a list of
# one-row frames this also works when no file was found at all.
data_all = pd.DataFrame(result, columns=['File', 'Size'])
data_all.sort_values('Size', inplace=True)
print(data_all)