# data_explore.py
# -*- coding: utf-8 -*-
"""
@author: yq
@time: 2024/11/13
@desc: Data exploration
"""
import pandas as pd

from commom import f_save_train_df
  9. class DataExplore():
  10. def __init__(self, ):
  11. pass
  12. def distribution(self, df: pd.DataFrame) -> pd.DataFrame:
  13. """
  14. 数据分布,缺失率,中位数,众数,偏离度等
  15. """
  16. pass
  17. def save(self, df):
  18. """
  19. 数据探索结果固化
  20. """
  21. f_save_train_df("distribution", df)
  22. if __name__ == "__main__":
  23. pass