data_process.py 720 B

123456789101112131415161718192021222324252627282930313233343536373839
# -*- coding: utf-8 -*-
"""
@author: yq
@time: 2024/11/13
@desc: Data processing
"""
  7. import pandas as pd
  8. from commom import f_save_train_df
  9. from entitys import MlConfigEntity
  10. class DataProcess():
  11. def __init__(self, ml_config: MlConfigEntity):
  12. self._ml_config = ml_config
  13. def data_fill(self, df: pd.DataFrame) -> pd.DataFrame:
  14. """
  15. 数据填充
  16. """
  17. pass
  18. def data_filter(self, df: pd.DataFrame) -> pd.DataFrame:
  19. """
  20. 数据筛选,删除缺失率高的特征或样本
  21. """
  22. pass
  23. def save(self, df):
  24. """
  25. 加工结果固化
  26. """
  27. f_save_train_df("distribution", df)
  28. if __name__ == "__main__":
  29. pass