data_loader_excel.py 1020 B

12345678910111213141516171819202122232425262728293031323334353637383940
  1. # -*- coding: utf-8 -*-
  2. """
  3. @author: yq
  4. @time: 2024/10/31
  5. @desc:
  6. """
from typing import Union

import pandas as pd

from commom import get_logger
from .data_loader_base import DataLoaderBase
# Module-level logger obtained from the project's get_logger() helper.
# NOTE(review): not referenced by any code visible in this file.
logger = get_logger()
  11. class DataLoaderExcel(DataLoaderBase):
  12. def __init__(self, ):
  13. pass
  14. def get_connect(self):
  15. pass
  16. def close_connect(self):
  17. pass
  18. def get_data(self, file_path: str, sheet_name: str = 0) -> pd.DataFrame:
  19. df: pd.DataFrame = pd.DataFrame()
  20. if ".xlsx" in file_path:
  21. df = pd.read_excel(file_path, sheet_name=sheet_name, index_col=False)
  22. elif ".csv" in file_path:
  23. df = pd.read_csv(file_path)
  24. columns = df.columns.to_list()
  25. columns_new = []
  26. for idx, column in enumerate(columns):
  27. column = str(column)
  28. if idx != 0 and "Unnamed:" in column:
  29. columns_new.append(columns_new[-1])
  30. else:
  31. columns_new.append(column)
  32. df.columns = columns_new
  33. return df