diff --git a/pipelines/datasets/br_cvm_fi/tasks.py b/pipelines/datasets/br_cvm_fi/tasks.py index b6b19ebb7..fb15d7125 100644 --- a/pipelines/datasets/br_cvm_fi/tasks.py +++ b/pipelines/datasets/br_cvm_fi/tasks.py @@ -226,9 +226,9 @@ def clean_data_and_make_partitions(path: str, table_id: str) -> str: df = pd.read_csv(f"{path}{file}", sep=";") log(f"File {file} read.") - df.rename(columns={'CNPJ_FUNDO_CLASSE':'CNPJ_FUNDO'}, inplace=True) + df["CNPJ_FUNDO_CLASSE"] = df["CNPJ_FUNDO_CLASSE"].str.replace(r"[/.-]", "") - df["CNPJ_FUNDO"] = df["CNPJ_FUNDO"].str.replace(r"[/.-]", "") + df.drop("ID_SUBCLASSE",axis=1, inplace=True) df = rename_columns(df_arq, df)