diff --git a/src/script/.gitignore b/src/script/.gitignore deleted file mode 100644 index 2a40d2a5a1d39024d84e71b8cf5764efc6082a33..0000000000000000000000000000000000000000 --- a/src/script/.gitignore +++ /dev/null @@ -1,6 +0,0 @@ -cache/* -*.json -*.xls -*.csv -script/base/*.xls -script/base/*.csv diff --git a/src/script/base/dataframe_base.py b/src/script/base/dataframe_base.py index 3d491a234b5bb34038b630b85f42c7ab52d72635..7097a4f38c77c77d83832aebae06d1e7d5d5dfcc 100644 --- a/src/script/base/dataframe_base.py +++ b/src/script/base/dataframe_base.py @@ -1,14 +1,10 @@ -import re + import os -import sys import pandas as pd import numpy as np -from glob import glob -from json import load as json_load from script.utils.situations import * - class DataframeHolder: def __init__(self, dataframe): self.students = dataframe.groupby('MATR_ALUNO') @@ -68,7 +64,6 @@ def fix_dataframes(dataframes): fix_evasion(merged) fix_carga(merged) - return merged @@ -79,6 +74,7 @@ def clean_history(df): ], axis=1, inplace=True) df['PERIODO'] = df['PERIODO'].str.split('o').str[0] + def clean_register(df): df_split = df['PERIODO_INGRESSO'].str.split('/') df['ANO_INGRESSO'] = df_split.str[0] @@ -87,7 +83,6 @@ def clean_register(df): df['ANO_EVASAO'] = df_split.str[0] df['SEMESTRE_EVASAO'] = df_split.str[1].str.split('o').str[0] - df.drop(['ID_PESSOA', 'NOME_PESSOA', 'DT_NASCIMENTO', 'NOME_UNIDADE','COD_CURSO', 'PERIODO_INGRESSO', 'PERIODO_EVASAO'],axis=1, inplace=True)