From ff73b5137d51a06cbe96fc8c6a88e7f2715ecff0 Mon Sep 17 00:00:00 2001 From: odair mario <badwolves123@gmail.com> Date: Mon, 18 Sep 2017 10:18:32 -0300 Subject: [PATCH] analises iniciais --- script/analysis/course_analysis.py | 21 +++++++++++++++++---- 1 file changed, 17 insertions(+), 4 deletions(-) diff --git a/script/analysis/course_analysis.py b/script/analysis/course_analysis.py index 2c994c3..a9f9ce6 100644 --- a/script/analysis/course_analysis.py +++ b/script/analysis/course_analysis.py @@ -1,16 +1,31 @@ # -*- coding: utf-8 -*- -import pandas as pd +import pandas as pd import numpy as np +df = pd.read_excel("../base/historico.xls") +# imprime completamente um dataframe def print_analise(d): with pd.option_context('display.max_rows', None, 'display.max_columns', 27): print(d) + +# calcula as taxas +def func(x,matr): + c = matr[x['COD_ATIV_CURRIC']].values[0] + return (x['counts'] / c) + +#quantidade de matriculas +def qnt_matr(df): + return df.groupby(['COD_ATIV_CURRIC']).size() + + def analise(df): c = df.groupby(['COD_ATIV_CURRIC']).size() diciplinas = df.groupby(['COD_ATIV_CURRIC','SIGLA']).size().reset_index(name='counts') - i=diciplinas.groupby(['COD_ATIV_CURRIC','SIGLA']).apply(lambda x: x['counts'] / (c[x['COD_ATIV_CURRIC']].values[0])).reset_index(name='taxas') + i=diciplinas.groupby(['COD_ATIV_CURRIC','SIGLA','counts']).apply(lambda x: func(x,matr)).reset_index(name='taxas gerais') print_analise(i) + +matr = qnt_matr(df) analise(df) @@ -44,5 +59,3 @@ analise(df) ## c = lambda x: x+1 ## curses = df['COD_ATIV_CURRIC'].drop_duplicates() ## 'MATR_ALUNO',' -#p -#df = pd.read_excel("../base/historico.xls") -- GitLab