Initial charts

This commit is contained in:
Aarni Koskela
2021-02-19 13:00:58 +02:00
parent 060a6f8858
commit e769c6d0ce
5 changed files with 99 additions and 1 deletions

13
data_utils.py Normal file
View File

@@ -0,0 +1,13 @@
import pandas as pd
def get_categorical_stats(
    df: pd.DataFrame, category_col: str, value_col: str
) -> pd.DataFrame:
    """Compute per-category summary statistics of a value column.

    Values in ``value_col`` are coerced to numbers with ``pd.to_numeric``;
    anything that cannot be parsed becomes NaN. Rows whose value is NaN or
    not strictly positive are discarded before grouping.

    Args:
        df: Input frame. It is copied first, so the caller's frame is not
            modified.
        category_col: Name of the column to group by.
        value_col: Name of the column holding the values to summarise.

    Returns:
        A frame indexed by the distinct values of ``category_col`` with the
        columns ``mean``, ``min``, ``max`` and ``median``.
    """
    # Drop records where value is not numeric (or not positive) before
    # grouping...
    df = df.copy()
    df[value_col] = pd.to_numeric(df[value_col], errors="coerce")
    # The parentheses are essential: ``&`` binds tighter than ``>``, so
    # ``notna() & values > 0`` would evaluate ``(notna() & values) > 0`` and
    # let negative values through.
    is_valid = df[value_col].notna() & (df[value_col] > 0)
    df = df[is_valid]
    # ... then carry on.
    group = df[[category_col, value_col]].groupby(category_col)
    return group[value_col].agg(["mean", "min", "max", "median"])