Files
palkkakysely/pulkka/chart_utils.py
2022-08-31 15:09:27 +03:00

85 lines
2.1 KiB
Python

from bokeh import models as bm, plotting as bp
from bokeh.transform import factor_cmap
from pandas import DataFrame
from pulkka.data_utils import get_categorical_stats
CAT_Q_RADIUS = 0.1
gender_colormap = factor_cmap("Sukupuoli", ["#4834d4", "#eb4d4b"], ["mies", "nainen"])
def get_df_hover_tool(df: DataFrame):
return bm.HoverTool(tooltips=[(c, f"@{{{c}}}") for c in df.columns])
def set_yaxis_cash(plot):
plot.yaxis.axis_label = "Vuositulot"
plot.yaxis[0].formatter = bm.NumeralTickFormatter(format="€0")
def get_categorical_stats_plot(df, *, category, value, na_as_category=None, line=True):
df = get_categorical_stats(df, category, value, na_as_category=na_as_category)
df.reset_index(inplace=True)
df[category] = df[category].astype("category")
plot = bp.figure(
title=f"{category}/{value}", x_range=list(df[category].cat.categories)
)
set_yaxis_cash(plot)
plot.vbar(
df[category],
CAT_Q_RADIUS * 2.5,
df["max"],
df["min"],
color="#a4b0be",
fill_alpha=0.7,
)
plot.circle(
df[category],
df["q25"],
radius=CAT_Q_RADIUS,
legend_label="q25",
color="#f368e0",
)
plot.circle(
df[category],
df["q75"],
radius=CAT_Q_RADIUS,
legend_label="q75",
color="#00d2d3",
)
plot.circle(
df[category],
df["q90"],
radius=CAT_Q_RADIUS,
legend_label="q90",
color="#ff9f43",
)
if line:
plot.line(
df[category],
df["median"],
legend_label="median",
color="#1289A7",
line_width=4,
)
plot.line(
df[category], df["mean"], legend_label="mean", color="#B53471", line_width=4
)
else:
plot.circle(
df[category],
df["median"],
radius=CAT_Q_RADIUS,
legend_label="median",
color="#1289A7",
)
plot.circle(
df[category],
df["mean"],
radius=CAT_Q_RADIUS,
legend_label="mean",
color="#B53471",
)
return plot