mirror of
https://github.com/koodiklinikka/palkkakysely.git
synced 2026-02-13 06:52:28 +00:00
Tweak everything for 2023
This commit is contained in:
@@ -1,11 +1,15 @@
|
||||
import pandas as pd
|
||||
|
||||
from pulkka.column_maps import KKPALKKA_COL, VUOSITULOT_COL
|
||||
from pulkka.config import OUT_DIR
|
||||
from pulkka.data_ingest import read_data, force_tulot_numeric, force_age_numeric
|
||||
from pulkka.data_ingest import read_data, force_age_numeric
|
||||
from ydata_profiling import ProfileReport
|
||||
|
||||
|
||||
def main():
|
||||
df = read_data()
|
||||
df = force_tulot_numeric(df)
|
||||
df[KKPALKKA_COL] = pd.to_numeric(df[KKPALKKA_COL], errors="coerce")
|
||||
df[VUOSITULOT_COL] = pd.to_numeric(df[VUOSITULOT_COL], errors="coerce")
|
||||
df = force_age_numeric(df)
|
||||
profile = ProfileReport(df)
|
||||
profile.config.vars.cat.n_obs = 20
|
||||
|
||||
Reference in New Issue
Block a user