From 4adfa0068687dee2ff40ed64b170e553a30c6fa8 Mon Sep 17 00:00:00 2001 From: Veronika Samborska <32176660+veronikasamborska1994@users.noreply.github.com> Date: Sun, 1 Dec 2024 10:53:10 +0100 Subject: [PATCH] =?UTF-8?q?=F0=9F=93=8A=20women's=20rights:=20wb=20gender?= =?UTF-8?q?=20stats=20-=20fix=20Slovakia's=20value=20(#3665)?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- etl/steps/data/garden/wb/2024-06-10/gender_statistics.py | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/etl/steps/data/garden/wb/2024-06-10/gender_statistics.py b/etl/steps/data/garden/wb/2024-06-10/gender_statistics.py index fe734d701c1..79c4a92e643 100644 --- a/etl/steps/data/garden/wb/2024-06-10/gender_statistics.py +++ b/etl/steps/data/garden/wb/2024-06-10/gender_statistics.py @@ -71,9 +71,10 @@ def run(dest_dir: str) -> None: countries_file=paths.country_mapping_path, ) # Pivot the dataframe so that each indicator is a separate column - tb = tb.pivot(index=["country", "year"], columns="wb_seriescode", values="value") - tb = tb.reset_index() + tb = tb.pivot(index=["country", "year"], columns="wb_seriescode", values="value").reset_index() + # Slovakia - should be the same as Czechoslovakia in the period 1970-1993 for the indicator SG.LAW.EQRM.WK as confirmed by the source (but not yet updated on their database) + tb.loc[(tb["country"] == "Slovakia") & (tb["year"].between(1970, 1993)), "SG.LAW.EQRM.WK"] = 1 # Add metadata by finding the descriptions and sources using indicator codes tb = add_metadata(tb, metadata_tb)