owid · spoonerf · Dec 5, 2024 · Dec 5, 2024 · Dec 5, 2024 · Dec 5, 2024
diff --git a/etl/steps/data/garden/antibiotics/2024-12-02/microbe_amr.py b/etl/steps/data/garden/antibiotics/2024-12-02/microbe_amr.py
@@ -1,6 +1,5 @@
 """Load a meadow dataset and create a garden dataset."""
 
-import pandas as pd
 from owid.catalog import Table
 
 from etl.data_helpers import geo
@@ -35,9 +34,7 @@ def run(dest_dir: str) -> None:
     )
     tb_total = tb_total.rename(columns={"value": "total_deaths"}, errors="raise").drop(columns=["lower", "upper"])
 
-    tb = tb_amr.merge(tb_total, on=["country", "year", "infectious_syndrome"], how="right")
-    # Fill missing values with 0
-    tb["amr_attributable_deaths"] = tb["amr_attributable_deaths"].replace(pd.NA, 0)
+    tb = tb_amr.merge(tb_total, on=["country", "year", "infectious_syndrome"], how="inner")
     tb["non_amr_attributable_deaths"] = tb["total_deaths"] - tb["amr_attributable_deaths"]
     # Rename syndromes to be shorter for use in stacked bar charts
     tb = rename_syndromes(tb)

diff --git a/etl/steps/data/garden/antibiotics/2024-12-02/microbe_neonatal_amr.py b/etl/steps/data/garden/antibiotics/2024-12-02/microbe_neonatal_amr.py
@@ -1,6 +1,4 @@
 """Load a meadow dataset and create a garden dataset."""
-import pandas as pd
-
 from etl.data_helpers import geo
 from etl.helpers import PathFinder, create_dataset
 
@@ -39,9 +37,7 @@ def run(dest_dir: str) -> None:
     )
     tb_total = tb_total[tb_total["year"] == 2021]
 
-    tb = tb_amr.merge(tb_total, on=["country", "year", "pathogen"], how="right")
-    # Fill missing values with 0
-    tb["amr_attributable_deaths"] = tb["amr_attributable_deaths"].replace(pd.NA, 0)
+    tb = tb_amr.merge(tb_total, on=["country", "year", "pathogen"], how="inner")
     tb["non_amr_attributable_deaths"] = tb["total_deaths"] - tb["amr_attributable_deaths"]
 
     tb = geo.harmonize_countries(df=tb, countries_file=paths.country_mapping_path)

diff --git a/etl/steps/data/garden/antibiotics/2024-12-02/total_pathogen_bloodstream_amr.py b/etl/steps/data/garden/antibiotics/2024-12-02/total_pathogen_bloodstream_amr.py
@@ -28,9 +28,7 @@ def run(dest_dir: str) -> None:
         .rename(columns={"value": "total_deaths"})
     )
 
-    tb = tb.merge(tb_total, on=["country", "year", "pathogen", "pathogen_type"], how="right")
-
-    tb["amr_attributable_deaths"] = tb["amr_attributable_deaths"].fillna(0)
+    tb = tb.merge(tb_total, on=["country", "year", "pathogen", "pathogen_type"], how="inner")
     tb["non_amr_attributable_deaths"] = tb["total_deaths"] - tb["amr_attributable_deaths"]
     # Process data.
     tb = tb.drop(columns=["country", "pathogen_type"]).rename(columns={"pathogen": "country"})

diff --git a/etl/steps/data/garden/antibiotics/2024-12-04/microbe_total_pathogens_amr.py b/etl/steps/data/garden/antibiotics/2024-12-04/microbe_total_pathogens_amr.py
@@ -34,9 +34,7 @@ def run(dest_dir: str) -> None:
         countries_file=paths.country_mapping_path,
     )
 
-    tb = tb.merge(tb_total, on=["country", "year", "pathogen", "pathogen_type"], how="right")
-
-    tb["amr_attributable_deaths"] = tb["amr_attributable_deaths"].fillna(0)
+    tb = tb.merge(tb_total, on=["country", "year", "pathogen", "pathogen_type"], how="inner")
     tb["non_amr_attributable_deaths"] = tb["total_deaths"] - tb["amr_attributable_deaths"]
     # Process data.
     tb = tb.drop(columns=["country", "pathogen_type"]).rename(columns={"pathogen": "country"})