Source code for cowidev.testing.batch.rwanda

import pandas as pd

from cowidev.utils.web import request_json
from cowidev.utils.clean import clean_date_series
from cowidev.testing.utils import make_monotonic
from cowidev.testing import CountryTestBase

class Rwanda(CountryTestBase):
    """Testing-data scraper for Rwanda.

    Fetches a JSON feed, keeps the cumulative test count per date and exports
    the resulting time series. The query parameters look like an ArcGIS
    feature-service request -- NOTE(review): confirm against the real endpoint.
    """

    location: str = "Rwanda"
    units: str = "samples tested"
    source_label: str = "Rwanda Ministry of Health"
    # NOTE(review): both URLs are empty in this file; `read` cannot fetch
    # anything until they are filled in.
    source_url: str = ""
    source_url_ref: str = ""
    # Maps flattened JSON field names (as produced by `pd.json_normalize`)
    # to the output column names.
    rename_columns: dict = {
        # "attributes.sample_tested": "Daily change in cumulative total",
        "attributes.cumulative_test": "Cumulative total",
        "attributes.created_date": "Date",
    }
    # Rows dated before this day are dropped in `pipe_filter`.
    date_start: str = "2021-11-08"
    # Query-string parameters sent with the request in `read`.
    params: dict = {
        "f": "json",
        "where": "1=1",
        "returnGeometry": False,
        "spatialRel": "esriSpatialRelIntersects",
        "orderByFields": "created_date desc",
        "outFields": "*",
        "resultRecordCount": 32000,
        "resultType": "standard",
        "cacheHint": True,
    }

    def read(self) -> pd.DataFrame:
        """Read data from the source.

        Returns:
            One row per entry of the response's ``features`` list, with nested
            keys flattened to dotted column names. Rows without a value in
            ``attributes.cumulative_test`` are dropped.
        """
        data = request_json(self.source_url, params=self.params)
        df = pd.json_normalize(data, record_path=["features"]).dropna(
            subset=["attributes.cumulative_test"]
        )
        return df

    def pipe_date(self, df: pd.DataFrame) -> pd.DataFrame:
        """Clean the ``Date`` column.

        The raw values are passed to ``clean_date_series`` with ``unit="ms"``
        (presumably epoch milliseconds -- confirm against the helper).
        """
        return df.assign(Date=clean_date_series(df["Date"], unit="ms"))

    def pipe_filter(self, df: pd.DataFrame) -> pd.DataFrame:
        """Filter out unwanted rows.

        Drops rows whose cumulative total equals 5147843.0, rows dated before
        ``date_start``, and all but the first row for each date.
        """
        # NOTE(review): 5147843.0 is presumably a known erroneous data point
        # in the source feed -- confirm before changing.
        df = df[df["Cumulative total"] != 5147843.0]
        df = df[(df["Date"] >= self.date_start)]
        return df.drop_duplicates(subset="Date")

    def pipeline(self, df: pd.DataFrame) -> pd.DataFrame:
        """Run the full transformation pipeline on the raw data.

        Steps, in order: rename columns, clean dates, filter rows, attach
        metadata, enforce monotonicity, sort by date, and keep only the first
        row for each distinct cumulative total.
        """
        return (
            df.pipe(self.pipe_rename_columns)
            .pipe(self.pipe_date)
            .pipe(self.pipe_filter)
            .pipe(self.pipe_metadata)
            .pipe(make_monotonic)
            .sort_values("Date")
            # After sorting by date, keep="first" retains the earliest date on
            # which each cumulative total was reported.
            .drop_duplicates(subset=["Cumulative total"], keep="first")
        )

    def export(self) -> None:
        """Read the source, run the pipeline and export the result."""
        # The frame must be built before it is exported; passing an unassigned
        # local to `export_datafile` raised UnboundLocalError.
        df = self.read().pipe(self.pipeline)
        self.export_datafile(df, attach=True)
def main():
    """Module entry point: instantiate the Rwanda scraper and run its export."""
    scraper = Rwanda()
    scraper.export()