# Source code for cowidev.vax.manual.twitter.uganda

import pandas as pd
import re

from cowidev.utils.clean import clean_count, clean_date
from cowidev.vax.manual.twitter.base import TwitterCollectorBase


class Uganda(TwitterCollectorBase):
    """Twitter collector for Uganda, reading the ``MinofHealthUG`` account.

    Scans the account's tweets and proposes one row per relevant tweet.
    Fetching the tweets, deciding when to stop and exporting the result are
    delegated to ``TwitterCollectorBase`` (not shown here).
    """

    def __init__(self, api):
        """Configure the collector for the Uganda Ministry of Health account.

        Args:
            api: Twitter API client, forwarded untouched to the base class.
        """
        super().__init__(
            api=api,
            username="MinofHealthUG",
            location="Uganda",
            # NOTE(review): presumably asks the base class to add empty metric
            # columns for rows lacking them -- confirm in TwitterCollectorBase.
            add_metrics_nan=True,
        )

    def _propose_df(self):
        """Build a DataFrame of candidate data points from the tweets.

        Two kinds of tweets are kept:

        * "Results of COVID-19 tests ..." tweets that carry media: the row
          holds the date, text, tweet URL and the URL of the first media item.
          No metric is extracted for these (presumably the figures have to be
          read from the attached image -- confirm with the maintainers).
        * Tweets containing "against COVID-19: <number>": the row holds the
          date, the parsed ``total_vaccinations``, the text and the tweet URL.

        Iteration stops at the first tweet for which ``self.stop_search``
        returns a truthy value.

        Returns:
            pandas.DataFrame: one row per retained tweet, in iteration order;
            an empty DataFrame when nothing matches.
        """
        # Compile once, outside the loop.
        results_pattern = re.compile(r"Results of COVID-19 tests .*")
        vaccinations_pattern = re.compile(r"against COVID-19: ([\d,]+)")

        data = []
        for tweet in self.tweets:
            dt = clean_date(tweet.created_at)
            if self.stop_search(dt):
                break

            text = tweet.full_text
            if results_pattern.search(text):
                # A results tweet is only useful with its attachment; without
                # media it is skipped entirely (it is NOT re-tested against
                # the vaccinations pattern, matching the original if/elif).
                media = tweet.entities["media"] if "media" in tweet.entities else None
                if media:  # also guards against a present-but-empty list
                    data.append(
                        {
                            "date": dt,
                            "text": text,
                            "source_url": self.build_post_url(tweet.id),
                            "media_url": media[0]["media_url_https"],
                        }
                    )
                continue

            # Search once and reuse the match object.
            match = vaccinations_pattern.search(text)
            if match:
                data.append(
                    {
                        "date": dt,
                        "total_vaccinations": clean_count(match.group(1)),
                        "text": text,
                        "source_url": self.build_post_url(tweet.id),
                    }
                )
        return pd.DataFrame(data)


def main(api):
    """Run the Uganda collector and export its result via ``to_csv``.

    Args:
        api: Twitter API client handed to the ``Uganda`` collector.
    """
    Uganda(api).to_csv()