from math import log
import pandas as pd
import matplotlib.pyplot as plt


# Load the case counts; the "date" column is parsed into timestamps on read.
data_path = "data/data.csv"
raw_data = pd.read_csv(data_path, parse_dates=["date"])

# Preview the first rows of the loaded table.
raw_data.head()


# Earliest and latest dates present in the data.
report_dates = raw_data["date"]
report_dates.min(), report_dates.max()

(Timestamp('2020-04-27 00:00:00'), Timestamp('2021-04-14 00:00:00'))


# Sanity check: list the ten largest drops in an area's case count from one
# date to the next (diff is taken within each area, in date order).
case_change = raw_data.sort_values("date").groupby("area")["cases"].diff()
raw_data.assign(delta=case_change).query("delta < 0").sort_values("delta").head(10)


# Grouping of the area labels used in the data into three buckets. The keys
# of this dict are the region names used by the rest of the analysis.
regions = {
    "south": [
        "SOUTH COUNTY UNINCORPORATED AREA includes communities of Montecito, Summerland and the City of Carpinteria",
        "CITY OF SANTA BARBARA and the unincorporated area of Mission Canyon",
        "CITY OF GOLETA",
        "COMMUNITY OF ISLA VISTA",
        "UNINCORPORATED AREA OF THE GOLETA VALLEY AND GAVIOTA",
        "SANTA YNEZ VALLEY including the Cities of Solvang & Buellton, and the communities of Santa Ynez, Los Alamos, Los Olivos and Ballard",
    ],
    "north": [
        "CITY OF LOMPOC and the communities of Mission Hills and Vandenberg Village",
        "CITY OF SANTA MARIA",
        "COMMUNITY OF ORCUTT",
        "UNINCORPORATED AREAS of Sisquoc, Casmalia, Garey, Cuyama, New Cuyama, and the City of Guadalupe",
    ],
    "other": [
        "FEDERAL PRISON IN LOMPOC",
        "People incarcerated at the Federal Prison in Lompoc",
        "Out of County",
    ],
}

# Reverse lookup: area label -> name of the region that lists it.
region_map = {
    area_label: region_name
    for region_name in regions
    for area_label in regions[region_name]
}

# Tag every row with its region, drop the "other" bucket, and total the case
# counts per region and date. Only Wednesdays are kept so that consecutive
# rows are nominally one week apart.
base_data = (
    # Look the region up from the "area" column alone rather than applying a
    # lambda to every row; an area missing from region_map still raises
    # KeyError.
    raw_data.assign(region=raw_data["area"].map(lambda area: region_map[area]))
    .query("region != 'other'")
    # Select "cases" explicitly: the first positional argument of
    # GroupBy.sum() is numeric_only, not a column name.
    .groupby(["region", "date"])[["cases"]]
    .sum()
    .query("date.dt.dayofweek == 2")  # pandas counts Monday as 0, so 2 is Wednesday
)

base_data.head()


# Change in the case total from one retained date to the next, computed
# separately within each region.
weekly_increase = base_data.sort_values("date").groupby("region")["cases"].diff()

# Attach it as "new_cases", then move index level 0 into the columns so each
# remaining index value has a single row.
base_data = base_data.assign(new_cases=weekly_increase).unstack(level=0)

base_data.head()


def legend():
    """Add the "Region" legend to the current plot.

    The labels are passed in a fixed order (north, then south), so the
    lines must have been plotted in that order for them to match.
    """
    region_labels = [
        "North county (excluding prison)",
        "South county (including SYV)",
    ]
    plt.legend(title="Region", labels=region_labels)

# Case totals over time, one line per region (north first, then south).
cumulative_ax = base_data.plot(y=[("cases", "north"), ("cases", "south")], grid=True)
cumulative_ax.set_xlabel("Date")
cumulative_ax.set_ylabel("Cumulative total cases")
legend()


# New cases over time, one line per region; rows containing NaN are dropped
# before plotting.
weekly_ax = base_data.dropna().plot(
    y=[("new_cases", "north"), ("new_cases", "south")],
    grid=True,
)
weekly_ax.set_xlabel("Date")
weekly_ax.set_ylabel("Weekly new cases")
legend()


# Trajectory plot: new cases against the running case total on log-log axes,
# one line per region, with a marker on the last data point only.
# Start from a fresh figure: plt.gca() would draw onto whichever axes is
# current, which is the previous plot when this runs outside a notebook.
fig, ax = plt.subplots()
complete_rows = base_data.dropna()  # same for both regions, so drop NaN rows once
for region in ["north", "south"]:
    complete_rows.plot(
        ax=ax,
        x=("cases", region),
        y=[("new_cases", region)],
        style="-o",
        markevery=[-1],
        loglog=True,
        grid=True,
    )
plt.xlabel("Cumulative total cases")
plt.ylabel("Weekly new cases")
legend()


# Average per-row growth factor of the north "cases" column between row 0 and
# row 12 of the date-sorted table, and the doubling time it implies.
data = base_data.sort_values("date")
column = ("cases", "north")
weeks = 12
first_total = data.iloc[0][column]
later_total = data.iloc[weeks][column]
growth_rate = (later_total / first_total) ** (1 / weeks)  # geometric mean of the step ratios
doubling_time = log(2) / log(growth_rate)  # weeks

growth_percent = int(round((growth_rate - 1) * 100))
print(f"Average growth rate each week: {growth_percent}%")
print("Doubling time in weeks:", round(doubling_time, 1))

Average growth rate each week: 22%
Doubling time in weeks: 3.4

	area	cases	date	delta
56	CITY OF SANTA MARIA	11249	2021-04-10	-61.0
2815	FEDERAL PRISON IN LOMPOC	984	2020-07-08	-10.0
3278	FEDERAL PRISON IN LOMPOC	893	2020-05-14	-3.0
513	COMMUNITY OF ORCUTT	1697	2021-03-03	-3.0
2191	FEDERAL PRISON IN LOMPOC	1024	2020-09-21	-2.0
1940	CITY OF SANTA MARIA	4089	2020-10-20	-2.0
2508	SOUTH COUNTY UNINCORPORATED AREA includes comm...	166	2020-08-12	-2.0
3411	CITY OF SANTA MARIA	139	2020-05-02	-2.0
508	UNINCORPORATED AREA OF THE GOLETA VALLEY AND G...	1111	2021-03-03	-2.0
3341	UNINCORPORATED AREA OF THE GOLETA VALLEY AND G...	15	2020-05-08	-1.0

		cases
region	date
north	2020-04-29	271
	2020-05-06	311
	2020-05-13	348
	2020-05-20	404
	2020-05-27	486

	cases		new_cases
region	north	south	north	south
date
2020-04-29	271	104	NaN	NaN
2020-05-06	311	123	40.0	19.0
2020-05-13	348	127	37.0	4.0
2020-05-20	404	139	56.0	12.0
2020-05-27	486	159	82.0	20.0

COVID in Santa Barbara County

Cumulative total cases

Weekly new cases

Trajectory

Growth rate

	area	cases	date
0	SOUTH COUNTY UNINCORPORATED AREA includes comm...	1353	2021-04-14
1	CITY OF SANTA BARBARA and the unincorporated a...	6323	2021-04-14
2	CITY OF GOLETA	1765	2021-04-14
3	COMMUNITY OF ISLA VISTA	1285	2021-04-14
4	UNINCORPORATED AREA OF THE GOLETA VALLEY AND G...	1191	2021-04-14