# First, let's import the needed libraries.
import pandas as pd
import matplotlib.pyplot as plt
import numpy as np
from datetime import datetime


# Load the monthly, daily and hourly rainfall series from their JSON exports
# and convert each date column to pandas datetimes. Values that cannot be
# parsed become NaT (errors="coerce") instead of raising.
ts_FUB_monthly = pd.read_json("../data/ts_FUB_monthly.json")
ts_FUB_monthly["Date"] = pd.to_datetime(
    ts_FUB_monthly["Date"], format="%Y-%m-%d", errors="coerce"
)

ts_FUB_daily = pd.read_json("../data/ts_FUB_daily.json")
ts_FUB_daily["MESS_DATUM"] = pd.to_datetime(
    ts_FUB_daily["MESS_DATUM"], format="%Y-%m-%d", errors="coerce"
)

ts_FUB_hourly = pd.read_json("../data/ts_FUB_hourly.json")
# The hourly timestamps include a time of day, which the date-only format
# "%Y-%m-%d" does not describe. pandas >= 2.0 applies an explicit format
# strictly, so together with errors="coerce" every hourly value would silently
# turn into NaT. Let pandas infer the format for this series instead.
ts_FUB_hourly["MESS_DATUM"] = pd.to_datetime(
    ts_FUB_hourly["MESS_DATUM"], errors="coerce"
)


# Your code here...


### DATA WRANGLING ###

### monthly time series ###
# Daily "Rain" values indexed by date, restricted to 2000-01-01 .. 2015-12-31
# (label-based slicing, both bounds inclusive).
daily_rain_2000_2015 = ts_FUB_daily.set_index("MESS_DATUM").loc[
    "2000-01-01":"2015-12-31", "Rain"
]

# Total rainfall per calendar month: group the days by their monthly period
# and add them up.
monthly_rain_2000_2015 = daily_rain_2000_2015.groupby(
    daily_rain_2000_2015.index.to_period("M")
).sum()


### PLOTTING ###

# NOTE(review): mdates is no longer used by this plot; the import is kept in
# case other parts of the file rely on it - confirm before removing.
import matplotlib.dates as mdates  ## add library for custom x axis

# Bar chart of the monthly rainfall totals, drawn on an explicitly created axes.
fig, ax = plt.subplots(figsize=(18, 6))
monthly_rain_2000_2015.plot.bar(
    ax=ax, color="blue", edgecolor="lightgrey", fontsize=16
)

# A pandas bar plot puts the bars at integer positions 0..n-1 and attaches the
# labels as a fixed list. A date locator would treat those positions as day
# numbers and pair the ticks with the wrong labels, so tick every 12th bar
# explicitly and take its label from the period index.
tick_positions = np.arange(0, len(monthly_rain_2000_2015), 12)
ax.set_xticks(tick_positions)
ax.set_xticklabels(
    monthly_rain_2000_2015.index[tick_positions].strftime("%Y-%m"), rotation=45
)

ax.set_title("Monthly rainfall at Berlin-Dahlem for the period 2000-2015", fontsize=16)
ax.set_ylabel("Rainfall", fontsize=16)

plt.show()


### DATA WRANGLING ###
### annual time series ###

# Total rainfall per calendar year: group the daily values by their yearly
# period and add them up.
yearly_rain_2000_2015 = daily_rain_2000_2015.groupby(
    daily_rain_2000_2015.index.to_period("Y")
).sum()


### PLOTTING ###

# Bar chart of the annual rainfall totals on an 18x4 inch figure.
fig, ax = plt.subplots(figsize=(18, 4))
yearly_rain_2000_2015.plot.bar(
    y="Rain", color="blue", edgecolor="lightgrey", fontsize=16, ax=ax
)

ax.set_ylabel("Rainfall", fontsize=16)
ax.set_title("Annual rainfall at Berlin-Dahlem for the period 2000-2015", fontsize=16)

plt.show()


# Use the measurement timestamp as the index of the hourly frame.
ts_FUB_hourly = ts_FUB_hourly.set_index("MESS_DATUM")
ts_FUB_hourly


# Line plot of the complete hourly record on an 18x6 inch figure.
hourly_fig, hourly_ax = plt.subplots(figsize=(18, 6))
hourly_ax.plot(ts_FUB_hourly, color="blue")

hourly_ax.set_title("Hourly rainfall data for the station Berlin-Dahlem", fontsize=16)
hourly_ax.set_ylabel("Rainfall", fontsize=16)
plt.show()


# Report the first and last calendar day covered by the hourly record.
first_day = ts_FUB_hourly.index.min().date()
last_day = ts_FUB_hourly.index.max().date()
print(f"Start Date: {first_day}, End Date: {last_day}")

Start Date: 2002-01-28, End Date: 2021-12-31


## total rainfall of every individual month (one row per year-month period)
monthly_totals = ts_FUB_hourly.groupby(ts_FUB_hourly.index.to_period("M")).sum()


## average those totals per calendar month (1-12) across all years
mean_monthly_rainfall = monthly_totals.groupby(monthly_totals.index.month).mean()
mean_monthly_rainfall


np.arange(1, 13, 1)

array([ 1,  2,  3,  4,  5,  6,  7,  8,  9, 10, 11, 12])


# Bar chart of the mean rainfall per calendar month.
# DataFrame.plot opens its own default-sized figure unless it is handed an
# axes, which would leave a separately created figure empty. Create the axes
# explicitly and pass it in so the requested 18x4 size is actually used.
fig, ax = plt.subplots(figsize=(18, 4))
mean_monthly_rainfall.plot.bar(
    y="rainfall", color="blue", edgecolor="lightgrey", ax=ax
)

# Complete the title with the years spanned by the hourly record the means
# were computed from.
first_year = ts_FUB_hourly.index.min().year
last_year = ts_FUB_hourly.index.max().year
ax.set_title(
    f"Mean monthly rainfall at Berlin-Dahlem for the period {first_year}-{last_year}"
)
ax.set_ylabel("Rainfall")
# The months run along the x axis; labelling them via set_ylabel would
# overwrite the rainfall label set just above.
ax.set_xlabel("Months")
labels = [
    "Jan",
    "Feb",
    "Mar",
    "Apr",
    "May",
    "Jun",
    "Jul",
    "Aug",
    "Sep",
    "Oct",
    "Nov",
    "Dec",
]

# One tick per bar (positions 0..11), labelled with the month abbreviations.
ax.set_xticks(np.arange(0, 12, 1), labels)


plt.show()

<Figure size 1800x400 with 0 Axes>


## Your code here...


### DATA WRANGLING ###
## Add month and time as new columns
ts_FUB_hourly_df = pd.DataFrame(
    {
        "Date": ts_FUB_hourly.index,
        "rain": ts_FUB_hourly.to_numpy().ravel(),
        "month": ts_FUB_hourly.index.month,
        "month_name": ts_FUB_hourly.index.month_name(),
        "time": ts_FUB_hourly.index.hour,
    }
).set_index("Date")

## number of distinct calendar years in the record; used below to turn the
## multi-year sums into a per-year mean (a hard-coded year count would go
## stale as soon as the covered period changes)
n_years = ts_FUB_hourly.index.year.nunique()


## group by month and time and get the sum of rain
## ("month" is part of the key so the rows stay in calendar order)

ts_FUB_hourly_df = (
    ts_FUB_hourly_df.groupby(["month", "month_name", "time"])
    .agg({"rain": "sum"})
    .reset_index()
)

## normalize to annual mean
ts_FUB_hourly_df["rain"] = ts_FUB_hourly_df["rain"] / n_years


### PLOTTING ###

import seaborn as sns

# One panel per month (4 per row), each showing the mean rainfall by hour of day.
g = sns.FacetGrid(
    ts_FUB_hourly_df, col="month_name", height=3.5, aspect=0.65, col_wrap=4
)
# Fix the category order to hours 0..23 so that bar position equals the hour in
# every panel, even if some hour were missing for a month.
g.map_dataframe(sns.barplot, x="time", y="rain", order=list(range(24)))
g.set_axis_labels("Hour of the day", "Rain (mm)")
g.set_titles(col_template="{col_name}")
# Bars are centred on the integer positions 0..23, so the x limits are padded
# by half a bar to keep the first and last bar fully visible. The y limit is
# set to 8 so that it agrees with the largest y tick.
g.set(
    xlim=(-0.5, 23.5),
    ylim=(0, 8),
    xticks=[0, 6, 12, 18, 23],
    yticks=[0, 2, 4, 6, 8],
)

<seaborn.axisgrid.FacetGrid at 0x162662abf70>

	rainfall
MESS_DATUM
2002-01-28 11:00:00	0.0
2002-01-28 13:00:00	0.0
2002-01-28 15:00:00	1.7
2002-01-28 18:00:00	1.1
2002-01-28 21:00:00	0.0
...	...
2021-12-31 19:00:00	0.7
2021-12-31 20:00:00	0.7
2021-12-31 21:00:00	0.1
2021-12-31 22:00:00	0.1
2021-12-31 23:00:00	0.0

	rainfall
MESS_DATUM
1	48.165
2	31.955
3	35.805
4	25.455
5	53.425
6	58.540
7	83.295
8	62.295
9	42.060
10	47.830
11	43.715
12	41.075

Split-Apply-Combine