import pandas as pd

def data_url(city_name):
    """Return the URL of the CSV data file for ``city_name``.

    The result is the course data directory, followed by ``city_name``
    exactly as given (no escaping is applied), followed by ``.csv``.
    """
    pieces = (
        "https://facultyweb.cs.wwu.edu/~wehrwes/courses/csci141_21s/fp/data/",
        city_name,
        ".csv",
    )
    return "".join(pieces)

# Load the WA_Bellingham CSV. DATE is parsed into datetimes so the frame can
# be resampled on that column; low_memory=False has pandas read the file in
# one pass rather than in chunks.
bham = pd.read_csv(data_url("WA_Bellingham"), parse_dates=["DATE"], low_memory=False)


# Group the hourly relative humidity readings by month ("MS" = month-start
# frequency, keyed on the DATE column). This is only the grouping; aggregates
# such as max and mean are computed from it separately.
hourly_humidity_permonth = bham.resample("MS", on="DATE")["HourlyRelativeHumidity"]
hourly_humidity_permonth

<pandas.core.groupby.generic.SeriesGroupBy object at 0x16c45e190>


# Largest hourly relative humidity reading within each month.
hourly_humidity_permonth.max()

DATE
2020-01-01    100.0
2020-02-01    100.0
2020-03-01    100.0
2020-04-01     94.0
2020-05-01     94.0
2020-06-01     94.0
2020-07-01     94.0
2020-08-01     97.0
2020-09-01    100.0
2020-10-01    100.0
2020-11-01     97.0
2020-12-01    100.0
Freq: MS, Name: HourlyRelativeHumidity, dtype: float64


# Average hourly relative humidity reading within each month.
hourly_humidity_permonth.mean()

DATE
2020-01-01    76.605477
2020-02-01    79.876310
2020-03-01    70.918979
2020-04-01    65.603015
2020-05-01    69.106618
2020-06-01    73.459698
2020-07-01    72.490196
2020-08-01    72.806373
2020-09-01    81.267051
2020-10-01    82.047081
2020-11-01    79.328092
2020-12-01    89.361538
Freq: MS, Name: HourlyRelativeHumidity, dtype: float64


# Per-month summary statistics: count, mean, std, min, quartiles, and max.
hourly_humidity_permonth.describe()


import seaborn as sns
import matplotlib.pyplot as plt

# Draw one histogram per month: iterating the resampled object yields
# (month-start timestamp, that month's readings) pairs.
for month, data in hourly_humidity_permonth:
    # Bin edges run from 0 to 100 in steps of 10; the title is the month's name.
    sns.histplot(data, bins=range(0, 110, 10)).set(title=month.month_name())
    # Show the figure now so each month gets its own plot.
    plt.show()


def humidity_plots(df):
    """Show one histogram of ``HourlyRelativeHumidity`` per month of ``df``.

    ``df`` is resampled on its ``DATE`` column at month-start ("MS")
    frequency. Each monthly group is drawn with bin edges from 0 to 100 in
    steps of 10, titled with the month's name, and displayed before the
    next month is drawn.
    """
    bin_edges = range(0, 110, 10)
    monthly = df.resample("MS", on="DATE")["HourlyRelativeHumidity"]

    for period_start, readings in monthly:
        axes = sns.histplot(readings, bins=bin_edges)
        axes.set(title=period_start.month_name())
        plt.show()


# Load the AZ_Phoenix CSV the same way: DATE parsed into datetimes, and the
# file read in one pass (low_memory=False).
phoenix = pd.read_csv(data_url("AZ_Phoenix"), low_memory=False, parse_dates=["DATE"])


# Plot the per-month humidity histograms for the Phoenix data.
humidity_plots(phoenix)

	count	mean	std	min	25%	50%	75%	max
DATE
2020-01-01	986.0	76.605477	10.910598	27.0	70.00	79.0	85.0	100.0
2020-02-01	954.0	79.876310	11.092164	39.0	73.00	82.0	89.0	100.0
2020-03-01	901.0	70.918979	17.570527	22.0	61.00	75.0	85.0	100.0
2020-04-01	796.0	65.603015	16.913935	16.0	55.75	68.0	79.0	94.0
2020-05-01	816.0	69.106618	15.069562	28.0	58.00	72.0	80.0	94.0
2020-06-01	794.0	73.459698	11.880193	43.0	65.00	75.0	83.0	94.0
2020-07-01	816.0	72.490196	13.332921	34.0	63.00	75.0	84.0	94.0
2020-08-01	816.0	72.806373	13.934968	27.0	61.00	75.0	84.0	97.0
2020-09-01	1041.0	81.267051	14.993581	18.0	75.00	87.0	93.0	100.0
2020-10-01	1062.0	82.047081	12.306165	37.0	75.25	86.0	92.0	100.0
2020-11-01	954.0	79.328092	12.254657	25.0	74.00	82.5	89.0	97.0
2020-12-01	1040.0	89.361538	9.785872	44.0	85.00	90.0	97.0	100.0

Resample (and some other cool stuff) demo!