# This is a comment, it starts with a hash sign

# Import pandas
import pandas as pd

# DO NOT MODIFY THIS TEST CELL
points = 0
try:
    pd.DataFrame()
    points += 5
    print('\u2705 Great work! You correctly imported the pandas library.')
except:
    print('\u274C Oops - pandas was not imported correctly.')
print('You earned {} of 5 points for importing pandas'.format(points))

✅ Great work! You correctly imported the pandas library.
You earned 5 of 5 points for importing pandas

# Request API endpoint
boulder_url = ('https://www.ncei.noaa.gov/access/services/data/v1?'
               'dataset=daily-summaries'
               '&dataTypes=TOBS,PRCP'
               '&stations=USC00050848'
               '&startDate=1893-10-01'
               '&endDate=2024-02-18'
               '&includeStationName=true'
               '&includeStationLocation=1'
               '&units=standard')
boulder_url

'https://www.ncei.noaa.gov/access/services/data/v1?dataset=daily-summaries&dataTypes=TOBS,PRCP&stations=USC00050848&startDate=1893-10-01&endDate=2024-02-18&includeStationName=true&includeStationLocation=1&units=standard'

# DO NOT MODIFY THIS TEST CELL
resp_url = _
points = 0

if type(resp_url)==str:
    points += 3
    print('\u2705 Great work! You correctly called your url variable.')
else:
    print('\u274C Oops - your url variable was not called correctly.')

if len(resp_url)==218:
    points += 3
    print('\u2705 Great work! Your url is the correct length.')
else:
    print('\u274C Oops - your url variable is not the correct length.')

print('You earned {} of 6 points for defining a url variable'.format(points))

✅ Great work! You correctly called your url variable.
✅ Great work! Your url is the correct length.
You earned 6 of 6 points for defining a url variable

boulder_df = pd.read_csv(
  boulder_url,
  index_col='DATE',
  parse_dates=True,
  na_values=['NaN'])
boulder_df

# DO NOT MODIFY THIS TEST CELL
tmax_df_resp = _
points = 0

if isinstance(tmax_df_resp, pd.DataFrame):
    points += 2
    print('\u2705 Great work! You called a DataFrame.')
else:
    print('\u274C Oops - make sure to call your DataFrame for testing.')

print('You earned {} of 2 points for downloading data'.format(points))

✅ Great work! You called a DataFrame.
You earned 2 of 2 points for downloading data

# Check that the data was imported into a pandas DataFrame
type(boulder_df)

pandas.core.frame.DataFrame

# Cleaning up the data frame
boulder_df = boulder_df[['PRCP','TOBS']]
boulder_df

# DO NOT MODIFY THIS TEST CELL
tmax_df_resp = _
points = 0

summary = [round(val, 2) for val in tmax_df_resp.mean().values]
if summary == [0.05, 54.53]:
    points += 5
    print('\u2705 Great work! You correctly downloaded data.')
else:
    print('\u274C Oops - your data are not correct.')
print('You earned {} of 5 points for downloading data'.format(points))

✅ Great work! You correctly downloaded data.
You earned 5 of 5 points for downloading data

boulder_df.plot()

<Axes: xlabel='DATE'>

# Plot the data using .plot
boulder_df.plot(
    y='TOBS',
    title='Temperature (F) at Boulder, CO\n1893-2024',
    xlabel='Year',
    ylabel='Temperature (F)',
    legend=False,
    figsize=(10,6))

<Axes: title={'center': 'Temperature (F) at Boulder, CO\n1893-2024'}, xlabel='Year', ylabel='Temperature (F)'>

# Convert to celcius
boulder_df['TCel'] = (boulder_df['TOBS'] - 32) * 5 / 9
boulder_df

/tmp/ipykernel_9647/860760448.py:2: SettingWithCopyWarning: 
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  boulder_df['TCel'] = (boulder_df['TOBS'] - 32) * 5 / 9

# DO NOT MODIFY THIS TEST CELL
tmax_df_resp = _
points = 0

if isinstance(tmax_df_resp, pd.DataFrame):
    points += 1
    print('\u2705 Great work! You called a DataFrame.')
else:
    print('\u274C Oops - make sure to call your DataFrame for testing.')

summary = [round(val, 2) for val in tmax_df_resp.mean().values]
if summary == [0.05, 54.53, 12.52]:
    points += 4
    print('\u2705 Great work! You correctly converted to Celcius.')
else:
    print('\u274C Oops - your data are not correct.')
print('You earned {} of 5 points for converting to Celcius'.format(points))

✅ Great work! You called a DataFrame.
✅ Great work! You correctly converted to Celcius.
You earned 5 of 5 points for converting to Celcius

# Write a function to convert Fahrenheit to Celsius
def fah_to_cel(fah):
    """Convert temperature to Celcius"""
    return (fah-32)*5/9 # Put your equation in here

boulder_df['celcius_column'] = boulder_df['TOBS'].apply(fah_to_cel)
boulder_df

/tmp/ipykernel_9647/2628125120.py:6: SettingWithCopyWarning: 
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  boulder_df['celcius_column'] = boulder_df['TOBS'].apply(fah_to_cel)

# Subset the data 1983 - 2023
boulder_1983_2023 = boulder_df['1983':'2023']
boulder_1983_2023

# DO NOT MODIFY THIS TEST CELL
df_resp = _
points = 0

if isinstance(df_resp, pd.DataFrame):
    points += 1
    print('\u2705 Great work! You called a DataFrame.')
else:
    print('\u274C Oops - make sure to call your DataFrame for testing.')

summary = [round(val, 2) for val in df_resp.mean().values]
if summary == [0.06, 55.67, 13.15]:
    points += 5
    print('\u2705 Great work! You correctly converted to Celcius.')
else:
    print('\u274C Oops - your data are not correct.')
print('You earned {} of 5 points for subsetting'.format(points))

✅ Great work! You called a DataFrame.
❌ Oops - your data are not correct.
You earned 1 of 5 points for subsetting

# Resample the data to look at yearly mean values
boulder_yearly_mean = boulder_1983_2023.resample('Y').mean()
boulder_yearly_mean

/tmp/ipykernel_9647/2796985930.py:2: FutureWarning: 'Y' is deprecated and will be removed in a future version, please use 'YE' instead.
  boulder_yearly_mean = boulder_1983_2023.resample('Y').mean()

# DO NOT MODIFY THIS TEST CELL
df_resp = _
points = 0

if isinstance(df_resp, pd.DataFrame):
    points += 1
    print('\u2705 Great work! You called a DataFrame.')
else:
    print('\u274C Oops - make sure to call your DataFrame for testing.')

summary = [round(val, 2) for val in df_resp.mean().values]
if summary == [0.06, 55.37, 12.99]:
    points += 5
    print('\u2705 Great work! You correctly converted to Celcius.')
else:
    print('\u274C Oops - your data are not correct.')
print('You earned {} of 5 points for resampling'.format(points))

✅ Great work! You called a DataFrame.
❌ Oops - your data are not correct.
You earned 1 of 5 points for resampling

# Plot mean annual temperature values
boulder_yearly_mean.plot(y='TOBS')

<Axes: xlabel='DATE'>

boulder_df_reset = boulder_yearly_mean.reset_index()
boulder_df_reset

boulder_df_reset['year'] = boulder_df_reset['DATE'].dt.year
boulder_df_reset

boulder_df_reset.set_index('year', inplace=True)
boulder_df_reset

# Using ChatGPT to help add a trendline to the plot

import matplotlib.pyplot as plt
import matplotlib.dates as mdates
import numpy as np

fig, ax = plt.subplots(figsize=(5,3))

x_values = boulder_df_reset.index


ax.scatter(x_values,
           boulder_df_reset["TCel"],
           label="Temperature Data",
           color='white',
           edgecolor='black')

# Fit a linear regression model
slope, intercept = np.polyfit(x_values, boulder_df_reset["TCel"], 1)
trendline = slope * x_values + intercept

ax.plot(x_values, trendline, color='red', label="Trendline")
ax.plot(x_values, boulder_df_reset["TCel"], color='grey', markersize=0.3)


# Add text box with slope value (From ChatGPT)
slope_text = f"Slope: {slope:.3f} °C/yr"
ax.text(0.5, 0.6, slope_text, transform=ax.transAxes, fontsize=10,
        verticalalignment='top', bbox=dict(boxstyle='round', facecolor='whitesmoke', alpha=0.9))



ax.set(title="Mean Annual Temperature\nBoulder, CO (1983-2023)",
       ylabel="Temperature (°C)")

ax.legend()  # Add legend to display labels

plt.show()

# Create interactive map using folium
import folium

# Weather station info
station_lat = 39.99282
station_long = -105.26683
station_location_name = 'NOAA Weather Station [GHCND:USC00050848] - Boulder, CO'

# Create a Folium map object
m = folium.Map(location=[station_lat,station_long], zoom_start=10)

# Add marker for river gage
folium.Marker(
    location=[station_lat, station_long],
    popup=station_location_name,
    icon=folium.Icon(color='black')
).add_to(m)


# Save the map as an HTML file or display it inline
m.save('map.html')
# OR
m

%%capture
%%bash
jupyter nbconvert *.ipynb --to html

	STATION	NAME	LATITUDE	LONGITUDE	ELEVATION	PRCP	TOBS
DATE
1893-10-01	USC00050848	BOULDER, CO US	39.99282	-105.26683	1673.0	0.94	NaN
1893-10-02	USC00050848	BOULDER, CO US	39.99282	-105.26683	1673.0	0.00	NaN
1893-10-03	USC00050848	BOULDER, CO US	39.99282	-105.26683	1673.0	0.00	NaN
1893-10-04	USC00050848	BOULDER, CO US	39.99282	-105.26683	1673.0	0.04	NaN
1893-10-05	USC00050848	BOULDER, CO US	39.99282	-105.26683	1673.0	0.00	NaN
...	...	...	...	...	...	...	...
2024-02-14	USC00050848	BOULDER, CO US	39.99282	-105.26683	1673.0	0.00	41.0
2024-02-15	USC00050848	BOULDER, CO US	39.99282	-105.26683	1673.0	0.00	39.0
2024-02-16	USC00050848	BOULDER, CO US	39.99282	-105.26683	1673.0	0.20	23.0
2024-02-17	USC00050848	BOULDER, CO US	39.99282	-105.26683	1673.0	0.22	23.0
2024-02-18	USC00050848	BOULDER, CO US	39.99282	-105.26683	1673.0	0.00	42.0

	PRCP	TOBS
DATE
1893-10-01	0.94	NaN
1893-10-02	0.00	NaN
1893-10-03	0.00	NaN
1893-10-04	0.04	NaN
1893-10-05	0.00	NaN
...	...	...
2024-02-14	0.00	41.0
2024-02-15	0.00	39.0
2024-02-16	0.20	23.0
2024-02-17	0.22	23.0
2024-02-18	0.00	42.0

	PRCP	TOBS	TCel
DATE
1893-10-01	0.94	NaN	NaN
1893-10-02	0.00	NaN	NaN
1893-10-03	0.00	NaN	NaN
1893-10-04	0.04	NaN	NaN
1893-10-05	0.00	NaN	NaN
...	...	...	...
2024-02-14	0.00	41.0	5.000000
2024-02-15	0.00	39.0	3.888889
2024-02-16	0.20	23.0	-5.000000
2024-02-17	0.22	23.0	-5.000000
2024-02-18	0.00	42.0	5.555556

	PRCP	TOBS	TCel	celcius_column
DATE
1893-10-01	0.94	NaN	NaN	NaN
1893-10-02	0.00	NaN	NaN	NaN
1893-10-03	0.00	NaN	NaN	NaN
1893-10-04	0.04	NaN	NaN	NaN
1893-10-05	0.00	NaN	NaN	NaN
...	...	...	...	...
2024-02-14	0.00	41.0	5.000000	5.000000
2024-02-15	0.00	39.0	3.888889	3.888889
2024-02-16	0.20	23.0	-5.000000	-5.000000
2024-02-17	0.22	23.0	-5.000000	-5.000000
2024-02-18	0.00	42.0	5.555556	5.555556

	PRCP	TOBS	TCel	celcius_column
DATE
1983-12-31	0.068588	53.319749	11.844305	11.844305
1984-12-31	0.050656	50.601093	10.333940	10.333940
1985-12-31	0.047781	52.354571	11.308095	11.308095
1986-12-31	0.058493	55.616438	13.120244	13.120244
1987-12-31	0.070740	54.205479	12.336377	12.336377
1988-12-31	0.046311	54.650273	12.583485	12.583485
1989-12-31	0.058585	55.400943	13.000524	13.000524
1990-12-31	0.053782	59.463504	15.257502	15.257502
1991-12-31	0.058000	54.498623	12.499235	12.499235
1992-12-31	0.047486	54.556164	12.531202	12.531202
1993-12-31	0.062365	50.829341	10.460745	10.460745
1994-12-31	0.046000	38.715789	3.730994	3.730994
1995-12-31	0.080630	54.792818	12.662676	12.662676
1996-12-31	0.059235	55.233516	12.907509	12.907509
1997-12-31	0.078055	54.274725	12.374847	12.374847
1998-12-31	0.061068	55.931507	13.295282	13.295282
1999-12-31	0.071099	56.079452	13.377473	13.377473
2000-12-31	0.043434	56.719780	13.733211	13.733211
2001-12-31	0.049863	56.457534	13.587519	13.587519
2002-12-31	0.038027	56.638356	13.687976	13.687976
2003-12-31	0.060329	57.230137	14.016743	14.016743
2004-12-31	0.074235	55.420765	13.011536	13.011536
2005-12-31	0.047726	56.871233	13.817352	13.817352
2006-12-31	0.052904	57.772603	14.318113	14.318113
2007-12-31	0.047205	56.616438	13.675799	13.675799
2008-12-31	0.046503	56.175342	13.430746	13.430746
2009-12-31	0.057216	54.212575	12.340319	12.340319
2010-12-31	0.055644	55.854795	13.252664	13.252664
2011-12-31	0.061068	55.975275	13.319597	13.319597
2012-12-31	0.042760	59.857534	15.476408	15.476408
2013-12-31	0.093562	55.454795	13.030441	13.030441
2014-12-31	0.064575	55.367123	12.981735	12.981735
2015-12-31	0.073753	56.710744	13.728191	13.728191
2016-12-31	0.047131	57.836066	14.353370	14.353370
2017-12-31	0.061617	60.129129	15.627294	15.627294
2018-12-31	0.052740	57.005479	13.891933	13.891933
2019-12-31	0.057644	54.426997	12.459443	12.459443
2020-12-31	0.046721	57.691460	14.273033	14.273033
2021-12-31	0.056658	57.538462	14.188034	14.188034
2022-12-31	0.051479	56.139726	13.410959	13.410959
2023-12-31	0.062740	55.694215	13.163453	13.163453

Get started with open reproducible science! (API version)¶

It’s another ESIIL Earth Data Science Workflow¶

Don’t get caught by these interactive coding notebook gotchas¶

Run your code in the right environment to avoid import errors¶

Always run your code start to finish before submitting¶

Check your code to make sure it’s clean and easy to read¶

Label and describe your plots¶

Get started with open reproducible science!¶

Human-readable and Machine-readable¶

Readable, well-documented scientific workflows are easier to reproduce¶

What the fork?! Who wrote this?¶

Python packages let you use code written by experts around the world¶

There are more Earth Observation data online than any one person could ever look at¶

You can access NCEI GHCNd Data from the internet using its API 🖥️ 📡 🖥️¶

Download and get started working with NCEI data¶

Plot the precpitation column (PRCP) vs time to explore the data¶

Subsetting and Resampling¶

Now we are ready to calculate annual statistics¶

YOUR BOULDER PLOT HEADLINE HERE 📰 🗞️ 📻¶

THIS ISN’T THE END! 😄¶

Your turn: pick a new location and/or measurement to plot 🌏 📈¶

Congratulations, you’re almost done with this coding challenge 🤩 – now make sure that your code is reproducible¶

BONUS: Create a shareable Markdown of your work¶

	PRCP	TOBS	TCel	celcius_column
DATE
1983-01-01	0.0	NaN	NaN	NaN
1983-01-02	0.0	NaN	NaN	NaN
1983-01-03	0.0	NaN	NaN	NaN
1983-01-04	0.0	NaN	NaN	NaN
1983-01-05	0.0	NaN	NaN	NaN
...	...	...	...	...
2023-12-27	0.0	41.0	5.000000	5.000000
2023-12-28	0.0	NaN	NaN	NaN
2023-12-29	0.0	39.0	3.888889	3.888889
2023-12-30	0.0	38.0	3.333333	3.333333
2023-12-31	0.0	33.0	0.555556	0.555556

	DATE	PRCP	TOBS	TCel	celcius_column
year
1983	1983-12-31	0.068588	53.319749	11.844305	11.844305
1984	1984-12-31	0.050656	50.601093	10.333940	10.333940
1985	1985-12-31	0.047781	52.354571	11.308095	11.308095
1986	1986-12-31	0.058493	55.616438	13.120244	13.120244
1987	1987-12-31	0.070740	54.205479	12.336377	12.336377
1988	1988-12-31	0.046311	54.650273	12.583485	12.583485
1989	1989-12-31	0.058585	55.400943	13.000524	13.000524
1990	1990-12-31	0.053782	59.463504	15.257502	15.257502
1991	1991-12-31	0.058000	54.498623	12.499235	12.499235
1992	1992-12-31	0.047486	54.556164	12.531202	12.531202
1993	1993-12-31	0.062365	50.829341	10.460745	10.460745
1994	1994-12-31	0.046000	38.715789	3.730994	3.730994
1995	1995-12-31	0.080630	54.792818	12.662676	12.662676
1996	1996-12-31	0.059235	55.233516	12.907509	12.907509
1997	1997-12-31	0.078055	54.274725	12.374847	12.374847
1998	1998-12-31	0.061068	55.931507	13.295282	13.295282
1999	1999-12-31	0.071099	56.079452	13.377473	13.377473
2000	2000-12-31	0.043434	56.719780	13.733211	13.733211
2001	2001-12-31	0.049863	56.457534	13.587519	13.587519
2002	2002-12-31	0.038027	56.638356	13.687976	13.687976
2003	2003-12-31	0.060329	57.230137	14.016743	14.016743
2004	2004-12-31	0.074235	55.420765	13.011536	13.011536
2005	2005-12-31	0.047726	56.871233	13.817352	13.817352
2006	2006-12-31	0.052904	57.772603	14.318113	14.318113
2007	2007-12-31	0.047205	56.616438	13.675799	13.675799
2008	2008-12-31	0.046503	56.175342	13.430746	13.430746
2009	2009-12-31	0.057216	54.212575	12.340319	12.340319
2010	2010-12-31	0.055644	55.854795	13.252664	13.252664
2011	2011-12-31	0.061068	55.975275	13.319597	13.319597
2012	2012-12-31	0.042760	59.857534	15.476408	15.476408
2013	2013-12-31	0.093562	55.454795	13.030441	13.030441
2014	2014-12-31	0.064575	55.367123	12.981735	12.981735
2015	2015-12-31	0.073753	56.710744	13.728191	13.728191
2016	2016-12-31	0.047131	57.836066	14.353370	14.353370
2017	2017-12-31	0.061617	60.129129	15.627294	15.627294
2018	2018-12-31	0.052740	57.005479	13.891933	13.891933
2019	2019-12-31	0.057644	54.426997	12.459443	12.459443
2020	2020-12-31	0.046721	57.691460	14.273033	14.273033
2021	2021-12-31	0.056658	57.538462	14.188034	14.188034
2022	2022-12-31	0.051479	56.139726	13.410959	13.410959
2023	2023-12-31	0.062740	55.694215	13.163453	13.163453