# Import pandas
import pandas as pd

# DO NOT MODIFY THIS TEST CELL
points = 0
try:
    pd.DataFrame()
    points += 5
    print('\u2705 Great work! You correctly imported the pandas library.')
except:
    print('\u274C Oops - pandas was not imported correctly.')
print('You earned {} of 5 points for importing pandas'.format(points))

✅ Great work! You correctly imported the pandas library.
You earned 5 of 5 points for importing pandas

# Build the NCEI daily-summaries request for Rapid City, SD
# (station USC00396947), asking for the TOBS and PRCP data types.
rapidcityurl = ''.join([
    'https://www.ncei.noaa.gov/access/services/data/v1?',
    'dataset=daily-summaries',
    '&dataTypes=TOBS,PRCP',
    '&stations=USC00396947',
    '&startDate=1949-10-01',
    '&endDate=2024-05-03',
    '&includeStationName=true',
    '&includeStationLocation=1',
    '&units=standard',
])
rapidcityurl

'https://www.ncei.noaa.gov/access/services/data/v1?dataset=daily-summaries&dataTypes=TOBS,PRCP&stations=USC00396947&startDate=1949-10-01&endDate=2024-05-03&includeStationName=true&includeStationLocation=1&units=standard'

# DO NOT MODIFY THIS TEST CELL
resp_url = _
points = 0

if type(resp_url)==str:
    points += 3
    print('\u2705 Great work! You correctly called your url variable.')
else:
    print('\u274C Oops - your url variable was not called correctly.')

if len(resp_url)==218:
    points += 3
    print('\u2705 Great work! Your url is the correct length.')
else:
    print('\u274C Oops - your url variable is not the correct length.')

print('You earned {} of 6 points for defining a url variable'.format(points))

✅ Great work! You correctly called your url variable.
✅ Great work! Your url is the correct length.
You earned 6 of 6 points for defining a url variable

# Download the Rapid City records as CSV and load them into a DataFrame,
# using the parsed DATE column as the index.
rapidcity_df = pd.read_csv(
    rapidcityurl,
    na_values=['NaN'],
    parse_dates=True,
    index_col='DATE',
)
rapidcity_df

# DO NOT MODIFY THIS TEST CELL
tmax_df_resp = _
points = 0

if isinstance(tmax_df_resp, pd.DataFrame):
    points += 1
    print('\u2705 Great work! You called a DataFrame.')
else:
    print('\u274C Oops - make sure to call your DataFrame for testing.')

print('You earned {} of 2 points for downloading data'.format(points))

✅ Great work! You called a DataFrame.
You earned 1 of 2 points for downloading data

# Check that the data was imported into a pandas DataFrame
type(rapidcity_df)

pandas.core.frame.DataFrame

# Checking column names to know all columns in data
rapidcity_df.columns

Index(['STATION', 'NAME', 'LATITUDE', 'LONGITUDE', 'ELEVATION', 'PRCP',
       'TOBS'],
      dtype='object')

# Keep only the precipitation (PRCP) and observed temperature (TOBS) columns.
# .copy() makes the result an independent DataFrame, so adding columns to it
# later does not trigger pandas' SettingWithCopyWarning.
rapidcity_df = rapidcity_df[['PRCP', 'TOBS']].copy()
rapidcity_df

# DO NOT MODIFY THIS TEST CELL
tmax_df_resp = _
points = 0

summary = [round(val, 2) for val in tmax_df_resp.mean().values]
if summary == [0.05, 54.53]:
    points += 4
    print('\u2705 Great work! You correctly downloaded data.')
else:
    print('\u274C Oops - your data are not correct.')
print('You earned {} of 5 points for downloading data'.format(points))

❌ Oops - your data are not correct.
You earned 0 of 5 points for downloading data

# Plotting Rapid City PRCP and TOBS 
rapidcity_df.plot()

<Axes: xlabel='DATE'>

# Plot the daily observed temperature for Rapid City. The requested record
# starts on 1949-10-01, so the title covers 1949-2024.
rapidcity_df.plot(
    y='TOBS',
    title='Rapid City Daily Observed Temperature 1949-2024',
    xlabel='Date',
    ylabel='Temperature (F)',
    legend=False,
    color='blue',
    figsize=(10,5),
    fontsize=14)

<Axes: title={'center': 'Rapid City Daily Observed Temperature 1944-2024'}, xlabel='Date', ylabel='Temperature (F)'>

# Convert the observed temperature (TOBS, in Fahrenheit) to Celsius and
# store the result in a new TCel column.
rapidcity_df.loc[:,'TCel'] = (rapidcity_df['TOBS'] - 32) * 5 / 9
rapidcity_df

/tmp/ipykernel_6497/1789627478.py:2: SettingWithCopyWarning: 
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  rapidcity_df.loc[:,'TCel'] = (rapidcity_df['TOBS'] - 32) * 5 / 9

# DO NOT MODIFY THIS TEST CELL
tmax_df_resp = _
points = 0

if isinstance(tmax_df_resp, pd.DataFrame):
    points += 1
    print('\u2705 Great work! You called a DataFrame.')
else:
    print('\u274C Oops - make sure to call your DataFrame for testing.')

summary = [round(val, 2) for val in tmax_df_resp.mean().values]
if summary == [0.05, 54.53, 12.52]:
    points += 4
    print('\u2705 Great work! You correctly converted to Celcius.')
else:
    print('\u274C Oops - your data are not correct.')
print('You earned {} of 5 points for converting to Celcius'.format(points))

✅ Great work! You called a DataFrame.
❌ Oops - your data are not correct.
You earned 1 of 5 points for converting to Celcius

# Helper that converts Fahrenheit temperatures to Celsius
def to_celsius(fahrenheit):
    """Return the Celsius equivalent of a Fahrenheit temperature.

    Subtracts the 32-degree offset, then scales by 5/9.
    """
    offset_from_freezing = fahrenheit - 32
    return offset_from_freezing * 5 / 9

# Add a celsius column by applying to_celsius to each TOBS value, then
# display the DataFrame with the new column.
rapidcity_df['celsius'] = rapidcity_df['TOBS'].apply(to_celsius)
rapidcity_df

/tmp/ipykernel_6497/2859914288.py:7: SettingWithCopyWarning: 
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  rapidcity_df['celsius'] = rapidcity_df['TOBS'].apply(to_celsius)

# Subset the data to the rows dated from 1983 through 2023 (selected by
# label on the DATE index).
rapidcitysubset = rapidcity_df.loc['1983':'2023']
rapidcitysubset

# DO NOT MODIFY THIS TEST CELL
df_resp = _
points = 0

if isinstance(df_resp, pd.DataFrame):
    points += 1
    print('\u2705 Great work! You called a DataFrame.')
else:
    print('\u274C Oops - make sure to call your DataFrame for testing.')

summary = [round(val, 2) for val in df_resp.mean().values]
if summary == [0.06, 55.67, 13.15]:
    points += 5
    print('\u2705 Great work! You correctly converted to Celcius.')
else:
    print('\u274C Oops - your data are not correct.')
print('You earned {} of 5 points for subsetting'.format(points))

✅ Great work! You called a DataFrame.
❌ Oops - your data are not correct.
You earned 1 of 5 points for subsetting

# Resample the subset to yearly means; each row of the result is labelled
# with the last day of its year.
# NOTE(review): the 'YE' alias presumably requires a recent pandas release
# (older releases spell it 'Y') - confirm against the environment.
rapidyearly = rapidcitysubset.resample('YE').mean()
rapidyearly

# DO NOT MODIFY THIS TEST CELL
df_resp = _
points = 0

if isinstance(df_resp, pd.DataFrame):
    points += 1
    print('\u2705 Great work! You called a DataFrame.')
else:
    print('\u274C Oops - make sure to call your DataFrame for testing.')

summary = [round(val, 2) for val in df_resp.mean().values]
if summary == [0.06, 55.37, 12.99]:
    points += 5
    print('\u2705 Great work! You correctly converted to Celcius.')
else:
    print('\u274C Oops - your data are not correct.')
print('You earned {} of 5 points for resampling'.format(points))

✅ Great work! You called a DataFrame.
❌ Oops - your data are not correct.
You earned 1 of 5 points for resampling

# Line chart of Rapid City's yearly mean observed temperature, 1983-2023
rapidyearly.plot(
    y='TOBS',
    figsize=(10,5),
    fontsize=14,
    color='blue',
    legend=False,
    xlabel='Year',
    ylabel='Temperature (F)',
    title='Rapid City Annual Mean Temperatures 1983-2023',
)

<Axes: title={'center': 'Rapid City Annual Mean Temperatures 1983-2023'}, xlabel='Year', ylabel='Temperature (F)'>

# Repeat the analysis for the Paradise Ranger Station at Mount Rainier, WA.
# Station listing: USC00456898  46.7858 -121.7425 1654.1 WA RAINIER PARADISE RS
rainierurl = ''.join([
    'https://www.ncei.noaa.gov/access/services/data/v1?',
    'dataset=daily-summaries',
    '&dataTypes=TOBS,PRCP',
    '&stations=USC00456898',
    '&startDate=1916-12-01',
    '&endDate=2024-05-12',
    '&includeStationName=true',
    '&includeStationLocation=1',
    '&units=standard',
])
rainierurl

'https://www.ncei.noaa.gov/access/services/data/v1?dataset=daily-summaries&dataTypes=TOBS,PRCP&stations=USC00456898&startDate=1916-12-01&endDate=2024-05-12&includeStationName=true&includeStationLocation=1&units=standard'

# Download the Rainier Paradise records as CSV and load them into a
# DataFrame, using the parsed DATE column as the index.
rainier_df = pd.read_csv(
    rainierurl,
    na_values=['NaN'],
    parse_dates=True,
    index_col='DATE',
)
rainier_df

# Keep only the precipitation (PRCP) and observed temperature (TOBS) columns.
# .copy() makes the result an independent DataFrame, so adding columns to it
# later does not trigger pandas' SettingWithCopyWarning.
rainier_df = rainier_df[['PRCP', 'TOBS']].copy()
rainier_df

# Plot the daily observed temperature at the Rainier Paradise Ranger Station.
# The title no longer carries the stray "City" left over from the Rapid City
# plot.
rainier_df.plot(
    y='TOBS',
    title='Rainier Paradise Ranger Station Daily Observed Temperature 1916-2024',
    xlabel='Date',
    ylabel='Temperature (F)',
    legend=False,
    color='blue',
    figsize=(10,5),
    fontsize=14)

<Axes: title={'center': 'Rainier Paradise Ranger Station City Daily Observed Temperature 1916-2024'}, xlabel='Date', ylabel='Temperature (F)'>

# Convert the observed temperature (TOBS, in Fahrenheit) to Celsius and
# store the result in a new TCel column.
rainier_df.loc[:,'TCel'] = (rainier_df['TOBS'] - 32) * 5 / 9
rainier_df

/tmp/ipykernel_6497/1784484435.py:2: SettingWithCopyWarning: 
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  rainier_df.loc[:,'TCel'] = (rainier_df['TOBS'] - 32) * 5 / 9

# Subset the Rainier data to the rows dated from 1980 through 2023
# (selected by label on the DATE index).
rainiersubset = rainier_df.loc['1980':'2023']
rainiersubset

# Resample the subset to yearly means; each row of the result is labelled
# with the last day of its year.
# NOTE(review): the 'YE' alias presumably requires a recent pandas release
# (older releases spell it 'Y') - confirm against the environment.
rainieryearly = rainiersubset.resample('YE').mean()
rainieryearly

# Line chart of the Rainier Paradise yearly mean observed temperature,
# 1980-2023
rainieryearly.plot(
    y='TOBS',
    figsize=(10,5),
    fontsize=14,
    color='blue',
    legend=False,
    xlabel='Year',
    ylabel='Temperature (F)',
    title='Rainier Paradise Ranger Station Annual Mean Temperatures 1980-2023',
)

<Axes: title={'center': 'Rainier Paradise Ranger Station Annual Mean Temperatures 1980-2023'}, xlabel='Year', ylabel='Temperature (F)'>

%%capture
%%bash
jupyter nbconvert *.ipynb --to markdown

%%capture
%%bash
jupyter nbconvert *.ipynb --to html

	STATION	NAME	LATITUDE	LONGITUDE	ELEVATION	PRCP	TOBS
DATE
1949-10-01	USC00396947	RAPID CITY 4 NW, SD US	44.12055	-103.28417	1060.4	0.00	51.0
1949-10-02	USC00396947	RAPID CITY 4 NW, SD US	44.12055	-103.28417	1060.4	0.00	51.0
1949-10-03	USC00396947	RAPID CITY 4 NW, SD US	44.12055	-103.28417	1060.4	0.00	52.0
1949-10-04	USC00396947	RAPID CITY 4 NW, SD US	44.12055	-103.28417	1060.4	0.00	45.0
1949-10-05	USC00396947	RAPID CITY 4 NW, SD US	44.12055	-103.28417	1060.4	0.00	50.0
...	...	...	...	...	...	...	...
2024-04-28	USC00396947	RAPID CITY 4 NW, SD US	44.12055	-103.28417	1060.4	0.00	NaN
2024-04-29	USC00396947	RAPID CITY 4 NW, SD US	44.12055	-103.28417	1060.4	0.37	30.0
2024-04-30	USC00396947	RAPID CITY 4 NW, SD US	44.12055	-103.28417	1060.4	0.00	44.0
2024-05-01	USC00396947	RAPID CITY 4 NW, SD US	44.12055	-103.28417	1060.4	0.00	33.0
2024-05-02	USC00396947	RAPID CITY 4 NW, SD US	44.12055	-103.28417	1060.4	0.35	39.0

	PRCP	TOBS
DATE
1949-10-01	0.00	51.0
1949-10-02	0.00	51.0
1949-10-03	0.00	52.0
1949-10-04	0.00	45.0
1949-10-05	0.00	50.0
...	...	...
2024-04-28	0.00	NaN
2024-04-29	0.37	30.0
2024-04-30	0.00	44.0
2024-05-01	0.00	33.0
2024-05-02	0.35	39.0

	PRCP	TOBS	TCel
DATE
1949-10-01	0.00	51.0	10.555556
1949-10-02	0.00	51.0	10.555556
1949-10-03	0.00	52.0	11.111111
1949-10-04	0.00	45.0	7.222222
1949-10-05	0.00	50.0	10.000000
...	...	...	...
2024-04-28	0.00	NaN	NaN
2024-04-29	0.37	30.0	-1.111111
2024-04-30	0.00	44.0	6.666667
2024-05-01	0.00	33.0	0.555556
2024-05-02	0.35	39.0	3.888889

	PRCP	TOBS	TCel	celsius
DATE
1949-10-01	0.00	51.0	10.555556	10.555556
1949-10-02	0.00	51.0	10.555556	10.555556
1949-10-03	0.00	52.0	11.111111	11.111111
1949-10-04	0.00	45.0	7.222222	7.222222
1949-10-05	0.00	50.0	10.000000	10.000000
...	...	...	...	...
2024-04-28	0.00	NaN	NaN	NaN
2024-04-29	0.37	30.0	-1.111111	-1.111111
2024-04-30	0.00	44.0	6.666667	6.666667
2024-05-01	0.00	33.0	0.555556	0.555556
2024-05-02	0.35	39.0	3.888889	3.888889

	PRCP	TOBS	TCel	celsius
DATE
1983-01-01	0.00	30.0	-1.111111	-1.111111
1983-01-02	0.00	29.0	-1.666667	-1.666667
1983-01-03	0.00	40.0	4.444444	4.444444
1983-01-04	0.00	33.0	0.555556	0.555556
1983-01-05	0.00	43.0	6.111111	6.111111
...	...	...	...	...
2023-12-27	0.31	32.0	0.000000	0.000000
2023-12-28	0.00	17.0	-8.333333	-8.333333
2023-12-29	0.00	28.0	-2.222222	-2.222222
2023-12-30	0.00	NaN	NaN	NaN
2023-12-31	0.00	NaN	NaN	NaN

Climate change is impacting the way people live around the world¶

Get started with open reproducible science!¶

Human-readable and Machine-readable¶

What the fork?! Who wrote this?¶

Python packages let you use code written by experts around the world¶

There are more Earth Observation data online than any one person could ever look at¶

You can access NCEI GHCNd Data from the internet using its API 🖥️ 📡 🖥️¶

Download and get started working with NCEI data¶

Plot the precipitation column (PRCP) vs time to explore the data¶

Subsetting and Resampling¶

Now we are ready to calculate annual statistics¶

Rapid City, SD colder than 40 years ago and temperatures continue to shift! 📰 🗞️ 📻¶

THIS ISN’T THE END! 😄¶

Your turn: pick a new location and/or measurement to plot 🌏 📈¶

Congratulations, you’re almost done with this coding challenge 🤩 – now make sure that your code is reproducible¶

BONUS: Create a shareable Markdown of your work¶

Temperatures on the rise in Mount Rainier, WA over the last 40 years! 📰 🗞️ 📻¶

	PRCP	TOBS	TCel	celsius
DATE
1983-12-31	0.038849	59.302632	15.168129	15.168129
1984-12-31	0.026145	54.458182	12.476768	12.476768
1985-12-31	0.039091	50.691667	10.384259	10.384259
1986-12-31	0.069551	53.672673	12.040374	12.040374
1987-12-31	0.039011	56.988950	13.882750	13.882750
1988-12-31	0.028017	56.983240	13.879578	13.879578
1989-12-31	0.056359	38.072829	3.373794	3.373794
1990-12-31	0.039068	40.363112	4.646174	4.646174
1991-12-31	0.056875	39.945869	4.414372	4.414372
1992-12-31	0.036714	39.525862	4.181034	4.181034
1993-12-31	0.055881	35.522581	1.956989	1.956989
1994-12-31	0.034540	39.479769	4.155427	4.155427
1995-12-31	0.063609	39.150568	3.972538	3.972538
1996-12-31	0.058785	36.547486	2.526381	2.526381
1997-12-31	0.057634	38.825073	3.791707	3.791707
1998-12-31	0.068343	40.563739	4.757633	4.757633
1999-12-31	0.073104	41.688202	5.382335	5.382335
2000-12-31	0.050771	39.750751	4.305973	4.305973
2001-12-31	0.049639	43.371134	6.317297	6.317297
2002-12-31	0.036126	33.482143	0.823413	0.823413
2003-12-31	0.039186	40.455253	4.697363	4.697363
2004-12-31	0.030242	38.877828	3.821016	3.821016
2005-12-31	0.044620	40.627119	4.792844	4.792844
2006-12-31	0.042870	40.873278	4.929599	4.929599
2007-12-31	0.038515	34.806931	1.559406	1.559406
2008-12-31	0.025892	34.204969	1.224983	1.224983
2009-12-31	0.053828	35.871324	2.150735	2.150735
2010-12-31	0.056767	39.012384	3.895769	3.895769
2011-12-31	0.060282	40.313846	4.618803	4.618803
2012-12-31	0.019341	42.008746	5.560415	5.560415
2013-12-31	0.060685	38.392638	3.551466	3.551466
2014-12-31	0.057726	39.211310	4.006283	4.006283
2015-12-31	0.057260	41.351275	5.195153	5.195153
2016-12-31	0.039508	42.161644	5.645358	5.645358
2017-12-31	0.034082	41.013889	5.007716	5.007716
2018-12-31	0.057335	36.670732	2.594851	2.594851
2019-12-31	0.085056	36.159544	2.310858	2.310858
2020-12-31	0.044006	41.023438	5.013021	5.013021
2021-12-31	0.032225	40.363248	4.646249	4.646249
2022-12-31	0.028421	39.331395	4.072997	4.072997
2023-12-31	0.046313	40.144578	4.524766	4.524766

	STATION	NAME	LATITUDE	LONGITUDE	ELEVATION	PRCP	TOBS
DATE
1916-12-01	USC00456898	RAINIER PARADISE RANGER STATION, WA US	46.78639	-121.74222	1650.5	NaN	29.0
1916-12-02	USC00456898	RAINIER PARADISE RANGER STATION, WA US	46.78639	-121.74222	1650.5	NaN	28.0
1916-12-03	USC00456898	RAINIER PARADISE RANGER STATION, WA US	46.78639	-121.74222	1650.5	NaN	21.0
1916-12-04	USC00456898	RAINIER PARADISE RANGER STATION, WA US	46.78639	-121.74222	1650.5	NaN	23.0
1916-12-05	USC00456898	RAINIER PARADISE RANGER STATION, WA US	46.78639	-121.74222	1650.5	NaN	22.0
...	...	...	...	...	...	...	...
2024-05-08	USC00456898	RAINIER PARADISE RANGER STATION, WA US	46.78639	-121.74222	1650.5	NaN	NaN
2024-05-09	USC00456898	RAINIER PARADISE RANGER STATION, WA US	46.78639	-121.74222	1650.5	NaN	54.0
2024-05-10	USC00456898	RAINIER PARADISE RANGER STATION, WA US	46.78639	-121.74222	1650.5	0.0	61.0
2024-05-11	USC00456898	RAINIER PARADISE RANGER STATION, WA US	46.78639	-121.74222	1650.5	0.0	59.0
2024-05-12	USC00456898	RAINIER PARADISE RANGER STATION, WA US	46.78639	-121.74222	1650.5	0.0	54.0

	PRCP	TOBS	TCel
DATE
1980-01-01	1.29	29.0	-1.666667
1980-01-02	0.08	31.0	-0.555556
1980-01-03	0.74	18.0	-7.777778
1980-01-04	0.10	21.0	-6.111111
1980-01-05	1.58	18.0	-7.777778
...	...	...	...
2023-12-27	NaN	NaN	NaN
2023-12-28	NaN	36.0	2.222222
2023-12-29	0.00	40.0	4.444444
2023-12-30	0.20	34.0	1.111111
2023-12-31	0.39	32.0	0.000000

	PRCP	TOBS	TCel
DATE
1980-12-31	0.340847	34.983516	1.657509
1981-12-31	0.337315	36.912088	2.728938
1982-12-31	0.316418	34.668524	1.482513
1983-12-31	0.355205	35.173077	1.762821
1984-12-31	0.337637	33.704918	0.947177
1985-12-31	0.228000	35.640110	2.022283
1986-12-31	0.310932	38.142466	3.412481
1987-12-31	0.199331	39.781818	4.323232
1988-12-31	0.328297	37.186301	2.881279
1989-12-31	0.274848	35.632597	2.018109
1990-12-31	0.405439	35.107042	1.726135
1991-12-31	0.347582	36.430137	2.461187
1992-12-31	0.272932	37.699454	3.166363
1993-12-31	0.218822	33.498630	0.832572
1994-12-31	0.384620	35.877483	2.154157
1995-12-31	0.382644	35.853968	2.141093
1996-12-31	0.354772	36.933824	2.741013
1997-12-31	0.398710	35.944984	2.191658
1998-12-31	0.330840	36.889205	2.716225
1999-12-31	0.342132	35.739394	2.077441
2000-12-31	0.261652	33.385382	0.769657
2001-12-31	0.332028	33.288401	0.715778
2002-12-31	0.289858	37.241379	2.911877
2003-12-31	0.357840	35.927419	2.181900
2004-12-31	0.301335	40.064706	4.480392
2005-12-31	0.297229	38.962536	3.868076
2006-12-31	0.378636	38.075758	3.375421
2007-12-31	0.299623	37.391975	2.995542
2008-12-31	0.318908	35.789272	2.105151
2009-12-31	0.264627	36.655052	2.586140
2010-12-31	0.276537	38.596330	3.664628
2011-12-31	0.370717	34.744681	1.524823
2012-12-31	0.339748	36.509434	2.505241
2013-12-31	0.286890	38.206294	3.447941
2014-12-31	0.345017	38.678457	3.710254
2015-12-31	0.321603	41.861314	5.478508
2016-12-31	0.375076	38.674658	3.708143
2017-12-31	0.297438	40.143791	4.524328
2018-12-31	0.385768	38.235880	3.464378
2019-12-31	0.256429	38.764331	3.757962
2020-12-31	0.488738	37.295276	2.941820
2021-12-31	0.340103	40.833333	4.907407
2022-12-31	0.227745	41.918301	5.510167
2023-12-31	0.232778	43.404669	6.335927

Climate change is impacting the way people live around the world¶

Get started with open reproducible science!¶

Human-readable and Machine-readable¶

What the fork?! Who wrote this?¶

Python packages let you use code written by experts around the world¶

There are more Earth Observation data online than any one person could ever look at¶

You can access NCEI GHCNd Data from the internet using its API 🖥️ 📡 🖥️¶

Download and get started working with NCEI data¶

Plot the precipitation column (PRCP) vs time to explore the data¶

Subsetting and Resampling¶

Now we are ready to calculate annual statistics¶

**Rapid City, SD colder than 40 years ago and temperatures continue to shift!** 📰 🗞️ 📻¶

THIS ISN’T THE END! 😄¶

Your turn: pick a new location and/or measurement to plot 🌏 📈¶

Congratulations, you’re almost done with this coding challenge 🤩 – now make sure that your code is reproducible¶

BONUS: Create a shareable Markdown of your work¶

**Temperatures on the rise in Mount Rainier, WA over the last 40 years!** 📰 🗞️ 📻¶

Rapid City, SD colder than 40 years ago and temperatures continue to shift! 📰 🗞️ 📻¶

Temperatures on the rise in Mount Rainier, WA over the last 40 years! 📰 🗞️ 📻¶