# Import required packages
import pandas as pd
import numpy as np

# Build the NCEI Access Data Service request URL for the Boulder station:
# a fixed endpoint followed by the query parameters joined with '&'.
Boulder_data = 'https://www.ncei.noaa.gov/access/services/data/v1?' + '&'.join([
    'dataset=daily-summaries',
    'dataTypes=TOBS,PRCP',
    'stations=USC00050848',
    'units=standard',
    'startDate=1901-10-01',
    'endDate=2023-09-30',
])
Boulder_data

'https://www.ncei.noaa.gov/access/services/data/v1?dataset=daily-summaries&dataTypes=TOBS,PRCP&stations=USC00050848&units=standard&startDate=1901-10-01&endDate=2023-09-30'

# Download the Boulder daily summaries as CSV straight from the NCEI API.
# The DATE column becomes the index and is parsed into datetimes;
# the literal text 'NaN' is read as a missing value.
Boulder_df = pd.read_csv(
    Boulder_data,
    na_values=['NaN'],
    parse_dates=True,
    index_col='DATE',
)
Boulder_df

# Choose a different location: same NCEI request, but for station
# USC00186350 and a record that starts in October 1950.
DC_data = 'https://www.ncei.noaa.gov/access/services/data/v1?' + '&'.join([
    'dataset=daily-summaries',
    'dataTypes=TOBS,PRCP',
    'stations=USC00186350',
    'units=standard',
    'startDate=1950-10-01',
    'endDate=2023-09-30',
])
DC_data

'https://www.ncei.noaa.gov/access/services/data/v1?dataset=daily-summaries&dataTypes=TOBS,PRCP&stations=USC00186350&units=standard&startDate=1950-10-01&endDate=2023-09-30'

# Download the second station's daily summaries as CSV from the NCEI API.
# The DATE column becomes the index and is parsed into datetimes;
# the literal text 'NaN' is read as a missing value.
DC_df = pd.read_csv(
    DC_data,
    na_values=['NaN'],
    parse_dates=True,
    index_col='DATE',
)
DC_df

# Plot the daily observed temperature (TOBS) record.
# The y-label is a raw string so the LaTeX '\circ' reaches matplotlib
# unchanged; in a normal string '\c' is an invalid escape sequence that
# newer Python versions warn about.
DC_df.plot(
    y='TOBS',
    title='Washington, DC Temperature',
    xlabel='Year',
    ylabel=r'Temp ($^\circ$F)',
    legend=False)

<Axes: title={'center': 'Washington, DC Temperature'}, xlabel='Year', ylabel='Temp ($^\\circ$F)'>

# Resample the daily record to one row per calendar year ('YS' = year start):
# precipitation is totalled and observed temperature is averaged.
# The aggregations are given as the strings 'sum' / 'mean' rather than the
# NumPy callables: pandas raises a FutureWarning for np.sum / np.mean here
# and recommends the string names to keep the current behavior.
# NOTE(review): the request spans 1950-10-01 to 2023-09-30, so the first and
# last years look like partial years; confirm before comparing annual totals.
ann_DC_df = DC_df.resample('YS').agg({'PRCP': 'sum', 'TOBS': 'mean'})
ann_DC_df

/tmp/ipykernel_30674/2078979801.py:2: FutureWarning: The provided callable <function sum at 0x73932fd37250> is currently using SeriesGroupBy.sum. In a future version of pandas, the provided callable will be used directly. To keep current behavior pass 'sum' instead.
  ann_DC_df = DC_df.resample('YS').agg({'PRCP': np.sum, 'TOBS': np.mean})
/tmp/ipykernel_30674/2078979801.py:2: FutureWarning: The provided callable <function mean at 0x73932fd581f0> is currently using SeriesGroupBy.mean. In a future version of pandas, the provided callable will be used directly. To keep current behavior pass 'mean' instead.
  ann_DC_df = DC_df.resample('YS').agg({'PRCP': np.sum, 'TOBS': np.mean})

# Plot the annual precipitation.
# PRCP was aggregated with a sum when resampling to annual, so each point is
# a yearly total rather than an average; the title says so.
ann_DC_df.plot(
    y='PRCP',
    title='Washington, DC Total Annual Precip',
    xlabel='Year',
    ylabel='Precip (in)',
    legend=False)

<Axes: title={'center': 'Washington, DC Average Annual Precip'}, xlabel='Year', ylabel='Precip (in)'>

	STATION	PRCP	TOBS
DATE
1901-10-01	USC00050848	0.0	62.0
1901-10-02	USC00050848	0.0	60.0
1901-10-03	USC00050848	0.0	57.0
1901-10-04	USC00050848	0.0	53.0
1901-10-05	USC00050848	0.0	49.0
...	...	...	...
2023-09-26	USC00050848	0.0	74.0
2023-09-27	USC00050848	0.0	69.0
2023-09-28	USC00050848	0.0	73.0
2023-09-29	USC00050848	0.0	66.0
2023-09-30	USC00050848	0.0	78.0

	STATION	PRCP	TOBS
DATE
1950-10-01	USC00186350	0.00	80.0
1950-10-02	USC00186350	0.00	81.0
1950-10-03	USC00186350	0.00	81.0
1950-10-04	USC00186350	0.27	61.0
1950-10-05	USC00186350	0.00	62.0
...	...	...	...
2023-09-26	USC00186350	0.07	58.0
2023-09-27	USC00186350	0.04	58.0
2023-09-28	USC00186350	0.00	53.0
2023-09-29	USC00186350	0.01	61.0
2023-09-30	USC00186350	0.00	66.0

	PRCP	TOBS
DATE
1950-01-01	9.05	53.363636
1951-01-01	39.90	64.176966
1952-01-01	48.09	61.715190
1953-01-01	20.73	67.351695
1954-01-01	32.56	64.362573
...	...	...
2019-01-01	43.92	54.866667
2020-01-01	63.66	55.389831
2021-01-01	42.55	55.108635
2022-01-01	43.04	53.752941
2023-01-01	27.35	56.803922

Climate coding challenge, Part 6

There are more Earth Observation data online than any one person could ever look at

Access NCEI GHCNd Data from the internet using its API 🖥️ 📡 🖥️

Download and get started working with NCEI data