# Step 0: libraries

# Libraries for working with NCEI data
from pathlib import Path
import pandas as pd

# Libraries for plotting and saving plot
import hvplot.pandas
import holoviews as hv

# Making trend (slope) lines
import numpy as np
from sklearn.metrics import r2_score

# Step 0.1: project paths

# Every data location is derived from the project root, which is resolved
# once as the parent of the current working directory.
PROJECT_ROOT = Path("..").resolve()
DATA_DIR = PROJECT_ROOT.joinpath("data")
TEMP_DIR = DATA_DIR.joinpath("temperature")

# Step 1: Import data into python
# Read the downloaded NCEI station CSV into a DataFrame.

## NOTE ##
# It is good practice to rename your data files into something descriptive and easy to identify.
# For example, the Ramona, CA station data was renamed to 'ncei-climate-ramona.csv'.
# The full location is kept in csv_path so it does not have to be typed out again.

# Specify path
csv_path = TEMP_DIR.joinpath("ncei-climate-ramona.csv")

# Reader options:
#   index_col   - use the DATE column as the row index
#   parse_dates - parse that index as dates
#   na_values   - treat the literal string "NaN" as a missing value
read_options = {
    "index_col": "DATE",
    "parse_dates": True,
    "na_values": ["NaN"],
}
ramona_climate_df = pd.read_csv(csv_path, **read_options)

# Preview the first rows
ramona_climate_df.head()

# Step 2: Clean the dataframe
# Keep only the daily maximum (TMAX) and minimum (TMIN) temperature columns.
ramona_climate_max_min_df = ramona_climate_df.loc[:, ["TMAX", "TMIN"]]

# TMAX and TMIN are used because we later plot the average yearly max and min temperature.
# This helps clarify not only whether Ramona, CA is getting warmer, but how much hotter the highs are year to year.
# The same logic applies to how much the minimum temperature is rising over time.
# We are generally more interested in the effects of these extremes when it comes to ecosystem responses.

# I also know the climate of Ramona, CA well. We generally have more extreme temperature swings in the winter and spring.
# In the summer we stay consistently hot and do not really cool off that much in the evenings.
# As a result, TAVG would mask a lot of the seasonal swings that are important to fire season in Ramona, CA,
# especially during October, the month in which we see the most fire activity.

# Display the new variable
ramona_climate_max_min_df

# Step 3: Convert temperature units
# First give TMAX/TMIN names that state their unit (Fahrenheit).
fahrenheit_names = {"TMAX": "max_temp_f", "TMIN": "min_temp_f"}
climate_temp = ramona_climate_max_min_df.rename(columns=fahrenheit_names)

# Then add a Celsius column for each Fahrenheit column: C = (F - 32) * 5 / 9
for extreme in ("max", "min"):
    climate_temp[f"{extreme}_temp_c"] = (climate_temp[f"{extreme}_temp_f"] - 32) * 5 / 9

# Preview the date index together with the temp_f and temp_c columns
climate_temp.head()

# Step 4: Plot the data using only Fahrenheit

# Build ann_ramona_climate_df: the annual average of every column in climate_temp.
# 'YS' groups the daily rows by the start of each calendar year.
# mean() then averages both the temp_f and temp_c columns within each year.
# NOTE(review): the daily records shown in this file run from 1998-04-16 to
# 2025-08-26, so the 1998 and 2025 means appear to cover only part of a year.
# Confirm whether those partial years should be part of the trend.
ann_ramona_climate_df = climate_temp.resample("YS").mean()

# Replace the DATE index with the plain year, named "year", so the displayed table is easier to interpret
ann_ramona_climate_df.index = ann_ramona_climate_df.index.year.rename("year")

# Display the new variable
ann_ramona_climate_df

# The table now lists one row per year with the average max and min temps.
# Because these are means, the high summer peaks Ramona, CA gets (usually over 100+) are averaged away.

#### CONT ####
# Step 4: Plot the data using only Fahrenheit

# The annual table ann_ramona_climate_df is plotted with a descriptive title
# and labelled x and y axes.
# Setting y to max_temp_f displays only the maximum Fahrenheit data;
# a separate figure is made later for min_temp_f.

### Why create individual figures? ###
# With both series on one graph the y range gets wide, which makes the
# magnitude of the peaks and lows harder to see.

# Regression inputs for the max-temperature figure: year (as float) and annual mean max temp
x = ann_ramona_climate_df.index.to_numpy(dtype=float)
y_max = ann_ramona_climate_df["max_temp_f"].to_numpy()

# Degree-1 least-squares fit; the coefficients come back as (slope, intercept)
slope_max, intercept_max = np.polyfit(x, y_max, 1)
y_max_trend = slope_max * x + intercept_max

# hvplot (rather than plot) is used so that the resulting figure is interactive
max_plot_options = dict(
    y=["max_temp_f"],
    title='Ramona, CA Average Max Yearly Temperature',
    xlabel='Year',
    ylabel='Temperature (°F)',
    line_width=2,
)
ramona_climate_max_f = ann_ramona_climate_df.hvplot(**max_plot_options)

# The trend line is its own HoloViews Curve, drawn as a dashed red line
max_trend_style = dict(color="red", line_width=2, line_dash="dashed", alpha=0.7)
trend_line_max = hv.Curve(
    (x, y_max_trend),
    kdims="Year",
    vdims="Temperature (°F)",
).opts(**max_trend_style)

# Overlay the trend on this figure only
ramona_climate_max_f_with_trend = ramona_climate_max_f * trend_line_max

# Display it
ramona_climate_max_f_with_trend

# Report the slope (per year and per decade), the intercept and R² of the max-temperature trend.
# slope_max and intercept_max were already fitted in the cell above, so they are reused here.

# Fitted values, needed for R²
y_max_pred = slope_max * x + intercept_max

# R-squared of the fitted line against the annual means
r2_max = r2_score(y_max, y_max_pred)

# Ten years of the yearly slope gives the change per decade
slope_max_decade = slope_max * 10

# Print summary
# Each value is labelled and formatted with its unit so the output is easy to read.
# The intercept is the fitted temperature at year = 0, far outside the data,
# so it has no physical meaning here.
max_summary = (
    "=== Ramona, CA Annual Max Temperature Trend ===",
    f"Slope (per year):   {slope_max:.4f} °F/year",
    f"Slope (per decade): {slope_max_decade:.4f} °F/decade",
    f"Intercept:          {intercept_max:.2f}",
    f"R²:                 {r2_max:.4f}",
)
print("\n".join(max_summary))

=== Ramona, CA Annual Max Temperature Trend ===
Slope (per year):   0.1250 °F/year
Slope (per decade): 1.2496 °F/decade
Intercept:          -174.67
R²:                 0.4500

# The same figure can also be viewed without the trend line

# Display the plain max-temperature plot (no trend overlay)
ramona_climate_max_f

#### CONT ####
# Step 4: Plot the data using only Fahrenheit

# Same approach as the max-temperature figure, this time using min_temp_f.
# The annual table ann_ramona_climate_df is plotted with a descriptive title
# and labelled x and y axes; setting y to min_temp_f displays only the
# minimum Fahrenheit data.

# Regression inputs: year (as float) and annual mean min temp
x = ann_ramona_climate_df.index.to_numpy(dtype=float)
y_min = ann_ramona_climate_df["min_temp_f"].to_numpy()

# Degree-1 least-squares fit; the coefficients come back as (slope, intercept)
slope_min, intercept_min = np.polyfit(x, y_min, 1)
y_min_trend = slope_min * x + intercept_min

# Plot the actual values (min temperatures)
min_plot_options = dict(
    y="min_temp_f",
    title="Ramona, CA Average Min Yearly Temperature",
    xlabel="Year",
    ylabel="Temperature (°F)",
    line_width=2,
)
ramona_climate_min_f = ann_ramona_climate_df.hvplot(**min_plot_options)

# The trend line is its own HoloViews Curve, drawn as a dashed red line
min_trend_style = dict(color="red", line_width=2, line_dash="dashed", alpha=0.7)
trend_line_min = hv.Curve(
    (x, y_min_trend),
    kdims="Year",
    vdims="Temperature (°F)",
).opts(**min_trend_style)

# Overlay the trend on this figure only
ramona_climate_min_f_with_trend = ramona_climate_min_f * trend_line_min

# Display it
ramona_climate_min_f_with_trend

#### CONT ####
# Step 4: Plot the data using only Fahrenheit
# Report the slope (per year and per decade), the intercept and R² of the min-temperature trend.

# slope_min and intercept_min were already fitted in the cell above, so they are reused here.
# Fitted values, needed for R²
y_min_pred = slope_min * x + intercept_min

# R-squared of the fitted line against the annual means
r2_min = r2_score(y_min, y_min_pred)

# Ten years of the yearly slope gives the change per decade
slope_min_decade = slope_min * 10

# Print summary, one labelled value per line
min_summary = (
    "=== Ramona, CA Annual Min Temperature Trend ===",
    f"Slope (per year):   {slope_min:.4f} °F/year",
    f"Slope (per decade): {slope_min_decade:.4f} °F/decade",
    f"Intercept:          {intercept_min:.2f}",
    f"R²:                 {r2_min:.4f}",
)
print("\n".join(min_summary))

=== Ramona, CA Annual Min Temperature Trend ===
Slope (per year):   0.0507 °F/year
Slope (per decade): 0.5071 °F/decade
Intercept:          -56.59
R²:                 0.1290

# The same figure can also be viewed without the trend line

# Display the plain min-temperature plot (no trend overlay)
ramona_climate_min_f

#### CONT ####
# Step 4: Plot the data using only Fahrenheit

# To make these figures easier to view together we can stack them.
# When saving as html and static images, they can be saved both individually and joined.

# These figures get their own names and titles because no trend line should
# appear here, unlike the independent figures above.

# Axis labels and line width shared by both panels
stacked_plot_options = dict(xlabel="Year", ylabel="Temperature (°F)", line_width=2)

ramona_max_temp = ann_ramona_climate_df.hvplot(
    y="max_temp_f",
    title="Annual Average Maximum Temperature",
    **stacked_plot_options,
)

ramona_min_temp = ann_ramona_climate_df.hvplot(
    y="min_temp_f",
    title="Annual Average Minimum Temperature",
    **stacked_plot_options,
)

# .cols(1) limits the layout to a single column, so the panels stack top and bottom
(ramona_max_temp + ramona_min_temp).cols(1)

# Step 5: Save the plots
# All figures go into <project root>/figures, created on first use.
FIG_DIR = PROJECT_ROOT.joinpath("figures")
FIG_DIR.mkdir(exist_ok=True)

# Stacked max/min layout, saved alongside the individual figures
combined = (ramona_max_temp + ramona_min_temp).cols(1)

# Interactive (HTML) exports, written in the order listed
html_exports = [
    # Interactive figures with NO trend lines
    (ramona_climate_min_f, "Ramona_avg_min_yr_temp_f.html"),
    (ramona_climate_max_f, "Ramona_avg_max_yr_temp_f.html"),
    (combined, "ramona_max_min_temps_vertical.html"),
    # Interactive figures WITH trend lines
    (ramona_climate_max_f_with_trend, "ramona_max_temp_trend.html"),
    (ramona_climate_min_f_with_trend, "ramona_min_temp_trend.html"),
]
for figure, file_name in html_exports:
    hv.save(figure, FIG_DIR / file_name)

# Static (PNG) exports, written in the order listed
png_exports = [
    # Static figures with NO trend lines
    (ramona_climate_max_f, "ramona_avg_max_temp_f_year.png"),
    (ramona_climate_min_f, "ramona_avg_min_temp_f_year.png"),
    (combined, "ramona_max_min_stacked.png"),
    # Static figures WITH trend lines
    (ramona_climate_max_f_with_trend, "ramona_max_temp_f_trend.png"),
    (ramona_climate_min_f_with_trend, "ramona_min_temp_f_trend.png"),
]
for figure, file_name in png_exports:
    hv.save(figure, FIG_DIR / file_name, fmt="png")

# Persist the annual DataFrame with IPython's %store magic so that later
# notebooks can restore it (e.g. with `%store -r ann_ramona_climate_df`)
%store ann_ramona_climate_df

Stored 'ann_ramona_climate_df' (DataFrame)

	STATION	NAME	TAVG	TMAX	TMIN
DATE
1998-04-16	USW00053120	RAMONA AIRPORT, CA US	48.0	61.0	34.0
1998-04-17	USW00053120	RAMONA AIRPORT, CA US	53.0	69.0	36.0
1998-04-18	USW00053120	RAMONA AIRPORT, CA US	55.0	72.0	37.0
1998-04-19	USW00053120	RAMONA AIRPORT, CA US	59.0	77.0	41.0
1998-04-20	USW00053120	RAMONA AIRPORT, CA US	63.0	82.0	43.0

	TMAX	TMIN
DATE
1998-04-16	61.0	34.0
1998-04-17	69.0	36.0
1998-04-18	72.0	37.0
1998-04-19	77.0	41.0
1998-04-20	82.0	43.0
...	...	...
2025-08-22	100.0	62.0
2025-08-23	103.0	61.0
2025-08-24	95.0	61.0
2025-08-25	95.0	63.0
2025-08-26	93.0	58.0

	max_temp_f	min_temp_f	max_temp_c	min_temp_c
DATE
1998-04-16	61.0	34.0	16.111111	1.111111
1998-04-17	69.0	36.0	20.555556	2.222222
1998-04-18	72.0	37.0	22.222222	2.777778
1998-04-19	77.0	41.0	25.000000	5.000000
1998-04-20	82.0	43.0	27.777778	6.111111

	max_temp_f	min_temp_f	max_temp_c	min_temp_c
year
1998	74.799127	45.506550	23.777293	7.503639
1999	75.240331	42.930939	24.022406	6.072744
2000	75.763085	45.421488	24.312825	7.456382
2001	73.967033	45.068681	23.315018	7.260379
2002	74.620879	44.258242	23.678266	6.810134
2003	75.513889	45.663889	24.174383	7.591049
2004	75.456284	45.084699	24.142380	7.269277
2005	75.476712	45.643836	24.153729	7.579909
2006	76.753425	44.879452	24.863014	7.155251
2007	76.723757	44.475138	24.846532	6.930632
2008	77.543175	46.175487	25.301764	7.875271
2009	76.894150	45.194986	24.941195	7.330548
2010	74.341737	44.593838	23.523187	6.996576
2011	75.332418	43.016529	24.073565	6.120294
2012	77.463014	44.630137	25.257230	7.016743
2013	76.805479	44.586301	24.891933	6.992390
2014	79.200000	47.158904	26.222222	8.421613
2015	78.076712	47.284932	25.598174	8.491629
2016	77.969863	46.405479	25.538813	8.003044
2017	78.952381	47.678771	26.084656	8.710428
2018	78.589041	47.378082	25.882801	8.543379
2019	75.945205	46.126027	24.414003	7.847793
2020	78.409836	44.877049	25.783242	7.153916
2021	77.175824	44.690411	25.097680	7.050228
2022	78.755495	46.453297	25.975275	8.029609
2023	75.458791	45.570248	24.143773	7.539027
2024	78.388430	45.484848	25.771350	7.491582
2025	77.710084	45.084034	25.394491	7.268908

Using this notebook¶

Climate Trends in Ramona, California (1998–2025)¶

How this supports the broader project¶

Step 0: Libraries¶

Step 1: Import the climate data¶

Step 2: Clean the dataframe¶

Step 3: Convert temperature units¶

Step 4: Plot the data using only Fahrenheit¶

Step 5: Save the plot¶

WARNING¶

What the code in 'Step 0.1: Project Paths' does¶

Selecting your own data from NOAA/NCEI¶

Ramona, CA station information¶

Step 1: Import data into python¶

Step 2: clean the dataframe¶

Step 3: convert temperature units¶

Step 4: plot the data using only Fahrenheit¶

Why resample to annual averages?¶

Understanding the trend calculations below¶

Step 5: Save the Plot¶

Storing variables for later notebooks¶

Ramona, CA: The hot is getting hotter and the cold is getting warmer¶

Temperature Trends in Ramona, CA (1998–2025)¶

Minimum Temperature Trend (Nighttime Lows)¶

Maximum Temperature Trend (Daytime Highs)¶

Overall Implications¶

So why have we spent our first notebook looking at climate for Ramona, CA if our focus is on fire?¶