%store -r

# Step 1: Libraries & Paths

import os
from pathlib import Path
import zipfile

import geopandas as gpd
import rioxarray as rxr
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt

# Paths changed between notebooks, so redefine the project directories here.
# These assignments override anything restored by `%store -r` above.
PROJECT_ROOT = Path(
    r"C:\Users\kayle\Desktop\earth-analytics\Final project\ramona-fire-recovery"
)
DATA_DIR = PROJECT_ROOT.joinpath("data")
BOUNDARY_DIR = DATA_DIR.joinpath("boundaries")

# Added in this notebook: directory for the land cover rasters.
LANDCOVER_DIR = DATA_DIR.joinpath("raw", "landcover")

LANDCOVER_DIR

WindowsPath('C:/Users/kayle/Desktop/earth-analytics/Final project/ramona-fire-recovery/data/raw/landcover')

# Step 2: Extract NLCD 2024 GeoTIFFs from zip
tif_name_2024 = "Annual_NLCD_LndCov_2024_CU_C1V1.tif"
zip_path = LANDCOVER_DIR / "Annual_NLCD_LndCov_2024_CU_C1V1.zip"
tif_path_2024 = LANDCOVER_DIR / tif_name_2024

# Only unzip when the GeoTIFF is not on disk yet, so re-running this cell
# does not repeat the extraction.
if tif_path_2024.exists():
    print("NLCD 2024 .tif already extracted.")
else:
    print("Extracting NLCD 2024 from zip...")
    with zipfile.ZipFile(zip_path, "r") as zf:
        zf.extractall(LANDCOVER_DIR)

tif_path_2024

NLCD 2024 .tif already extracted.

WindowsPath('C:/Users/kayle/Desktop/earth-analytics/Final project/ramona-fire-recovery/data/raw/landcover/Annual_NLCD_LndCov_2024_CU_C1V1.tif')

# Step 3: Open and inspect the raster
# Open the GeoTIFF in 2048 x 2048 chunks with masked=True, then squeeze away
# length-1 dimensions (the printed shape below is 2-D).
nlcd_2024 = rxr.open_rasterio(
    tif_path_2024,
    masked=True,
    chunks=dict(x=2048, y=2048),
)
nlcd_2024 = nlcd_2024.squeeze(drop=True)

print("CRS:", nlcd_2024.rio.crs)
print("Shape:", nlcd_2024.shape)

# The CRS printed above is the raster's own Albers Equal Area projection, not
# California Albers. Rather than reprojecting this very large raster, Step 5
# reprojects the Cedar Fire boundary (cedar_3310) into the raster's CRS
# before cropping.

CRS: PROJCS["AEA        WGS84",GEOGCS["WGS 84",DATUM["WGS_1984",SPHEROID["WGS 84",6378137,298.257223563,AUTHORITY["EPSG","7030"]],AUTHORITY["EPSG","6326"]],PRIMEM["Greenwich",0],UNIT["degree",0.0174532925199433,AUTHORITY["EPSG","9122"]],AUTHORITY["EPSG","4326"]],PROJECTION["Albers_Conic_Equal_Area"],PARAMETER["latitude_of_center",23],PARAMETER["longitude_of_center",-96],PARAMETER["standard_parallel_1",29.5],PARAMETER["standard_parallel_2",45.5],PARAMETER["false_easting",0],PARAMETER["false_northing",0],UNIT["metre",1,AUTHORITY["EPSG","9001"]],AXIS["Easting",EAST],AXIS["Northing",NORTH]]
Shape: (105000, 160000)

# Step 4: Define NLCD classes
# Class code -> label lookup (Annual NLCD CONUS Collection 1.1).
NLCD_CLASSES = dict(
    [
        # Water
        (11, "Open Water"),
        (12, "Perennial Ice/Snow"),
        # Developed
        (21, "Developed, Open Space"),
        (22, "Developed, Low Intensity"),
        (23, "Developed, Medium Intensity"),
        (24, "Developed, High Intensity"),
        # Barren
        (31, "Barren Land"),
        # Forest
        (41, "Deciduous Forest"),
        (42, "Evergreen Forest"),
        (43, "Mixed Forest"),
        # Shrubland
        (51, "Dwarf Scrub"),
        (52, "Shrub/Scrub"),
        # Herbaceous
        (71, "Grassland/Herbaceous"),
        # Planted / cultivated
        (81, "Pasture/Hay"),
        (82, "Cultivated Crops"),
        # Wetlands
        (90, "Woody Wetlands"),
        (95, "Emergent Herbaceous Wetlands"),
    ]
)

def landcover_counts(da, nodata_values=(0,), class_names=None):
    """Summarize a categorical land cover array as per-class pixel counts.

    Parameters
    ----------
    da : object with a ``.values`` attribute
        Land cover raster (e.g. an ``xarray.DataArray``) holding class
        codes. Any shape is accepted; the values are flattened.
    nodata_values : iterable of numbers, default ``(0,)``
        Codes excluded from both the counts and the percent denominator.
    class_names : mapping of int -> str, optional
        Lookup from class code to label. Defaults to the module-level
        ``NLCD_CLASSES``.

    Returns
    -------
    pandas.DataFrame
        Columns ``class_code``, ``pixel_count``, ``percent`` and
        ``class_name`` (NaN for codes missing from the lookup), one row per
        class present, sorted by ``percent`` descending. The frame is empty
        when no valid pixels remain.
    """
    if class_names is None:
        class_names = NLCD_CLASSES

    values = np.asarray(da.values).ravel()

    # Float input (for example a raster opened with masked=True) marks missing
    # cells as NaN. Casting NaN to an integer yields an arbitrary code that
    # would be counted as a class, so drop non-finite cells before the cast.
    if np.issubdtype(values.dtype, np.floating):
        values = values[np.isfinite(values)]

    codes = values.astype("int32")
    codes = codes[~np.isin(codes, list(nodata_values))]

    unique, counts = np.unique(codes, return_counts=True)
    total = counts.sum()

    df = pd.DataFrame({
        "class_code": unique,
        "pixel_count": counts,
        # With no valid pixels `counts` is empty, so this stays an empty
        # array and no division by zero is evaluated.
        "percent": (counts / total) * 100,
    })
    df["class_name"] = df["class_code"].map(class_names)
    return df.sort_values("percent", ascending=False).reset_index(drop=True)

# Step 5.1 set fire years
# Analysis years grouped around each fire; later notebooks reuse these sets.
CEDAR_YEARS = dict(
    pre_fire=[2000, 2001, 2002],
    fire_year=[2003],
    post_fire=[2004, 2005, 2010, 2015, 2020],
)

WITCH_YEARS = dict(
    pre_fire=[2004, 2005, 2006],
    fire_year=[2007],
    post_fire=[2008, 2010, 2015, 2020],
)

CEDAR_YEARS, WITCH_YEARS

({'pre_fire': [2000, 2001, 2002],
  'fire_year': [2003],
  'post_fire': [2004, 2005, 2010, 2015, 2020]},
 {'pre_fire': [2004, 2005, 2006],
  'fire_year': [2007],
  'post_fire': [2008, 2010, 2015, 2020]})

# Step 5: Clip NLCD 2024 land cover to the Cedar Fire perimeter (cedar_3310)
# Requires cedar_3310 (restored by `%store -r`) to be in memory.
import math

import rasterio
from rasterio.features import geometry_mask
from rasterio.windows import Window, from_bounds
import xarray as xr

with rasterio.open(tif_path_2024) as src:
    # Reproject the (small) fire boundary into the raster's CRS instead of
    # reprojecting the (very large) raster.
    cedar_in_src_crs = cedar_3310.to_crs(src.crs)
    cedar_bounds = cedar_in_src_crs.total_bounds  # minx, miny, maxx, maxy

    # from_bounds returns fractional pixel offsets. Snap the window outward
    # to whole pixels so the read returns native, unresampled cells and the
    # window transform lines up with the raster grid.
    exact_window = from_bounds(*cedar_bounds, transform=src.transform)
    col_start = math.floor(exact_window.col_off)
    row_start = math.floor(exact_window.row_off)
    col_stop = math.ceil(exact_window.col_off + exact_window.width)
    row_stop = math.ceil(exact_window.row_off + exact_window.height)
    window = Window(
        col_start, row_start, col_stop - col_start, row_stop - row_start
    )

    nlcd_cedar_arr = src.read(1, window=window)  # band 1, cropped window
    nlcd_cedar_transform = src.window_transform(window)
    nlcd_cedar_crs = src.crs
    nlcd_cedar_nodata = src.nodata  # None when the file declares no nodata

# The window covers the perimeter's bounding box. Zero out every pixel that
# falls outside the perimeter itself so the summary describes the burned area
# only (0 is not an NLCD class code and is skipped by landcover_counts).
inside_perimeter = geometry_mask(
    cedar_in_src_crs.geometry,
    out_shape=nlcd_cedar_arr.shape,
    transform=nlcd_cedar_transform,
    invert=True,  # True = pixel is inside the perimeter
)
nlcd_cedar_arr[~inside_perimeter] = 0

# Turn into an xarray DataArray with rioxarray metadata.
# Coordinates are pixel-centre positions derived from the window transform
# (assumes a north-up raster, i.e. no rotation terms in the transform).
rows, cols = nlcd_cedar_arr.shape
x = nlcd_cedar_transform.c + (np.arange(cols) + 0.5) * nlcd_cedar_transform.a
y = nlcd_cedar_transform.f + (np.arange(rows) + 0.5) * nlcd_cedar_transform.e

nlcd_2024_cedar = xr.DataArray(
    nlcd_cedar_arr,
    dims=("y", "x"),
    coords={"y": y, "x": x},
).rio.write_crs(nlcd_cedar_crs, inplace=True).rio.write_transform(nlcd_cedar_transform, inplace=True)

# Skip both the outside-perimeter fill (0) and the raster's own nodata value.
nodata_codes = (0,) if nlcd_cedar_nodata is None else (0, nlcd_cedar_nodata)

df_cedar_2024 = landcover_counts(nlcd_2024_cedar, nodata_values=nodata_codes)
df_cedar_2024.head()

# Step 6: Visualize land composition
fig, ax = plt.subplots(figsize=(8, 4))

# Codes missing from the class lookup have a NaN class_name; fall back to the
# numeric code so every bar still gets a usable categorical label.
bar_labels = df_cedar_2024["class_name"].fillna(
    df_cedar_2024["class_code"].astype(str)
)
ax.bar(bar_labels, df_cedar_2024["percent"])

# Rotate the existing tick labels. Calling set_xticklabels() without fixed
# tick positions triggers a matplotlib UserWarning.
ax.tick_params(axis="x", labelrotation=90)
ax.set_ylabel("Percent of area (%)")
ax.set_title("Cedar Fire Area Landcover Composition (NLCD 2024)")
plt.tight_layout()

C:\Users\kayle\AppData\Local\Temp\ipykernel_13968\2360616132.py:4: UserWarning: set_ticklabels() should only be used with a fixed number of ticks, i.e. after set_ticks() or using a FixedLocator.
  ax.set_xticklabels(df_cedar_2024["class_name"], rotation=90)

# Step 7: Save the figure
FIG_DIR = PROJECT_ROOT.joinpath("figures")
FIG_DIR.mkdir(exist_ok=True)

# `fig` is the matplotlib Figure created for the bar chart above, so it is
# saved directly as a static PNG (this notebook plots with matplotlib rather
# than hvplot).
fig.savefig(
    FIG_DIR.joinpath("cedar_landcover_2024.png"),
    bbox_inches="tight",
    dpi=300,
)

# Store variables
%store PROJECT_ROOT DATA_DIR BOUNDARY_DIR LANDCOVER_DIR FIG_DIR cedar_2003 cedar_3310 witch_2007 witch_3310 ramona_3310 ramona_buffer ramona_buffer_union target_crs NLCD_CLASSES CEDAR_YEARS WITCH_YEARS

Stored 'PROJECT_ROOT' (WindowsPath)
Stored 'DATA_DIR' (WindowsPath)
Stored 'BOUNDARY_DIR' (WindowsPath)
Stored 'LANDCOVER_DIR' (WindowsPath)
Stored 'FIG_DIR' (WindowsPath)
Stored 'cedar_2003' (GeoDataFrame)
Stored 'cedar_3310' (GeoDataFrame)
Stored 'witch_2007' (GeoDataFrame)
Stored 'witch_3310' (GeoDataFrame)
Stored 'ramona_3310' (GeoDataFrame)
Stored 'ramona_buffer' (GeoSeries)
Stored 'ramona_buffer_union' (Polygon)
Stored 'target_crs' (str)
Stored 'NLCD_CLASSES' (dict)
Stored 'CEDAR_YEARS' (dict)
Stored 'WITCH_YEARS' (dict)

Using this notebook

Step 0: Load stored variables

Step 1: Libraries and (if needed) define project paths and directories.

Step 2: Extract the NLCD 2024 GeoTIFF from the downloaded zip file.

Step 3: Open and inspect the NLCD raster

Step 4: Define NLCD class codes and helper functions for summarizing land cover.

Step 5: Clip NLCD 2024 to the Cedar Fire perimeter

Step 6: Visualize land cover composition

Step 7: Save figures

Step 8: Store key variables for use in later land cover and RCMAP notebooks.

Step 0: Load stored variables

Step 1: Import libraries and set up project paths

Step 2: Extract NLCD 2024 GeoTIFF from zip

Step 3: Open and inspect the NLCD 2024 raster

Step 4: Define NLCD class codes and helper functions

Step 5.1: Define fire-year sets for later analysis

Step 5: Clip NLCD 2024 to the Cedar Fire area and summarize land cover

Step 6: Visualize land cover composition in the Cedar Fire area (2024)

Step 8: Store variables for later notebooks

What we learn from NLCD 2024

	class_code	pixel_count	percent	class_name
0	52	1547703	62.441369	Shrub/Scrub
1	22	218128	8.800274	Developed, Low Intensity
2	23	216846	8.748553	Developed, Medium Intensity
3	21	184886	7.459141	Developed, Open Space
4	71	123661	4.989046	Grassland/Herbaceous