DataIntegrationGroup · jirhiker · Jun 12, 2026 · Jun 11, 2026 · Jun 11, 2026 · Jun 11, 2026
diff --git a/.gitignore b/.gitignore
@@ -52,4 +52,7 @@ app.yaml
 docs/
 
 #Codex
-.codex
+.codex
+# Claude Code
+.claude/settings.local.json
+.claude/worktrees/
diff --git a/alembic/versions/u8v9w0x1y2z3_add_ngwmn_views_from_ocotillo_model.py b/alembic/versions/u8v9w0x1y2z3_add_ngwmn_views_from_ocotillo_model.py
@@ -0,0 +1,213 @@
+"""add NGWMN views sourced from the new Ocotillo data model
+
+Replaces the legacy NMA_view_NGWMN_* copy tables as the source for NGWMN
+exports. These views reproduce the original AMPAPI (SQL Server) view
+definitions but read from the new Ocotillo tables:
+
+- NGWMN_WaterLevels:      observation/sample/field_activity/field_event/thing
+- NGWMN_WellConstruction: thing/well_screen/well_casing_material
+- NGWMN_Lithology:        thing_geologic_formation_association/geologic_formation
+
+Revision ID: u8v9w0x1y2z3
+Revises: t6u7v8w9x0y1
+Create Date: 2026-06-11 00:00:00.000000
+"""
+
+from typing import Sequence, Union
+
+from alembic import op
+from sqlalchemy import inspect, text
+
+# revision identifiers, used by Alembic.
+revision: str = "u8v9w0x1y2z3"
+down_revision: Union[str, Sequence[str], None] = "t6u7v8w9x0y1"
+branch_labels: Union[str, Sequence[str], None] = None
+depends_on: Union[str, Sequence[str], None] = None
+
+REQUIRED_TABLES = {
+    "thing",
+    "well_screen",
+    "well_casing_material",
+    "observation",
+    "sample",
+    "field_activity",
+    "field_event",
+    "parameter",
+    "thing_geologic_formation_association",
+    "geologic_formation",
+}
+
+DROP_WATERLEVELS_SQL = 'DROP VIEW IF EXISTS "NGWMN_WaterLevels"'
+DROP_WELLCONSTRUCTION_SQL = 'DROP VIEW IF EXISTS "NGWMN_WellConstruction"'
+DROP_LITHOLOGY_SQL = 'DROP VIEW IF EXISTS "NGWMN_Lithology"'
+
+
+def _create_waterlevels_view() -> str:
+    # Mirrors dbo.view_NGWMN_WaterLevels:
+    #   SELECT PointID, DateMeasured, DepthToWaterBGS, 'ft bgs', CASE
+    #   MeasurementMethod..., CASE DataQuality..., PublicRelease
+    #   FROM WaterLevels WHERE PublicRelease = 1
+    #
+    # The transfer stored observation.value as depth-to-water below the
+    # measuring point (DepthToWater) and measuring_point_height separately,
+    # so DepthToWaterBGS = value - measuring_point_height (0 when no MP
+    # height was recorded).
+    #
+    # observation_datetime was converted to UTC during transfer; rows whose
+    # legacy timestamp had no time component were stored at 00:00 UTC, so
+    # only rows with a real time component are shifted back to local time
+    # before taking the date.
+    #
+    # MeasurementMethod/WLAccuracy reproduce the legacy CASE expressions,
+    # keyed on the lexicon meanings the transfer wrote (LU_MeasurementMethod
+    # and LU_DataQuality), including the legacy quirk mapping code O
+    # ("Observed...") to 'Acoustic Sounder'.
+    return """
+        CREATE VIEW "NGWMN_WaterLevels" AS
+        SELECT
+            t.name AS "PointID",
+            CASE
+                WHEN (o.observation_datetime AT TIME ZONE 'UTC')::time = '00:00:00'
+                THEN (o.observation_datetime AT TIME ZONE 'UTC')::date
+                ELSE (o.observation_datetime AT TIME ZONE 'America/Denver')::date
+            END AS "DateMeasured",
+            o.value - COALESCE(o.measuring_point_height, 0) AS "DepthToWaterBGS",
+            'ft bgs' AS "WLUnits",
+            CASE s.sample_method
+                WHEN 'Steel-tape measurement' THEN 'Steel tape'
+                WHEN 'Electric tape measurement (E-probe)' THEN 'Electric tape'
+                WHEN 'Observed (required for F, N, and W water level status)' THEN 'Acoustic Sounder'
+                WHEN 'Estimated' THEN 'Estimated'
+                WHEN 'Reported, method not known' THEN 'Reported'
+                WHEN 'Pressure-gage measurement' THEN 'Pressure gauge'
+                WHEN 'Unknown (for legacy data only; not for new data entry)' THEN 'Unknown; from legacy data'
+                ELSE NULL
+            END AS "MeasurementMethod",
+            CASE o.nma_data_quality
+                WHEN 'Water level accurate to within two hundreths of a foot' THEN '0.02 ft'
+                WHEN 'Water level accurate to within one foot' THEN '1.0 ft'
+                WHEN 'Water level accuracy not to nearest foot or water level not repeatable' THEN 'Unknown'
+                ELSE NULL
+            END AS "WLAccuracy",
+            TRUE AS "PublicRelease"
+        FROM observation AS o
+        JOIN sample AS s ON s.id = o.sample_id
+        JOIN field_activity AS fa ON fa.id = s.field_activity_id
+        JOIN field_event AS fe ON fe.id = fa.field_event_id
+        JOIN thing AS t ON t.id = fe.thing_id
+        JOIN parameter AS p ON p.id = o.parameter_id
+        WHERE p.parameter_name = 'groundwater level'
+          AND o.release_status = 'public'
+          AND s.release_status = 'public'
+          AND fa.release_status = 'public'
+          AND fe.release_status = 'public'
+          AND t.release_status = 'public'
+    """
+
+
+def _create_wellconstruction_view() -> str:
+    # Mirrors dbo.view_NGWMN_WellConstruction:
+    #   WellData LEFT JOIN WellScreens ON WellData.WellID = WellScreens.WellID
+    # CasingTop is 0 whenever a casing depth exists (casing assumed to start
+    # at ground surface). The legacy free-text CasingDescription was reduced
+    # to controlled material terms during transfer, so it is rebuilt here as
+    # a comma-separated list of well_casing_material terms.
+    return """
+        CREATE VIEW "NGWMN_WellConstruction" AS
+        SELECT
+            t.name AS "PointID",
+            CASE WHEN t.well_casing_depth IS NOT NULL THEN 0::double precision END AS "CasingTop",
+            t.well_casing_depth AS "CasingBottom",
+            CASE WHEN t.well_casing_depth IS NOT NULL THEN 'ft bgs' END AS "CasingDepthUnits",
+            ws.screen_depth_top AS "ScreenTop",
+            ws.screen_depth_bottom AS "ScreenBottom",
+            CASE WHEN ws.screen_depth_bottom IS NOT NULL THEN 'ft bgs' END AS "ScreenBottomUnit",
+            ws.screen_description AS "ScreenDescription",
+            cm.materials AS "CasingDescription"
+        FROM thing AS t
+        LEFT JOIN well_screen AS ws
+            ON ws.thing_id = t.id AND ws.release_status = 'public'
+        LEFT JOIN LATERAL (
+            SELECT string_agg(wcm.material, ', ' ORDER BY wcm.material) AS materials
+            FROM well_casing_material AS wcm
+            WHERE wcm.thing_id = t.id AND wcm.release_status = 'public'
+        ) AS cm ON TRUE
+        WHERE t.thing_type = 'water well'
+          AND t.release_status = 'public'
+    """
+
+
+def _create_lithology_view() -> str:
+    # Mirrors dbo.view_NGWMN_Lithology:
+    #   Stratigraphy INNER JOIN LU_Lithology ON Lithology = ABBREVIATION
+    # The new model keeps the resolved lithology term on geologic_formation
+    # (the abbreviation code was not migrated), so the term backs both the
+    # Lithology and TERM columns. The inner join is reproduced by requiring
+    # a non-null lithology. StratSource was not migrated and is NULL.
+    return """
+        CREATE VIEW "NGWMN_Lithology" AS
+        SELECT
+            tgfa.id AS "OBJECTID",
+            t.name AS "PointID",
+            gf.lithology AS "Lithology",
+            gf.lithology AS "TERM",
+            NULL::character varying AS "StratSource",
+            tgfa.top_depth AS "StratTop",
+            CASE WHEN tgfa.top_depth IS NOT NULL THEN 'ft bgs' END AS "StratTopUnit",
+            tgfa.bottom_depth AS "StratBottom",
+            CASE WHEN tgfa.bottom_depth IS NOT NULL THEN 'ft bgs' END AS "StratBottomUnit"
+        FROM thing_geologic_formation_association AS tgfa
+        JOIN thing AS t ON t.id = tgfa.thing_id
+        JOIN geologic_formation AS gf ON gf.id = tgfa.geologic_formation_id
+        WHERE gf.lithology IS NOT NULL
+          AND tgfa.release_status = 'public'
+          AND t.release_status = 'public'
+    """
+
+
+def upgrade() -> None:
+    bind = op.get_bind()
+    inspector = inspect(bind)
+    existing_tables = set(inspector.get_table_names(schema="public"))
+    missing = REQUIRED_TABLES - existing_tables
+    if missing:
+        raise RuntimeError(
+            "Cannot create NGWMN views. Missing required tables: "
+            f"{', '.join(sorted(missing))}"
+        )
+
+    op.execute(text(DROP_WATERLEVELS_SQL))
+    op.execute(text(_create_waterlevels_view()))
+    op.execute(
+        text(
+            'COMMENT ON VIEW "NGWMN_WaterLevels" IS '
+            "'Public manual groundwater level measurements in the NGWMN "
+            "exchange format, sourced from the Ocotillo observation model.'"
+        )
+    )
+
+    op.execute(text(DROP_WELLCONSTRUCTION_SQL))
+    op.execute(text(_create_wellconstruction_view()))
+    op.execute(
+        text(
+            'COMMENT ON VIEW "NGWMN_WellConstruction" IS '
+            "'Well casing and screen intervals in the NGWMN exchange format, "
+            "sourced from the Ocotillo thing/well_screen model.'"
+        )
+    )
+
+    op.execute(text(DROP_LITHOLOGY_SQL))
+    op.execute(text(_create_lithology_view()))
+    op.execute(
+        text(
+            'COMMENT ON VIEW "NGWMN_Lithology" IS '
+            "'Lithology intervals in the NGWMN exchange format, sourced from "
+            "the Ocotillo geologic formation associations.'"
+        )
+    )
+
+
+def downgrade() -> None:
+    op.execute(text(DROP_LITHOLOGY_SQL))
+    op.execute(text(DROP_WELLCONSTRUCTION_SQL))
+    op.execute(text(DROP_WATERLEVELS_SQL))
diff --git a/alembic/versions/v0w1x2y3z4a5_add_transducer_daily_data_materialized_view.py b/alembic/versions/v0w1x2y3z4a5_add_transducer_daily_data_materialized_view.py
@@ -0,0 +1,116 @@
+"""add transducer daily data materialized view
+
+Aggregates raw transducer observations into one row per well, parameter,
+day, and QC status. This is the new-model replacement for the legacy
+NMA_WaterLevelsContinuous_Pressure_Daily table, which AMPAPI rebuilt
+nightly from the raw continuous pressure record.
+
+Revision ID: v0w1x2y3z4a5
+Revises: u8v9w0x1y2z3
+Create Date: 2026-06-11 00:00:00.000000
+"""
+
+from typing import Sequence, Union
+
+from alembic import op
+from sqlalchemy import inspect, text
+
+# revision identifiers, used by Alembic.
+revision: str = "v0w1x2y3z4a5"
+down_revision: Union[str, Sequence[str], None] = "u8v9w0x1y2z3"
+branch_labels: Union[str, Sequence[str], None] = None
+depends_on: Union[str, Sequence[str], None] = None
+
+REQUIRED_TABLES = {
+    "transducer_observation",
+    "deployment",
+    "thing",
+    "parameter",
+}
+
+DROP_VIEW_SQL = "DROP MATERIALIZED VIEW IF EXISTS transducer_daily_data"
+
+
+def _create_transducer_daily_data_view() -> str:
+    # transducer_observation.value is depth to water in feet below ground
+    # surface (the transfer wrote DepthToWaterBGS directly), so the daily
+    # depth columns need no measuring-point correction.
+    #
+    # The transfer wrote legacy timestamps unshifted (naive local clock
+    # readings stored as UTC), so bucketing on the UTC date preserves the
+    # original measurement dates.
+    #
+    # QC status: the transfer marked QCed rows release_status='public' and
+    # un-reviewed rows 'private', so qced mirrors the legacy QCed flag.
+    return """
+        CREATE MATERIALIZED VIEW transducer_daily_data AS
+        SELECT
+            d.thing_id,
+            t.name AS point_id,
+            tob.parameter_id,
+            p.parameter_name,
+            (tob.observation_datetime AT TIME ZONE 'UTC')::date AS date_measured,
+            (tob.release_status = 'public') AS qced,
+            avg(tob.value) AS depth_to_water_bgs,
+            min(tob.value) AS depth_to_water_bgs_min,
+            max(tob.value) AS depth_to_water_bgs_max,
+            count(*) AS measurement_count,
+            min(tob.observation_datetime) AS first_measurement_at,
+            max(tob.observation_datetime) AS last_measurement_at,
+            avg(tob.nma_waterlevelscontinuous_pressure_temperature_water) AS temperature_water,
+            avg(tob.nma_waterlevelscontinuous_pressure_water_head) AS water_head,
+            avg(tob.nma_waterlevelscontinuous_pressure_water_head_adjusted) AS water_head_adjusted,
+            avg(tob.nma_waterlevelscontinuous_pressure_conddl_ms_cm) AS conddl_ms_cm
+        FROM transducer_observation AS tob
+        JOIN deployment AS d ON d.id = tob.deployment_id
+        JOIN thing AS t ON t.id = d.thing_id
+        JOIN parameter AS p ON p.id = tob.parameter_id
+        GROUP BY
+            d.thing_id,
+            t.name,
+            tob.parameter_id,
+            p.parameter_name,
+            (tob.observation_datetime AT TIME ZONE 'UTC')::date,
+            (tob.release_status = 'public')
+    """
+
+
+def upgrade() -> None:
+    bind = op.get_bind()
+    inspector = inspect(bind)
+    existing_tables = set(inspector.get_table_names(schema="public"))
+    missing = REQUIRED_TABLES - existing_tables
+    if missing:
+        raise RuntimeError(
+            "Cannot create transducer_daily_data. Missing required tables: "
+            f"{', '.join(sorted(missing))}"
+        )
+
+    op.execute(text(DROP_VIEW_SQL))
+    op.execute(text(_create_transducer_daily_data_view()))
+    op.execute(
+        text(
+            "COMMENT ON MATERIALIZED VIEW transducer_daily_data IS "
+            "'Daily aggregates of transducer observations per well, parameter, "
+            "and QC status. Replacement for the legacy "
+            "NMA_WaterLevelsContinuous_Pressure_Daily table. Refresh with "
+            "REFRESH MATERIALIZED VIEW CONCURRENTLY transducer_daily_data.'"
+        )
+    )
+    # Unique index required for REFRESH MATERIALIZED VIEW CONCURRENTLY.
+    op.execute(
+        text(
+            "CREATE UNIQUE INDEX ux_transducer_daily_data_key "
+            "ON transducer_daily_data (thing_id, parameter_id, date_measured, qced)"
+        )
+    )
+    op.execute(
+        text(
+            "CREATE INDEX ix_transducer_daily_data_point_id_date "
+            "ON transducer_daily_data (point_id, date_measured)"
+        )
+    )
+
+
+def downgrade() -> None:
+    op.execute(text(DROP_VIEW_SQL))