UNSW-CEEM · nick-gorman · Apr 23, 2026 · Apr 23, 2026 · Apr 23, 2026 · Dec 6, 2025
diff --git a/.github/workflows/cicd.yml b/.github/workflows/cicd.yml
@@ -1,11 +1,44 @@
 name: Continuous Integration and Deployment
 
 on:
+  pull_request:
+  push:
+    branches: [master, offline-test-suite]   # TEMP: remove `offline-test-suite` before merge — used to bootstrap CI while the pull_request trigger isn't yet on master
   release:
     types: [created]
   workflow_dispatch:
 
 jobs:
+  # Offline test suite — runs on every PR and push to master.
+  # test_performance_stats.py covers `custom_tables` and still hits AEMO
+  # + references local files that aren't in CI. Parked until ported.
+  # Everything else runs against the in-process dummy server from
+  # tests/conftest.py and is fully offline.
+  test:
+    name: Tests (Python ${{ matrix.python-version }}, ${{ matrix.os }})
+    runs-on: ${{ matrix.os }}
+    strategy:
+      fail-fast: false
+      matrix:
+        os: [ubuntu-latest, windows-latest, macos-latest]
+        python-version: ["3.10", "3.11", "3.12", "3.13"]
+    steps:
+      - name: Checkout
+        uses: actions/checkout@v4
+      - name: Install uv
+        uses: astral-sh/setup-uv@v3
+        with:
+          enable-cache: true
+      - name: Set up Python ${{ matrix.python-version }}
+        run: uv python install ${{ matrix.python-version }}
+      - name: Sync dependencies
+        run: uv sync --python ${{ matrix.python-version }}
+      - name: Run tests
+        run: >
+          uv run pytest tests/
+          --ignore=tests/test_performance_stats.py
+          -v
+
   # Publishes to PyPi if tests are passed and release is created
   publish:
     if: github.event_name == 'release' && github.event.action == 'created'

diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md
@@ -51,19 +51,22 @@ Ready to contribute? Here's how to set up `ispypsa` for local development.
     $ git checkout -b name-of-your-bugfix-or-feature
     ```
 
-6. When you're done making changes, check that your changes pass any tests.
-
-    - Configure an environment variable called "NEMOSIS_TEST_CACHE" specifying the location of the raw data cache to use
-      while testing
-    - Run all tests by running `uv run -m unittest discover tests`
-    - Run a subset of tests using the name of the test class or method, for example 
-      `uv run -m unittest discover tests -v -k TestDynamicDataCompilerWithSettlementDateFiltering`
-    - All tests should pass before a PR is considered good to merge into main. However, the tests are very long running
-      so it is best to test on a small subset of tests that are likely to fail, before running the full suite. 
-      Additionally, the full suite should be run twice, once with an empty cache, and then again with cache prefilled.
-    - We acknowledge the testing process is currently a bit cumbersome and slow, any contributions to improve this
-      process are welcomed :)
-    - A bit more info to come on testing once I get them all working again . . . 
+6. When you're done making changes, check that your changes pass the tests:
+
+    ```console
+    $ uv run pytest tests/ \
+        --ignore=tests/test_data_fetch_methods.py \
+        --ignore=tests/test_errors_and_warnings.py \
+        --ignore=tests/test_format_options.py \
+        --ignore=tests/test_performance_stats.py \
+        --ignore=tests/test_processing_info_maps.py
+    ```
+
+    The suite is fully offline and runs in under a minute. The five ignored files are legacy
+    network-hitting tests slated for removal. CI runs the same invocation on every PR.
+
+    For details on how the test suite is structured, how to add tests for new tables, and how
+    fixtures are maintained, see [testing_and_maintenance.md](testing_and_maintenance.md).
 
 7. Commit your changes and open a pull request.
 

diff --git a/pyproject.toml b/pyproject.toml
@@ -16,7 +16,7 @@ dependencies = [
     "openpyxl>=3.1.5",
 ]
 readme = "README.md"
-requires-python = ">= 3.9"
+requires-python = ">= 3.10"
 
 [build-system]
 requires = ["hatchling"]

diff --git a/src/nemosis/defaults.py b/src/nemosis/defaults.py
@@ -1,7 +1,7 @@
 import os
 
 names = {
-    "FCAS Providers": "NEM Registration and Exemption List.xls",
+    "FCAS Providers": "NEM Registration and Exemption List.xlsx",
     "DISPATCHLOAD": "PUBLIC_DVD_DISPATCHLOAD",
     "NEXT_DAY_DISPATCHLOAD": "PUBLIC_NEXT_DAY_DISPATCHLOAD",
     "DUDETAILSUMMARY": "PUBLIC_DVD_DUDETAILSUMMARY",
@@ -22,7 +22,7 @@
     "FCAS_4_SECOND": "FCAS",
     "ELEMENTS_FCAS_4_SECOND": "Elements_FCAS.csv",
     "VARIABLES_FCAS_4_SECOND": "Ancillary Services Market Causer Pays Variables File.csv",
-    "Generators and Scheduled Loads": "NEM Registration and Exemption List.xls",
+    "Generators and Scheduled Loads": "NEM Registration and Exemption List.xlsx",
     "MNSP_INTERCONNECTOR": "PUBLIC_DVD_MNSP_INTERCONNECTOR",
     "MNSP_PEROFFER": "PUBLIC_DVD_MNSP_PEROFFER",
     "INTERCONNECTOR": "PUBLIC_DVD_INTERCONNECTOR",
@@ -133,8 +133,8 @@
 static_table_url = {
     "ELEMENTS_FCAS_4_SECOND": "https://www.nemweb.com.au/Reports/Current/Causer_Pays_Elements/",
     "VARIABLES_FCAS_4_SECOND": "https://aemo.com.au/-/media/files/electricity/nem/settlements_and_payments/settlements/auction-reports/archive/ancillary-services-market-causer-pays-variables-file.csv",
-    "Generators and Scheduled Loads": "https://www.aemo.com.au/-/media/Files/Electricity/NEM/Participant_Information/NEM-Registration-and-Exemption-List.xls",
-    "_downloader.download_xl": "https://www.aemo.com.au/-/media/Files/Electricity/NEM/Participant_Information/NEM-Registration-and-Exemption-List.xls",
+    "Generators and Scheduled Loads": "https://www.aemo.com.au/-/media/files/electricity/nem/Participant_Information/NEM-Registration-and-Exemption-List.xlsx",
+    "_downloader.download_xl": "https://www.aemo.com.au/-/media/files/electricity/nem/Participant_Information/NEM-Registration-and-Exemption-List.xlsx",
 }
 
 aemo_mms_url = "http://www.nemweb.com.au/Data_Archive/Wholesale_Electricity/MMSDM/{}/MMSDM_{}_{}/MMSDM_Historical_Data_SQLLoader/DATA/{}.zip"

diff --git a/testing_and_maintenance.md b/testing_and_maintenance.md
@@ -0,0 +1,224 @@
+# Testing and maintenance
+
+This document covers how the NEMOSIS test suite is structured, how to run it, and how to extend or
+maintain it as AEMO's data formats evolve.
+
+## Overview
+
+The end-to-end suite runs against a local dummy HTTP server (defined in `tests/conftest.py`) that
+serves pre-filtered AEMO data committed to `tests/fixtures/data/`. The server is a bare
+`SimpleHTTPServer` rooted at the fixture tree, which mirrors AEMO's URL paths verbatim — at test
+time NEMOSIS's hostname is swapped for the local server and everything else is real.
+
+The whole suite is fast (under a minute) and network-free.
+
+## Running tests
+
+```console
+$ uv run pytest tests/ --ignore=tests/test_performance_stats.py
+```
+
+`test_performance_stats.py` is the last legacy network-hitting file. It covers the
+`custom_tables` module (VWAP, capacity factors, plant stats) which hasn't been ported offline
+yet — most of its assertions run on synthetic DataFrames and are trivially portable, but a
+few depend on local plant-stats files (`E:\plants_stats_test_data\`) that exist only on one
+developer's machine. CI uses the same invocation (see `.github/workflows/cicd.yml`).
+
+To run a single file:
+
+```console
+$ uv run pytest tests/end_to_end_table_tests/test_dispatch_price.py -v
+```
+
+## Suite layout
+
+```
+tests/
+  conftest.py                      # Dummy HTTP server fixture
+  fixtures/
+    spec.py                        # What to download for each table
+    build.py                       # Downloads + filters + writes fixture files
+    data/                          # Committed fixture tree (mirrors AEMO URLs)
+  end_to_end_table_tests/
+    _boundaries.py                 # Shared boundary-test helper
+    test_<table>.py                # One file per AEMO table
+    DECISIONS.md                   # Internal design notes (transitional)
+  test_filters.py                  # Pure unit tests
+  test_date_generators.py
+  test_query_wrappers.py
+  test_errors.py                   # Argument validation + NoDataToReturn + cache idempotency
+  test_processing_info_maps.py     # Cross-table validation of search_type classification
+  test_performance_stats.py        # Legacy custom_tables tests — ignored in CI
+```
+
+Each test file in `end_to_end_table_tests/` covers one AEMO table. Files start with a module
+docstring explaining the table's shape and which eras the fixture covers.
+
+## The fixture system
+
+`tests/fixtures/data/` is a verbatim mirror of AEMO's URL tree. For example:
+
+```
+http://www.nemweb.com.au/Data_Archive/Wholesale_Electricity/MMSDM/2018/...
+        ↓
+tests/fixtures/data/Data_Archive/Wholesale_Electricity/MMSDM/2018/...
+```
+
+This means the dummy server doesn't need any clever routing — it just serves static files at the
+matching paths.
+
+Fixtures are filtered down (~50× smaller than raw AEMO archives) by:
+
+- **Row filter**: each table keeps only two DUIDs / two REGIONIDs / one INTERCONNECTORID. The
+  selection lives in `tests/fixtures/spec.py` (`DUIDS`, `REGIONS`, etc.).
+- **Time filter**: only the first 3 and last 2 days of each month, controlled by
+  `KEEP_FIRST_DAYS` / `KEEP_LAST_DAYS` in `build.py`.
+- **Section filter** (scrape-pattern files only): for files like `PUBLIC_DAILY` that bundle many
+  logical tables in one CSV, the build script keeps only the section NEMOSIS reads and strips the
+  D-rows from the rest, preserving the I-row markers NEMOSIS counts against.
+
+Total fixture tree: ~12 MB across ~200 files.
+
+## Eras
+
+An era is a single month (or day, for scrape-pattern tables) chosen because it straddles a known
+AEMO format change or sits on a year boundary. Each table's fixture covers one or more eras. The
+full list lives in `tests/fixtures/spec.py::ERAS`:
+
+| Era       | Purpose                                                                   |
+|-----------|---------------------------------------------------------------------------|
+| `2018-05` | Pre-5-min-trading baseline                                                |
+| `2020-01` | Year boundary, pre-5-min, monthly bidding                                 |
+| `2021-02` | Last viable MMS month for bidding before the 3-year gap                   |
+| `2021-05` | First month of the new 5-min NEM and daily bidding layouts                |
+| `2022-01` | Year boundary, 5-min dispatch, 30-min trading legacy                      |
+| `2022-06` | Legacy era (kept to avoid fixture churn — could be retired)               |
+| `2024-09` | First month after `PUBLIC_DVD_` → `PUBLIC_ARCHIVE#` rename                |
+| `2025-01` | Year boundary, `PUBLIC_ARCHIVE#` format, post-bidding-gap                 |
+| `recent`  | Pinned to a date inside AEMO's rolling current-data window                |
+
+The three Jan-1 eras (2020-01, 2022-01, 2025-01) exist primarily for the boundary test matrix —
+year wraps are exercised by anchoring boundary cases on Jan 1.
+
+## The boundary test matrix
+
+`_boundaries.py` generates a parametrised matrix of (era × flavour × time-of-day) cases for every
+dynamic time-series table. Each case asserts entity-set match, exact per-entity row count,
+first/last timestamp, no duplicates, and regular stride.
+
+**Vocabulary:**
+
+- **Era** — a tagged anchor month (e.g. `2021-05`).
+- **T** — time of day for a probe point (e.g. `00:00`, `04:00`, `04:05`).
+- **Stride** — the table's native interval, in minutes (5, 30, etc.).
+- **Boundary** — midnight on day 1 of the era month — the natural fence between fixture files.
+- **Flavour** — how the query window is positioned relative to the boundary:
+  - `at` — 1h forward window starting at T on day 1.
+  - `before` — 1h backward window ending at T on day 1.
+  - `into` — variable window from `last-day-of-prev-month@23:00` to `day1@T`, straddles the
+    boundary at every T.
+
+**Tables not covered by the helper** (with reasons, in `_boundaries.py::_HELPER_DOES_NOT_COVER`):
+
+- `BIDDAYOFFER_D`, `MNSP_DAYOFFER` — daily stride.
+- `BIDPEROFFER_D` — partitioned by AEMO trading day (04:05 → 04:00 next day) not calendar day.
+- `MNSP_PEROFFER` — multi-dimensional rows + known bug (see Known quirks).
+- `DISPATCHCONSTRAINT` — variable per-interval presence.
+
+These tables keep their per-era smoke tests; only the matrix is skipped.
+
+## Adding a test for a new table
+
+1. **Pick eras** the table should cover. Refer to the era table above. Most dynamic time-series
+   tables use the dispatch set: `2018-05`, `2020-01`, `2021-05`, `2022-01`, `2024-09`, `2025-01`
+   (the three Jan-1 eras give year-boundary coverage for the matrix).
+2. **Add the table to `tests/fixtures/spec.py::DYNAMIC_TABLES`** with its filter spec — which
+   eras, which row filter columns and values, which columns to keep, etc.
+3. **Run `uv run python tests/fixtures/build.py`** to download, filter, and write the fixture
+   files into `tests/fixtures/data/`.
+4. **Write `test_<table_lower>.py`** in `tests/end_to_end_table_tests/`, following the style of
+   an existing file. Use the `nemosis_fixture` fixture (from `conftest.py`) to get a fresh cache
+   directory. If the table is suitable for the boundary matrix, parametrise on
+   `boundary_cases("<TABLE_NAME>")` and assert with `assert_boundary_shape(...)`.
+5. **Run** `uv run pytest tests/end_to_end_table_tests/test_<table>.py -v` and iterate.
+
+## Refreshing fixtures
+
+Most fixtures are stable and don't need refreshing — the eras are anchored to historical months
+that AEMO doesn't change. The exception is the `recent` era, which is pinned to a date inside
+AEMO's rolling current-data window (`/Reports/Current/...`). That window only retains the last
+few months of data, so the `recent` fixtures age out periodically.
+
+The committed fixtures keep working indefinitely — staleness only bites when you next try to
+*rebuild* (e.g. adding a new table that uses the `recent` era, or refiltering an existing one).
+At that point AEMO will return 404s for the scrape-pattern tables, which is the signal to refresh.
+
+To refresh:
+
+1. Update `spec.ERAS["recent"]` to a date inside AEMO's current window (within the last ~2
+   months is safe).
+2. Re-run `uv run python tests/fixtures/build.py`.
+3. Commit the updated fixtures.
+
+Tables that use the `recent` era: `DAILY_REGION_SUMMARY`, `NEXT_DAY_DISPATCHLOAD`,
+`INTERMITTENT_GEN_SCADA`.
+
+## Adding a new era
+
+When AEMO changes a data format, add an era to capture the transition:
+
+1. Pick a single month (or a Jan-1 month if you also want year-boundary coverage) that straddles
+   the change.
+2. Add it to `spec.ERAS`.
+3. Add the era key to the affected tables' `eras` lists in `spec.DYNAMIC_TABLES`.
+4. Re-run `uv run python tests/fixtures/build.py` to fetch the new fixtures.
+5. If the format change affects the table's row count, columns, or stride, adjust the test file
+   accordingly (era-parametrise where behaviour differs).
+
+## Known quirks
+
+These have bitten contributors before. Worth a read before adding a test.
+
+- **`filter_cols` must be a subset of `select_columns`** when calling `dynamic_data_compiler`.
+- **`select_columns` for tables wrapped by `drop_duplicates_by_primary_key`** (MNSP_PEROFFER,
+  MNSP_DAYOFFER, the effective-date config tables) must include every column in
+  `defaults.table_primary_keys[table]`, or NEMOSIS errors with a `KeyError` on the missing dedupe
+  columns. SPDCONNECTIONPOINTCONSTRAINT is a particularly easy one to trip on — its primary key
+  includes BIDTYPE.
+- **Prev-month / prev-day buffering** in NEMOSIS's date generator only fires when `start_time`
+  lands on a natural boundary (first of month, midnight). Tests that probe interior points don't
+  see those extra buffer requests.
+- **`filter_on_effective_date` runs before `most_recent_records_before_start_time`** and drops any
+  row with `EFFECTIVEDATE >= end_time`. Effective-date fixture entities therefore need at least
+  one record dated *before* the test's `start_time`, or the test sees an empty frame.
+- **Effective-date config tables** have `search_type = "all"` in NEMOSIS, which by default scans
+  every month from `nem_data_model_start_time` (2009-07) through `end_time` — ~180 HTTP requests
+  per call. Tests narrow this to a single month by monkeypatching
+  `defaults.nem_data_model_start_time` to the era date, and opt out of the build-time time trim
+  via `keep_full_month: True` in `spec.py`.
+- **Year-straddle queries aren't covered.** A true year-boundary crossing for a non-Jan era —
+  e.g. `[2024/08/15, 2025/01/15]` — would exercise `year_and_month_gen`'s `start_year < end_year`
+  branch with many months of iteration. The fixture doesn't include Sep/Oct/Nov 2024, so such
+  queries 404 on intervening months. If a future contributor needs this coverage, extend the
+  fixture to include the intervening months (cost: fixture size) or add a unit test against
+  `year_and_month_gen` directly.
+- **Mid-month queries return empty frames.** The fixture builder keeps only the first 3 and last
+  2 days of each era month (see `KEEP_FIRST_DAYS` / `KEEP_LAST_DAYS` in `build.py`). A test that
+  queries, say, `[2021/05/15, 2021/05/16]` will get back a non-erroring empty DataFrame from every
+  covered table — NEMOSIS's own code path is fine, the fixture just doesn't have those rows. If
+  you're writing a test whose window lands in the kept-days gap, either anchor it to day 1–3 / the
+  last 2 days of the era, or `assert not data.empty` explicitly so the empty case fails loudly
+  rather than sliding past a soft subset check.
+- **`MNSP_PEROFFER` is effectively unreadable past ~April 2021**. AEMO began writing
+  `MNSP_BIDOFFERPERIOD` data into the existing `PUBLIC_DVD_MNSP_PEROFFER_*` archives, then
+  renamed the archive stub outright in Aug-2024. NEMOSIS's defaults know neither transition.
+  Pre-existing bug, tracked in the test file and `spec.py`. `MNSP_DAYOFFER` is unaffected.
+
+## Parked tables
+
+- **FCAS_4_SECOND** — AEMO's Causer Pays archive is empty at every URL NEMOSIS tries (existing
+  upstream issue #64). No fixture, no test.
+- **FCAS_4s_SCADA_MAP** — built by `custom_tables.py::fcas4s_scada_match`, which consumes
+  `FCAS_4_SECOND` values to find lowest-error element↔DUID matches. Blocked on the same upstream
+  outage. A standalone fixture would mean fabricating the 4-second values the algorithm exists to
+  match — no meaningful test.