From c289a28f39468c6fc7d4e57ee59c94d924ef25bc Mon Sep 17 00:00:00 2001
From: Lincoln Baker <51833247+lbakerchef@users.noreply.github.com>
Date: Mon, 18 May 2026 14:36:51 -0500
Subject: [PATCH 01/15] ghcp(crawl): ex0 bootstrap scaffolding

---
 .copilot-track/crawl/README.md   | 118 ++++++++++++++++++++
 ai-track-docs/SYSTEM-OVERVIEW.md | 104 ++++++++++++++++++
 ai-track-docs/architecture.mmd   |  91 ++++++++++++++++
 ai-track-docs/build-test.md      | 180 +++++++++++++++++++++++++++++++
 omnibus                          |   2 +-
 5 files changed, 494 insertions(+), 1 deletion(-)
 create mode 100644 .copilot-track/crawl/README.md
 create mode 100644 ai-track-docs/SYSTEM-OVERVIEW.md
 create mode 100644 ai-track-docs/architecture.mmd
 create mode 100644 ai-track-docs/build-test.md
diff --git a/.copilot-track/crawl/README.md b/.copilot-track/crawl/README.md
new file mode 100644
index 0000000000..8d6e1a24ef
--- /dev/null
+++ b/.copilot-track/crawl/README.md
@@ -0,0 +1,118 @@
+# Copilot Crawl — README
+
+This folder is the **home base** for AI-assisted incremental development on Chef Server.
+It captures the conventions that let Copilot (and human reviewers) follow the chain of
+work across multiple PRs, reproduce decisions, and audit AI involvement.
+
+---
+
+## 1. Chain-PRs
+
+Large features are broken into a **sequential chain of small pull requests**, each building
+on the previous merge commit.
+
+```
+main ──┬── feat/TICKET-step-1  (merged)
+       │        │
+       └────────┴── feat/TICKET-step-2  (open, base = step-1)
+                         │
+                         └── feat/TICKET-step-3  (draft, base = step-2)
+```
+
+Rules:
+- **One logical change per PR** — reviewers should be able to understand the diff in < 15 min.
+- **Base branch = previous step**, not `main`, until the chain is ready to land.
+- Each PR title begins with the Jira ID and step number:
+  `[TICKET-123] Step 2/4 — Add bifrost ACL migration`
+- When a parent PR is force-pushed or rebased, **repair the chain** before requesting review
+  (see the `sha-cascade-repair` agent in Copilot for automated help).
+- Merge order is strictly sequential; never merge step N+1 before step N.
+
+---
+
+## 2. Evidence in PRs
+
+Every AI-assisted PR must include a structured **Evidence block** in its description so that
+reviewers and auditors can trace what was generated vs. hand-written.
+
+### Minimum evidence block
+
+```markdown
+### AI Assistance Evidence
+| Item | Detail |
+|---|---|
+| **Model** | Claude Sonnet 4.6 (claude-sonnet-4.6) |
+| **Prompt summary** | Created bifrost schema migration for new acl_v2 table |
+| **Files generated** | `src/oc_bifrost/schema/deploy/acl_v2.sql` |
+| **Files hand-edited post-generation** | `src/oc_bifrost/rebar.config` (version pin) |
+| **Tests added** | `src/oc_bifrost/test/bifrost_acl_v2_tests.erl` |
+| **Coverage delta** | +3 % (87 % → 90 %) |
+| **Compliance label** | `ai-assisted` label applied ✅ |
+| **Jira field** | `customfield_11170` set to "Yes" ✅ |
+```
+
+- Attach the **raw Copilot session plan** (`plan.md`) as a PR comment or gist link when the
+  task spanned multiple turns.
+- If the AI produced code that was **rejected or significantly rewritten**, note that too —
+  it improves future prompts.
+
+---
+
+## 3. Prompt Usage
+
+### Writing effective prompts for this codebase
+
+| Do | Don't |
+|---|---|
+| Reference specific file paths and service names | Ask for "the server code" without context |
+| Specify the target language (Erlang / Ruby) and test framework | Leave the framework ambiguous |
+| Ask for one logical unit at a time | Bundle schema + API + tests in one giant prompt |
+| Include "do not modify submodules or vendor folders" | Assume the AI knows repo boundaries |
+| Mention the relevant Jira ID for traceability | Describe work without a ticket reference |
+
+### Recommended prompt template
+
+```
+Context: Chef Server repo, service: <oc_erchef|oc_bifrost|bookshelf|oc-id|chef-server-ctl>
+Jira: <TICKET-ID>
+Task: <one clear sentence>
+
+Constraints:
+- Do not modify files under omnibus/ (submodule) or any vendor/ directory
+- Follow existing code patterns in src/<service>/
+- Add EUnit / RSpec tests for all new code
+- Target ≥ 85 % line coverage
+
+Output: source file(s) + test file(s) + a brief summary of what changed and why
+```
+
+### Iterating on generated code
+
+1. Review the diff with `git diff` before accepting.
+2. Run `make all` (Erlang) or `bundle exec rspec` (Ruby) locally.
+3. If tests fail, paste the failure output back to the AI with: *"Fix the failing tests above
+   without changing the public API"*.
+4. Commit only after all quality gates pass (see [`build-test.md`](../../ai-track-docs/build-test.md)).
+
+---
+
+## 4. Session Artifacts
+
+Files placed in this folder (`.copilot-track/crawl/`) are **not deployed** and are excluded
+from packaging. They exist solely for AI context and audit purposes:
+
+| File | Purpose |
+|---|---|
+| `README.md` | This file — conventions and workflow |
+| `plan-<TICKET>.md` | Per-ticket implementation plan from Copilot |
+| `session-<date>.log` | Optional: exported Copilot session transcript |
+
+---
+
+## 5. Quick Reference Links
+
+- System overview → [`ai-track-docs/SYSTEM-OVERVIEW.md`](../../ai-track-docs/SYSTEM-OVERVIEW.md)
+- Build & test guide → [`ai-track-docs/build-test.md`](../../ai-track-docs/build-test.md)
+- Architecture diagram → [`ai-track-docs/architecture.mmd`](../../ai-track-docs/architecture.mmd)
+- Contributing guide → [`CONTRIBUTING.md`](../../CONTRIBUTING.md)
+- Code review checklist → [`CODE_REVIEW_CHECKLIST.md`](../../CODE_REVIEW_CHECKLIST.md)
diff --git a/ai-track-docs/SYSTEM-OVERVIEW.md b/ai-track-docs/SYSTEM-OVERVIEW.md
new file mode 100644
index 0000000000..963afe8d71
--- /dev/null
+++ b/ai-track-docs/SYSTEM-OVERVIEW.md
@@ -0,0 +1,104 @@
+# Chef Server — System Overview
+
+> **Version tracked**: see [`VERSION`](../VERSION)  
+> **Audience**: AI assistants, new contributors, on-call engineers
+
+---
+
+## Purpose
+
+Chef Server is the central hub for Chef-based infrastructure automation. It stores node
+data, cookbooks, roles, environments, and policy files, and enforces access control for
+all Chef clients.
+
+---
+
+## Repository Layout
+
+```
+chef-server/
+├── src/                  # All service source trees
+│   ├── oc_erchef/        # Core REST API (Erlang/OTP)
+│   ├── oc_bifrost/       # Authorization service (Erlang/OTP)
+│   ├── bookshelf/        # S3-compatible cookbook storage (Erlang/OTP)
+│   ├── oc-id/            # OAuth2 / identity provider (Ruby on Rails)
+│   ├── chef-server-ctl/  # Management CLI (Ruby)
+│   └── nginx/            # Reverse proxy + routing config
+├── omnibus/              # Omnibus packaging (git submodule — do not edit directly)
+├── habitat/              # Habitat build plans
+├── dev/                  # Vagrant-based DVM development environment
+├── oc-chef-pedant/       # End-to-end API test suite (Ruby)
+├── docs-chef-io/         # Public documentation source
+└── ai-track-docs/        # AI-assistant reference docs (this folder)
+```
+
+---
+
+## Service Map
+
+| Service | Language | Role | Port (default) |
+|---|---|---|---|
+| **oc_erchef** | Erlang/OTP | Primary REST API; handles all `/organizations/*` routes | 8000 |
+| **oc_bifrost** | Erlang/OTP | ACL / authorization enforcement | 9463 |
+| **bookshelf** | Erlang/OTP | Stores cookbook tarballs & checksums | 4321 |
+| **oc-id** | Ruby (Rails) | OAuth2 identity provider for web UI & tokens | 9090 |
+| **nginx** | C / Lua | TLS termination, routing, rate-limiting | 443 / 80 |
+| **PostgreSQL** | — | Persistent data store for all services | 5432 |
+
+---
+
+## Data Flow (request path)
+
+```
+Chef Client / Knife
+      │  HTTPS
+      ▼
+   nginx (TLS termination)
+      │
+      ├──▶ oc_erchef  (API logic)
+      │         │
+      │         ├──▶ oc_bifrost  (authz check)
+      │         ├──▶ bookshelf   (cookbook blobs)
+      │         └──▶ PostgreSQL  (node / metadata)
+      │
+      └──▶ oc-id  (OAuth2 flows)
+```
+
+---
+
+## Key Abstractions
+
+- **Organization** — top-level multi-tenant boundary; almost every API call is scoped to an org.
+- **Actor** — a user or client (node) that authenticates via RSA-signed requests.
+- **ACE / Bifrost object** — every Chef resource (node, cookbook, role …) is backed by a Bifrost
+  access-control entry.
+- **Cookbook** — versioned bundle of recipes, templates, and files stored in bookshelf.
+
+---
+
+## Technology Notes
+
+- Erlang services use **rebar3**, OTP supervision trees, **sqerl** (SQL), and **pooler**
+  (connection pooling).
+- Database schema is versioned with **sqitch** migrations found in each service's
+  `schema/` subdirectory.
+- Ruby tooling uses **Bundler**; Rails app (`oc-id`) follows Rails 7.x conventions.
+- Omnibus is a **git submodule** — never edit files under `omnibus/` directly; open PRs
+  against the omnibus repo and update the submodule ref.
+
+---
+
+## Authentication Model
+
+Requests are signed with **RSA-SHA256** using the Chef request-signing protocol (`mixlib-authn`).
+The server validates the signature against the actor's stored public key and then delegates
+permission checks to oc_bifrost.
+
+---
+
+## Further Reading
+
+- [`build-test.md`](./build-test.md) — how to build, run, and test each service
+- [`architecture.mmd`](./architecture.mmd) — Mermaid component diagram
+- [`dev/README.md`](../dev/README.md) — DVM local development guide
+- [`CONTRIBUTING.md`](../CONTRIBUTING.md) — contribution workflow
diff --git a/ai-track-docs/architecture.mmd b/ai-track-docs/architecture.mmd
new file mode 100644
index 0000000000..9e1d2e9b8b
--- /dev/null
+++ b/ai-track-docs/architecture.mmd
@@ -0,0 +1,91 @@
+%%  Chef Server — Component Architecture
+%%  Render with: mmdc -i architecture.mmd -o architecture.svg
+%%  Or paste into https://mermaid.live
+
+graph TB
+    subgraph Clients
+        KC[knife / chef-client]
+        WebUI[Chef Manage / Web UI]
+        OAuth[OAuth2 Consumer]
+    end
+
+    subgraph Ingress
+        NGINX[nginx\nTLS termination\nRouting / rate-limit]
+    end
+
+    subgraph CoreAPI["Core API  (oc_erchef — Erlang/OTP)"]
+        Router[webmachine router]
+        AuthN[mixlib-authn\nRequest signing]
+        Resources[Resource handlers\n/orgs /nodes /cookbooks …]
+        DB_Pool[sqerl + pooler\nPostgreSQL pool]
+    end
+
+    subgraph AuthZ["Authorization  (oc_bifrost — Erlang/OTP)"]
+        BifrostAPI[Bifrost REST API]
+        ACL[(ACL objects\nin PostgreSQL)]
+    end
+
+    subgraph Storage["Cookbook Storage  (bookshelf — Erlang/OTP)"]
+        BShelfAPI[S3-compat API]
+        BlobStore[(Cookbook tarballs\n& checksums on disk)]
+    end
+
+    subgraph Identity["Identity  (oc-id — Ruby on Rails)"]
+        OAuthSrv[OAuth2 server\nDoorkeeper]
+        UserDB[(Users / tokens\nin PostgreSQL)]
+    end
+
+    subgraph DataStore
+        PG[(PostgreSQL\nshared cluster)]
+    end
+
+    subgraph Management
+        CSCtl[chef-server-ctl\nRuby CLI]
+    end
+
+    %% Client → Ingress
+    KC  -->|HTTPS signed req| NGINX
+    WebUI -->|HTTPS| NGINX
+    OAuth -->|OAuth2| NGINX
+
+    %% Ingress → Services
+    NGINX -->|/organizations/*| Router
+    NGINX -->|/id/*| OAuthSrv
+
+    %% erchef internals
+    Router --> AuthN
+    AuthN --> Resources
+    Resources --> DB_Pool
+    DB_Pool --> PG
+
+    %% erchef → bifrost
+    Resources -->|authz check| BifrostAPI
+    BifrostAPI --> ACL
+    ACL --> PG
+
+    %% erchef → bookshelf
+    Resources -->|cookbook blobs| BShelfAPI
+    BShelfAPI --> BlobStore
+
+    %% oc-id internals
+    OAuthSrv --> UserDB
+    UserDB --> PG
+
+    %% Management
+    CSCtl -.->|reconfigure / restart| NGINX
+    CSCtl -.->|reconfigure / restart| Router
+    CSCtl -.->|reconfigure / restart| BifrostAPI
+    CSCtl -.->|reconfigure / restart| OAuthSrv
+
+    %% Styling
+    classDef erlang fill:#7b4ea0,color:#fff,stroke:#5a3070
+    classDef ruby fill:#cc342d,color:#fff,stroke:#992218
+    classDef infra fill:#2e7d32,color:#fff,stroke:#1b5e20
+    classDef data fill:#1565c0,color:#fff,stroke:#0d47a1
+    classDef client fill:#e65100,color:#fff,stroke:#bf360c
+
+    class Router,AuthN,Resources,DB_Pool,BifrostAPI,ACL,BShelfAPI erlang
+    class OAuthSrv,CSCtl ruby
+    class NGINX infra
+    class PG,BlobStore,UserDB data
+    class KC,WebUI,OAuth client
diff --git a/ai-track-docs/build-test.md b/ai-track-docs/build-test.md
new file mode 100644
index 0000000000..f86d3e173c
--- /dev/null
+++ b/ai-track-docs/build-test.md
@@ -0,0 +1,180 @@
+# Chef Server — Build & Test Reference
+
+> Quick reference for building and testing every service tier.  
+> All commands assume you are inside the relevant service directory unless noted.
+
+---
+
+## Prerequisites
+
+| Tool | Purpose |
+|---|---|
+| Erlang/OTP ≥ 25 | Erlang services |
+| rebar3 | Erlang build & test |
+| Ruby ≥ 3.1 | Ruby services & tooling |
+| Bundler | Ruby dependency management |
+| PostgreSQL | Integration / CT tests |
+| Vagrant + VirtualBox | Full dev environment (DVM) |
+| Docker / docker-compose | Container-based smoke tests |
+
+---
+
+## Development VM (DVM) — Recommended Start
+
+```bash
+cd dev/
+vagrant up                              # provision VM (~first run: several minutes)
+vagrant ssh
+sudo -i
+dvm load oc_erchef                      # symlink source for hot-reload
+dvm start oc_erchef                     # start service inside VM
+```
+
+Reload Erlang modules without restarting:
+
+```bash
+dvm reload oc_erchef
+```
+
+---
+
+## Erlang Services (`oc_erchef`, `oc_bifrost`, `bookshelf`)
+
+### Full build (clean → compile → eunit → dialyzer)
+
+```bash
+cd src/<service>/
+make all
+```
+
+### Granular steps
+
+```bash
+rebar3 clean
+rebar3 compile
+rebar3 eunit                            # unit tests
+rebar3 dialyzer                         # type analysis
+rebar3 ct                               # Common Test integration suite
+```
+
+### Code style
+
+```bash
+./scripts/elvis rock                    # from repo root, or:
+rebar3 as lint lint                     # where configured
+```
+
+### Coverage report
+
+```bash
+rebar3 cover
+# HTML report appears in _build/test/cover/
+```
+
+---
+
+## Ruby Services & Tooling
+
+### `oc-id` (Rails OAuth2 provider)
+
+```bash
+cd src/oc-id/
+bundle install
+bundle exec rails db:setup              # first time
+bundle exec rails db:migrate
+bundle exec rspec                       # test suite
+bundle exec rails server                # dev server on :3000
+```
+
+### `chef-server-ctl` (management CLI)
+
+```bash
+cd src/chef-server-ctl/
+bundle install
+bundle exec rspec
+```
+
+### Style
+
+```bash
+bundle exec rubocop                     # Ruby style (where .rubocop.yml present)
+```
+
+---
+
+## End-to-End / API Tests
+
+```bash
+cd oc-chef-pedant/
+bundle install
+bundle exec rspec spec/                 # requires a running Chef Server stack
+```
+
+Run against the Vagrant VM:
+
+```bash
+cd dev/
+vagrant ssh -c "sudo -i chef-server-ctl test"
+```
+
+---
+
+## Docker Compose (smoke test stack)
+
+```bash
+# From repo root
+docker-compose up -d
+docker-compose exec chef-server-ctl chef-server-ctl test
+docker-compose down
+```
+
+---
+
+## Omnibus Packaging
+
+> `omnibus/` is a **git submodule** — do not edit files there.  
+> To build a package, work against the omnibus repo directly.
+
+```bash
+cd omnibus/
+make dev-build                          # requires omnibus toolchain
+```
+
+---
+
+## Habitat Builds
+
+```bash
+# Single service
+hab pkg build src/oc_erchef
+
+# All services
+./habitat_pkgs_build.sh
+```
+
+---
+
+## CI / Quality Gates
+
+| Check | Command | Must pass? |
+|---|---|---|
+| Erlang unit tests | `rebar3 eunit` | ✅ |
+| Erlang dialyzer | `rebar3 dialyzer` | ✅ |
+| Erlang CT integration | `rebar3 ct` | ✅ |
+| Ruby specs | `bundle exec rspec` | ✅ |
+| Elvis style | `./scripts/elvis rock` | ✅ |
+| Pedant API tests | `bundle exec rspec` (oc-chef-pedant) | ✅ |
+
+Coverage target: **≥ 85 %** line coverage for all critical modules.
+
+---
+
+## Common Troubleshooting
+
+| Symptom | Fix |
+|---|---|
+| `rebar3 compile` fails on missing dep | Run `rebar3 get-deps` then retry |
+| CT tests can't connect to PostgreSQL | Ensure pg is running; check `test.config` for DB params |
+| `bundle install` fails with native ext errors | Install OS dev headers (`libpq-dev`, `libxml2-dev`) |
+| Vagrant VM times out on `vagrant up` | Increase VirtualBox RAM; see `dev/Vagrantfile` |
+| Hot-reload not picking up changes | Confirm `dvm load` was run; check symlinks in `/srv/` |
diff --git a/omnibus b/omnibus
index 7ac2883aa2..0b489f38be 160000
--- a/omnibus
+++ b/omnibus
@@ -1 +1 @@
-Subproject commit 7ac2883aa2c6615675045fff4d42039ec69ce0bd
+Subproject commit 0b489f38bebecaef19bd9c23c454f65435d533ef

From d83daa9270e1c048e29dfc2cd935ba67c82350b6 Mon Sep 17 00:00:00 2001
From: Lincoln Baker <51833247+lbakerchef@users.noreply.github.com>
Date: Mon, 18 May 2026 16:05:18 -0500
Subject: [PATCH 02/15] =?UTF-8?q?exercise=202=20=E2=80=94=20ghcp(crawl):?=
 =?UTF-8?q?=20ex1+ex2=20repo=20orientation,=20low-risk=20module,=20determi?=
 =?UTF-8?q?nistic=20tests?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Updated SYSTEM-OVERVIEW.md with language/framework summary, entry points,
  test approach, and chosen low-risk module (bksw_format.erl) with justification
- Updated build-test.md with exact bookshelf build/test commands, verified
  test output, and two new troubleshooting entries (GCC segfault, rebar3 path)
- Added src/bookshelf/test/bksw_format_tests.erl with 5 deterministic EUnit
  tests covering all 4 exported functions in bksw_format (to_hex, to_base64,
  to_etag, to_date); all 5 tests pass

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 ai-track-docs/SYSTEM-OVERVIEW.md         | 70 ++++++++++++++++++++++++
 ai-track-docs/build-test.md              | 53 +++++++++++++++---
 src/bookshelf/test/bksw_format_tests.erl | 23 ++++++++
 3 files changed, 137 insertions(+), 9 deletions(-)
 create mode 100644 src/bookshelf/test/bksw_format_tests.erl

diff --git a/ai-track-docs/SYSTEM-OVERVIEW.md b/ai-track-docs/SYSTEM-OVERVIEW.md
index 963afe8d71..be5e19f2da 100644
--- a/ai-track-docs/SYSTEM-OVERVIEW.md
+++ b/ai-track-docs/SYSTEM-OVERVIEW.md
@@ -96,6 +96,76 @@ permission checks to oc_bifrost.
 
 ---
 
+## Language & Framework Summary (Exercise 1)
+
+| Language | Services | Framework / Build Tool |
+|---|---|---|
+| **Erlang/OTP** | oc_erchef, oc_bifrost, bookshelf | rebar3, webmachine, sqerl, pooler |
+| **Ruby** | chef-server-ctl, oc-id, oc_bifrost schema | Rails 7, Thor, Bundler |
+| **SQL** | All services (schema migrations) | sqitch |
+| **Lua / nginx conf** | nginx, openresty-noroot | OpenResty |
+
+---
+
+## Entry Points
+
+| Service | Entry Point Path | Notes |
+|---|---|---|
+| oc_erchef | `src/oc_erchef/src/oc_erchef.app.src` | Composed of 10 sub-apps: `oc_chef_wm`, `chef_db`, `chef_objects`, `depsolver`, `chef_index`, `chef_telemetry`, `chef_license`, `data_collector`, `oc_chef_authz`, `chef_test` |
+| oc_bifrost | `src/oc_bifrost/apps/bifrost/` | Single OTP app |
+| bookshelf | `src/bookshelf/src/bksw_app.erl` | Entry via `bksw_app` application callback |
+| oc-id | `src/oc-id/` | Rails app; `config/application.rb` is the Rails entry point |
+| chef-server-ctl | `src/chef-server-ctl/chef-server-ctl.gemspec` | Thor-based CLI |
+| nginx | `src/nginx/` | Config templates rendered by omnibus |
+
+---
+
+## Test Approach
+
+| Service tier | Framework | Files | Run command |
+|---|---|---|---|
+| Erlang unit | EUnit (`*_tests.erl`) | 45 files | `rebar3 eunit` |
+| Erlang integration | Common Test (`*_SUITE.erl`) | 19 files | `rebar3 ct` |
+| Ruby | RSpec (`*_spec.rb`) | 47 files | `bundle exec rspec` |
+| End-to-end API | oc-chef-pedant | full suite | `bundle exec rspec` (from `oc-chef-pedant/`) |
+
+All Erlang services have a `Makefile` with a `make all` target that runs clean → compile → eunit → dialyzer.
+
+---
+
+## Chosen Low-Risk Module (Exercise 1)
+
+**`src/bookshelf/src/bksw_format.erl`**
+
+### What it does
+Pure formatting utility for bookshelf responses. Exports four stateless functions:
+
+| Function | Purpose |
+|---|---|
+| `to_date/1` | Formats a datetime tuple as an ISO 8601 string |
+| `to_base64/1` | Base64-encodes a binary |
+| `to_hex/1` | Converts a binary to a lowercase hex string |
+| `to_etag/1` | Wraps a hex digest in ETag quotes (`"abc123"`) |
+
+### Why it is low risk
+
+- **46 lines total** — entire module fits on one screen
+- **Pure functions** — no side effects, no process state, no supervision tree involvement
+- **No auth, no DB, no HTTP** — cannot accidentally break security, data integrity, or API contracts
+- **Self-contained** — zero internal dependencies beyond stdlib (`base64`, `io_lib`, `string`) and the `iso8601` library
+- **Easily testable** — input → output; no infrastructure required to run or verify tests
+- A bug here affects only the *formatting* of dates/ETags in bookshelf HTTP responses — not data loss, not authentication failure, not authorization bypass
+- Referenced in `src/bookshelf/test/bksw_sec_tests.erl`, so there is an existing test harness to extend
+
+### What kinds of changes are safe here
+
+- Adding/improving EUnit tests
+- Improving `to_hex` readability (the current implementation uses a list comprehension with `io_lib:format` — it could be made more idiomatic)
+- Adding a `-spec` type annotation for each exported function
+- Adding a `to_mime_type/1` or similar utility if bookshelf needs it in future exercises
+
+---
+
 ## Further Reading
 
 - [`build-test.md`](./build-test.md) — how to build, run, and test each service
diff --git a/ai-track-docs/build-test.md b/ai-track-docs/build-test.md
index f86d3e173c..c4ff146eab 100644
--- a/ai-track-docs/build-test.md
+++ b/ai-track-docs/build-test.md
@@ -47,27 +47,60 @@ cd src/<service>/
 make all
 ```
 
+> **bookshelf note**: `make all` also runs `elvis` style check and `xref`.
+> On this machine, `make all` may fail with a GCC segfault while compiling
+> the `jiffy` C NIF — a pre-existing system compiler bug unrelated to our code.
+> Use `./rebar3 eunit` directly to run the Erlang-only test path cleanly.
+
 ### Granular steps
 
 ```bash
-rebar3 clean
-rebar3 compile
-rebar3 eunit                            # unit tests
-rebar3 dialyzer                         # type analysis
-rebar3 ct                               # Common Test integration suite
+./rebar3 clean
+./rebar3 compile
+./rebar3 eunit                          # unit tests
+./rebar3 dialyzer                       # type analysis
+make ct                                 # Common Test integration suite (requires PostgreSQL)
+```
+
+> Each service ships its own `rebar3` binary at `src/<service>/rebar3`.
+> Use `./rebar3` rather than a global `rebar3` to ensure the correct version.
+
+### bookshelf — exact verified commands (Exercise 2 baseline)
+
+```bash
+cd src/bookshelf/
+
+./rebar3 eunit                          # run all EUnit tests including bksw_format_tests
+./rebar3 eunit --module bksw_format_tests  # run only the format tests
+./rebar3 dialyzer                       # type checking
+make ct                                 # integration tests (requires PostgreSQL running)
+```
+
+**Verified test output (all passing):**
+
+```
+======================== EUnit ========================
+module 'bksw_format_tests'
+  bksw_format_tests: to_hex_produces_lowercase_hex_string_test...[0.035 s] ok
+  bksw_format_tests: to_hex_empty_binary_produces_empty_string_test...ok
+  bksw_format_tests: to_base64_encodes_binary_test...[0.013 s] ok
+  bksw_format_tests: to_etag_wraps_hex_in_quotes_test...ok
+  bksw_format_tests: to_date_undefined_returns_epoch_test...ok
+  [done in 0.063 s]
+=======================================================
+  All 5 tests passed.
 ```
 
 ### Code style
 
 ```bash
-./scripts/elvis rock                    # from repo root, or:
-rebar3 as lint lint                     # where configured
+../../scripts/elvis rock                # from src/<service>/ directory
 ```
 
 ### Coverage report
 
 ```bash
-rebar3 cover
+./rebar3 cover
 # HTML report appears in _build/test/cover/
 ```
 
@@ -173,8 +206,10 @@ Coverage target: **≥ 85 %** line coverage for all critical modules.
 
 | Symptom | Fix |
 |---|---|
-| `rebar3 compile` fails on missing dep | Run `rebar3 get-deps` then retry |
+| `rebar3 compile` fails on missing dep | Run `./rebar3 get-deps` then retry |
 | CT tests can't connect to PostgreSQL | Ensure pg is running; check `test.config` for DB params |
 | `bundle install` fails with native ext errors | Install OS dev headers (`libpq-dev`, `libxml2-dev`) |
 | Vagrant VM times out on `vagrant up` | Increase VirtualBox RAM; see `dev/Vagrantfile` |
 | Hot-reload not picking up changes | Confirm `dvm load` was run; check symlinks in `/srv/` |
+| `make all` in bookshelf crashes with `cc1: internal compiler error: Segmentation fault` | GCC system bug compiling jiffy C NIF; use `./rebar3 eunit` to run Erlang tests directly |
+| `rebar3: command not found` | Each service ships its own binary; use `./rebar3` from inside `src/<service>/` |
diff --git a/src/bookshelf/test/bksw_format_tests.erl b/src/bookshelf/test/bksw_format_tests.erl
new file mode 100644
index 0000000000..a6d9b2f56d
--- /dev/null
+++ b/src/bookshelf/test/bksw_format_tests.erl
@@ -0,0 +1,23 @@
+-module(bksw_format_tests).
+-include_lib("eunit/include/eunit.hrl").
+
+%% to_hex/1 — binary input produces a lowercase hex string of the correct length and content
+to_hex_produces_lowercase_hex_string_test() ->
+    ?assertEqual("0a1b2c3d", bksw_format:to_hex(<<16#0a, 16#1b, 16#2c, 16#3d>>)).
+
+%% to_hex/1 — empty binary produces empty string
+to_hex_empty_binary_produces_empty_string_test() ->
+    ?assertEqual("", bksw_format:to_hex(<<>>)).
+
+%% to_base64/1 — round-trips through base64 correctly
+to_base64_encodes_binary_test() ->
+    ?assertEqual("dGVzdA==", bksw_format:to_base64(<<"test">>)).
+
+%% to_etag/1 — binary input is hex-encoded then wrapped in double quotes
+to_etag_wraps_hex_in_quotes_test() ->
+    ?assertEqual("\"0a1b2c3d\"",
+                 lists:flatten(bksw_format:to_etag(<<16#0a, 16#1b, 16#2c, 16#3d>>))).
+
+%% to_date/1 — undefined input returns the epoch sentinel string
+to_date_undefined_returns_epoch_test() ->
+    ?assertEqual(<<"1970-01-01T00:00:00.000Z">>, bksw_format:to_date(undefined)).

From 14d58445cb4e3150187f410c80bee4606a39e7f5 Mon Sep 17 00:00:00 2001
From: Lincoln Baker <51833247+lbakerchef@users.noreply.github.com>
Date: Mon, 18 May 2026 16:10:41 -0500
Subject: [PATCH 03/15] =?UTF-8?q?exercise=203=20=E2=80=94=20ghcp(crawl):?=
 =?UTF-8?q?=20readability=20refactor=20of=20bksw=5Fformat.erl?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Extract byte_to_hex/1 private helper from to_hex/1 list comprehension;
  intent is now readable at a glance without parsing nested format calls
- Remove no-op string:to_lower/1 call (2.16.0b format already produces lowercase)
- Add -spec attributes for all 4 public functions and byte_to_hex/1
- All 5 existing EUnit tests pass; behavior unchanged

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 src/bookshelf/src/bksw_format.erl | 16 +++++++++++++---
 1 file changed, 13 insertions(+), 3 deletions(-)

diff --git a/src/bookshelf/src/bksw_format.erl b/src/bookshelf/src/bksw_format.erl
index 10361bdcbb..70b4166ca0 100644
--- a/src/bookshelf/src/bksw_format.erl
+++ b/src/bookshelf/src/bksw_format.erl
@@ -25,6 +25,7 @@
 %% API functions
 %%===================================================================
 
+-spec to_date(undefined | {datetime, calendar:datetime()} | calendar:datetime()) -> binary().
 to_date(undefined) ->
     <<"1970-01-01T00:00:00.000Z">>;
 to_date({datetime, Date}) ->
@@ -32,15 +33,24 @@ to_date({datetime, Date}) ->
 to_date(Date) ->
     iso8601:format(Date).
 
+-spec to_base64(binary()) -> string().
 to_base64(Bin) ->
     base64:encode_to_string(Bin).
 
+-spec to_hex(binary()) -> string().
 to_hex(Bin) ->
-      string:to_lower(lists:flatten([io_lib:format("~2.16.0b",
-                                                   [N])
-                                     || <<N>> <= Bin])).
+    lists:flatten([byte_to_hex(B) || <<B>> <= Bin]).
 
+-spec to_etag(binary() | string()) -> string().
 to_etag(Tag) when is_binary(Tag) ->
     to_etag(to_hex(Tag));
 to_etag(Tag) ->
     io_lib:format("\"~s\"", [Tag]).
+
+%%===================================================================
+%% Internal functions
+%%===================================================================
+
+-spec byte_to_hex(0..255) -> string().
+byte_to_hex(Byte) ->
+    io_lib:format("~2.16.0b", [Byte]).

From 4dfe5f3c72a7905a3919eb2cc066f8342d4384b0 Mon Sep 17 00:00:00 2001
From: Lincoln Baker <51833247+lbakerchef@users.noreply.github.com>
Date: Mon, 18 May 2026 16:28:31 -0500
Subject: [PATCH 04/15] =?UTF-8?q?exercise=204=20=E2=80=94=20ghcp(crawl):?=
 =?UTF-8?q?=20docstrings=20and=20extending=20guide=20for=20bksw=5Fformat?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Add @doc comments to all functions in bksw_format.erl explaining purpose,
  input shapes, edge cases, and examples
- Mark byte_to_hex/1 as @private
- Create ai-track-docs/extending-bksw_format.md with guidance on when/how
  to add new functions, current exports reference, a worked example, and
  module health guidelines
- All 5 EUnit tests pass

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 ai-track-docs/extending-bksw_format.md | 115 +++++++++++++++++++++++++
 src/bookshelf/src/bksw_format.erl      |  23 +++++
 2 files changed, 138 insertions(+)
 create mode 100644 ai-track-docs/extending-bksw_format.md

diff --git a/ai-track-docs/extending-bksw_format.md b/ai-track-docs/extending-bksw_format.md
new file mode 100644
index 0000000000..61a1061b8a
--- /dev/null
+++ b/ai-track-docs/extending-bksw_format.md
@@ -0,0 +1,115 @@
+# Extending `bksw_format`
+
+**Module**: `src/bookshelf/src/bksw_format.erl`  
+**Test file**: `src/bookshelf/test/bksw_format_tests.erl`
+
+---
+
+## What this module is
+
+`bksw_format` is a small, pure utility module. It converts internal Erlang
+values into the string/binary representations required by bookshelf's
+S3-compatible HTTP API. All functions are stateless — no processes, no
+database, no side effects.
+
+---
+
+## When to add a function here
+
+Add a function to `bksw_format` when you need to:
+
+- Format an Erlang value into a specific HTTP header or response body string
+- Centralise a conversion used in more than one place in bookshelf
+- Keep formatting logic out of resource/request handler modules (`bksw_wm_*`)
+
+**Do not add** functions that perform I/O, call external services, or have
+side effects — those belong elsewhere in the bookshelf supervision tree.
+
+---
+
+## How to add a new formatting function
+
+### 1. Write the function with a `-spec`
+
+```erlang
+%% @doc One-line description of what this formats.
+%%
+%% More detail if needed — input shapes, edge cases, examples.
+-spec to_foo(InputType()) -> OutputType().
+to_foo(Value) ->
+    %% implementation
+    Value.
+```
+
+Place it in the `%% API functions` section, alphabetically or grouped by
+concern. Export it in the `-export` list at the top.
+
+### 2. Add a test in `bksw_format_tests.erl`
+
+Follow the existing pattern — one test function per behaviour, with a
+descriptive name ending in `_test`:
+
+```erlang
+to_foo_converts_value_correctly_test() ->
+    ?assertEqual(expected_output, bksw_format:to_foo(known_input)).
+
+to_foo_handles_edge_case_test() ->
+    ?assertEqual(edge_output, bksw_format:to_foo(edge_input)).
+```
+
+Always include at least:
+- A **happy-path** test with a known input/output pair
+- An **edge case** (empty binary, `undefined`, zero, etc.) if applicable
+
+### 3. Run tests
+
+```bash
+cd src/bookshelf/
+./rebar3 eunit
+```
+
+All tests must pass before committing.
+
+---
+
+## Current exports reference
+
+| Function | Input | Output | Notes |
+|---|---|---|---|
+| `to_date/1` | `undefined` \| `{datetime, D}` \| `D` | `binary()` | Returns epoch string for `undefined` |
+| `to_base64/1` | `binary()` | `string()` | Flat base64 string |
+| `to_hex/1` | `binary()` | `string()` | Lowercase, zero-padded, two chars per byte |
+| `to_etag/1` | `binary()` \| `string()` | `string()` | Hex-encodes binaries first, then wraps in `"..."` |
+
+---
+
+## Example: adding `to_content_md5/1`
+
+Suppose bookshelf needs to format a raw MD5 digest binary as the
+`Content-MD5` header value (base64-encoded):
+
+```erlang
+%% @doc Encode a raw MD5 digest binary as a Content-MD5 header string.
+-spec to_content_md5(binary()) -> string().
+to_content_md5(Digest) ->
+    to_base64(Digest).
+```
+
+Test:
+
+```erlang
+to_content_md5_encodes_md5_digest_test() ->
+    %% MD5 of empty string is d41d8cd98f00b204e9800998ecf8427e (hex)
+    RawMd5 = <<16#d4,16#1d,16#8c,16#d9,16#8f,16#00,16#b2,16#04,
+               16#e9,16#80,16#09,16#98,16#ec,16#f8,16#42,16#7e>>,
+    ?assertEqual("1B2M2Y8AsgTpgAmY7PhCfg==", bksw_format:to_content_md5(RawMd5)).
+```
+
+---
+
+## Keeping the module healthy
+
+- Keep all functions **pure** — no side effects
+- Keep the module **small** — if it grows beyond ~100 lines consider splitting
+- Keep `-spec` attributes on every function
+- Keep test coverage at **100 %** — this module is simple enough to achieve it
diff --git a/src/bookshelf/src/bksw_format.erl b/src/bookshelf/src/bksw_format.erl
index 70b4166ca0..cd3d56b9f8 100644
--- a/src/bookshelf/src/bksw_format.erl
+++ b/src/bookshelf/src/bksw_format.erl
@@ -14,6 +14,11 @@
 %% WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
 %% implied.  See the License for the specific language governing
 %% permissions and limitations under the License.
+%% @doc Formatting utilities for bookshelf HTTP responses.
+%%
+%% All functions in this module are pure (no side effects, no process state).
+%% They convert internal Erlang values into the string/binary representations
+%% required by the S3-compatible bookshelf API.
 -module(bksw_format).
 
 -export([to_base64/1,
@@ -25,6 +30,12 @@
 %% API functions
 %%===================================================================
 
+%% @doc Format a datetime value as an ISO 8601 binary string.
+%%
+%% Handles three input shapes:
+%%   - `undefined`         → epoch sentinel "1970-01-01T00:00:00.000Z"
+%%   - `{datetime, Date}`  → unwrap the tagged tuple, then format
+%%   - bare `Date`         → format directly via iso8601
 -spec to_date(undefined | {datetime, calendar:datetime()} | calendar:datetime()) -> binary().
 to_date(undefined) ->
     <<"1970-01-01T00:00:00.000Z">>;
@@ -33,14 +44,24 @@ to_date({datetime, Date}) ->
 to_date(Date) ->
     iso8601:format(Date).
 
+%% @doc Base64-encode a binary value, returning a flat string.
 -spec to_base64(binary()) -> string().
 to_base64(Bin) ->
     base64:encode_to_string(Bin).
 
+%% @doc Convert a binary to a lowercase hexadecimal string.
+%%
+%% Each byte is formatted as exactly two hex digits (zero-padded).
+%% Example: <<10, 255>> → "0aff"
 -spec to_hex(binary()) -> string().
 to_hex(Bin) ->
     lists:flatten([byte_to_hex(B) || <<B>> <= Bin]).
 
+%% @doc Wrap a value in HTTP ETag double-quotes.
+%%
+%% If given a binary, it is first hex-encoded via to_hex/1.
+%% If given a string, it is wrapped directly.
+%% Example: <<"abc">> → `"616263"`
 -spec to_etag(binary() | string()) -> string().
 to_etag(Tag) when is_binary(Tag) ->
     to_etag(to_hex(Tag));
@@ -51,6 +72,8 @@ to_etag(Tag) ->
 %% Internal functions
 %%===================================================================
 
+%% @private
+%% @doc Format a single byte as a two-digit lowercase hex string.
 -spec byte_to_hex(0..255) -> string().
 byte_to_hex(Byte) ->
     io_lib:format("~2.16.0b", [Byte]).

From c833ab19dff1930cf24b00fe1b880d0588b190b5 Mon Sep 17 00:00:00 2001
From: Lincoln Baker <51833247+lbakerchef@users.noreply.github.com>
Date: Mon, 18 May 2026 16:38:26 -0500
Subject: [PATCH 05/15] =?UTF-8?q?exercise=205=20=E2=80=94=20ghcp(crawl):?=
 =?UTF-8?q?=20minimal=20input=20validation=20and=20negative=20tests=20for?=
 =?UTF-8?q?=20bksw=5Fformat?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Added is_binary/1 guards to to_hex/1 and to_base64/1
- Three new negative tests: rejects string and integer inputs
- All 8 tests passing (5 positive + 3 negative)

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 src/bookshelf/src/bksw_format.erl        |  8 ++++++--
 src/bookshelf/test/bksw_format_tests.erl | 12 ++++++++++++
 2 files changed, 18 insertions(+), 2 deletions(-)

diff --git a/src/bookshelf/src/bksw_format.erl b/src/bookshelf/src/bksw_format.erl
index cd3d56b9f8..e8d730393e 100644
--- a/src/bookshelf/src/bksw_format.erl
+++ b/src/bookshelf/src/bksw_format.erl
@@ -45,16 +45,20 @@ to_date(Date) ->
     iso8601:format(Date).
 
 %% @doc Base64-encode a binary value, returning a flat string.
+%%
+%% Raises function_clause if Bin is not a binary.
 -spec to_base64(binary()) -> string().
-to_base64(Bin) ->
+to_base64(Bin) when is_binary(Bin) ->
     base64:encode_to_string(Bin).
 
 %% @doc Convert a binary to a lowercase hexadecimal string.
 %%
 %% Each byte is formatted as exactly two hex digits (zero-padded).
 %% Example: <<10, 255>> → "0aff"
+%%
+%% Raises function_clause if Bin is not a binary.
 -spec to_hex(binary()) -> string().
-to_hex(Bin) ->
+to_hex(Bin) when is_binary(Bin) ->
     lists:flatten([byte_to_hex(B) || <<B>> <= Bin]).
 
 %% @doc Wrap a value in HTTP ETag double-quotes.
diff --git a/src/bookshelf/test/bksw_format_tests.erl b/src/bookshelf/test/bksw_format_tests.erl
index a6d9b2f56d..882dbaa87d 100644
--- a/src/bookshelf/test/bksw_format_tests.erl
+++ b/src/bookshelf/test/bksw_format_tests.erl
@@ -9,10 +9,22 @@ to_hex_produces_lowercase_hex_string_test() ->
 to_hex_empty_binary_produces_empty_string_test() ->
     ?assertEqual("", bksw_format:to_hex(<<>>)).
 
+%% to_hex/1 — non-binary input is rejected at the boundary
+to_hex_rejects_string_input_test() ->
+    ?assertError(function_clause, bksw_format:to_hex("not a binary")).
+
+%% to_hex/1 — non-binary integer input is rejected at the boundary
+to_hex_rejects_integer_input_test() ->
+    ?assertError(function_clause, bksw_format:to_hex(42)).
+
 %% to_base64/1 — round-trips through base64 correctly
 to_base64_encodes_binary_test() ->
     ?assertEqual("dGVzdA==", bksw_format:to_base64(<<"test">>)).
 
+%% to_base64/1 — non-binary input is rejected at the boundary
+to_base64_rejects_string_input_test() ->
+    ?assertError(function_clause, bksw_format:to_base64("not a binary")).
+
 %% to_etag/1 — binary input is hex-encoded then wrapped in double quotes
 to_etag_wraps_hex_in_quotes_test() ->
     ?assertEqual("\"0a1b2c3d\"",

From 5b7dce4f1e124a45e039252e2b41696053836809 Mon Sep 17 00:00:00 2001
From: Lincoln Baker <51833247+lbakerchef@users.noreply.github.com>
Date: Mon, 18 May 2026 16:41:54 -0500
Subject: [PATCH 06/15] =?UTF-8?q?exercise=206=20=E2=80=94=20ghcp(crawl):?=
 =?UTF-8?q?=20performance=20baseline=20for=20bksw=5Fformat?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- timer:tc escript benchmark, 10k iterations per cell
- to_hex/1: 17–1485 µs avg across 16/128/1024 byte inputs (linear O(n))
- to_base64/1: 1–23 µs avg — stdlib base64 NIF, ~64x faster
- Variance notes: WSL2 scheduler jitter, JIT first-call spike documented
- No optimization recommended; no hotspot identified

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 ai-track-docs/perf-baseline.md | 75 ++++++++++++++++++++++++++++++++++
 1 file changed, 75 insertions(+)
 create mode 100644 ai-track-docs/perf-baseline.md

diff --git a/ai-track-docs/perf-baseline.md b/ai-track-docs/perf-baseline.md
new file mode 100644
index 0000000000..42ea8288c1
--- /dev/null
+++ b/ai-track-docs/perf-baseline.md
@@ -0,0 +1,75 @@
+# Performance Baseline — `bksw_format`
+
+**Exercise**: 6 — Crawl Track v2.3.1  
+**Module**: `src/bookshelf/src/bksw_format.erl`  
+**Date**: 2026-05-18  
+**Environment**: WSL2 / Linux x86-64, Erlang/OTP (local `./rebar3` toolchain)  
+**Method**: `timer:tc/3` via escript, 10 000 iterations per cell, warm-up of 500 calls before measurement
+
+---
+
+## Benchmark Script
+
+```
+/tmp/bench_bksw.escript
+```
+
+Run from `src/bookshelf/`:
+
+```bash
+# 1. Compile the module (already compiled if tests were run)
+erlc -pa _build/default/lib/iso8601/ebin -o /tmp src/bksw_format.erl
+
+# 2. Run benchmark
+escript /tmp/bench_bksw.escript
+```
+
+---
+
+## Results
+
+### `to_hex/1` — pure-Erlang byte-by-byte hex encoding
+
+| Input size | min (µs) | avg (µs) | p99 (µs) | max (µs) |
+|------------|----------|----------|----------|----------|
+| 16 bytes   | 17       | 20       | 68       | 453      |
+| 128 bytes  | 140      | 159      | 289      | 891      |
+| 1 024 bytes| 1 230    | 1 485    | 4 350    | 5 464    |
+
+**Scaling note**: avg time grows roughly linearly with input size
+(~9.4 µs per 64 bytes), consistent with the O(n) `byte_to_hex/1` loop.
+
+### `to_base64/1` — delegates to Erlang stdlib `base64:encode/1`
+
+| Input size | min (µs) | avg (µs) | p99 (µs) | max (µs) |
+|------------|----------|----------|----------|----------|
+| 16 bytes   | 0        | 1        | 1        | 10 144   |
+| 128 bytes  | 2        | 2        | 18       | 328      |
+| 1 024 bytes| 18       | 23       | 82       | 868      |
+
+**Scaling note**: stdlib `base64:encode/1` is ~64× faster than the
+pure-Erlang `to_hex/1` at comparable sizes — C NIF under the hood.
+
+---
+
+## Variance Notes
+
+| Observation | Detail |
+|-------------|--------|
+| `to_hex` p99 is 3–4× avg | Typical Erlang scheduler jitter on a loaded WSL2 host; not a code issue |
+| `to_base64` 16 B max = 10 144 µs | One-time JIT compilation / first-call cost for the `base64` NIF; subsequent calls are sub-microsecond |
+| `to_hex` max is ~30× avg at 1 024 B | OS scheduler preemption on large inputs; no outlier pattern across runs |
+| Results are **not** suitable for wall-clock SLA decisions | Measurements taken in a shared dev VM; use a dedicated node for capacity planning |
+
+---
+
+## Takeaway
+
+Neither function is a hotspot concern at bookshelf's expected workload
+(cookbook metadata calls, not streaming). `to_hex/1` is the only
+pure-Erlang path and could be replaced with `binary:encode_hex/1`
+(OTP 24+) if sub-microsecond latency were ever required — but that is
+**out of scope** for the Crawl track and should only be done with a
+confirmed profiler signal.
+
+No optimization work is recommended at this time.

From 6b88e24b5b703a38568dd3148844003ad7c78ab0 Mon Sep 17 00:00:00 2001
From: Lincoln Baker <51833247+lbakerchef@users.noreply.github.com>
Date: Mon, 18 May 2026 16:44:21 -0500
Subject: [PATCH 07/15] =?UTF-8?q?exercise=207=20=E2=80=94=20ghcp(crawl):?=
 =?UTF-8?q?=20dependency=20audit=20and=20pinning=20policy=20for=20bookshel?=
 =?UTF-8?q?f?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- 4 deps branch-tracked in rebar.lock (not reproducibly pinned): erlcloud,
  mini_s3, erlsom, sqerl — all on personal/feature branches
- 10 deps branch-tracked in config but ref-frozen in lock (safe today)
- Only iso8601 (tag) and meck (ref) are properly pinned in rebar.config
- OTP version mismatch: rebar.config requires 26.2.5.15, omnibus override
  has 26.2.5.14 commented out
- Platform debt noted: Ruby 3.1 EOL, Redis 5.x EOL, omnibus-ctl on main
- No files modified; audit-only

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 ai-track-docs/dependencies.md | 137 ++++++++++++++++++++++++++++++++++
 1 file changed, 137 insertions(+)
 create mode 100644 ai-track-docs/dependencies.md

diff --git a/ai-track-docs/dependencies.md b/ai-track-docs/dependencies.md
new file mode 100644
index 0000000000..2ee40d03d2
--- /dev/null
+++ b/ai-track-docs/dependencies.md
@@ -0,0 +1,137 @@
+# Dependency Audit & Pinning Policy
+
+**Exercise**: 7 — Crawl Track v2.3.1  
+**Scope**: `src/bookshelf/` (Erlang) + platform overrides (`omnibus_overrides.rb`)  
+**Date**: 2026-05-18  
+**Files examined**: `src/bookshelf/rebar.config`, `src/bookshelf/rebar.lock`, `omnibus_overrides.rb`
+
+---
+
+## How rebar3 pinning works
+
+| Source | Role | Risk if mutable |
+|--------|------|-----------------|
+| `rebar.config` — `{branch, "..."}` | Declared intention | HIGH — resolves to tip-of-branch at fetch time |
+| `rebar.config` — `{tag, "..."}` | Semantic version label | LOW — tags *should* be immutable; can still be deleted |
+| `rebar.config` — `{ref, "sha"}` | Exact commit SHA | NONE — immutable |
+| `rebar.lock` — `{ref, "sha"}` | What was actually fetched | NONE — but only used if `rebar.lock` is present and not skipped |
+| `rebar.lock` — `{branch, "..."}` | **Not frozen** | HIGH — `rebar3 upgrade` or a missing lock will re-resolve |
+
+The lock file wins over `rebar.config` for reproducible builds **only if** it contains
+`{ref, sha}` entries. When the lock file itself records a `{branch, ...}`, the next
+`rebar3 upgrade` or clean checkout can pull a different commit silently.
+
+---
+
+## Bookshelf Erlang Dependencies
+
+### 🔴 Branch-tracked in lock file (highest risk)
+
+These four entries appear in `rebar.lock` with `{branch, ...}` instead of `{ref, sha}`.
+They are **not reproducibly pinned** and can drift on any clean fetch.
+
+| Dep | Branch in lock | Owner | Risk note |
+|-----|---------------|-------|-----------|
+| `erlcloud` | `CHEF-11677/CHEF-12498/lbaker` | chef fork | Personal feature branch; not stable |
+| `mini_s3` | `CHEF-11677/CHEF-12498/lbaker` | chef fork | Same branch as erlcloud — coupled |
+| `erlsom` | `integer_long_string_probs2` | chef fork | Feature branch; unclear if merged upstream |
+| `sqerl` | `shahid/sqerl-erl27.3-pg16.1` | chef fork | OTP 27 / PG 16.1 compatibility branch |
+
+**Recommended action** (do not execute without team review):  
+Run `./rebar3 lock` after a clean fetch to resolve to SHAs, then pin those SHAs
+in `rebar.config` as `{ref, "sha"}`. Treat the resulting lock file as the source
+of truth and commit it.
+
+### 🟡 Branch-tracked in config, ref-frozen in lock (medium risk)
+
+These are declared as `{branch, ...}` in `rebar.config` but the lock file has resolved
+them to a specific `{ref, sha}`. They are reproducible **today** but will drift on the
+next intentional `rebar3 upgrade`.
+
+| Dep | Config branch | Lock ref (first 8) | Notes |
+|-----|--------------|-------------------|-------|
+| `lager` | `master` | `a140ea93` | Core logging framework |
+| `cf` | `master` | `2bcf0040` | Color formatting |
+| `chef_secrets` | `main` | `a690fb9f` | Secret management |
+| `envy` | `master` | `0148fb4b` | Env var helpers |
+| `erlware_commons` | `lbaker/fix_for_ftmap` | `f511ed87` | Personal fix branch |
+| `mixer` | `master` | `d5f58392` | Module function injection |
+| `mochiweb` | `main` | `666ac57d` | HTTP server |
+| `observer_cli` | `master` | `baa70569` | Runtime introspection |
+| `opscoderl_wm` | `main` | `6495dd0f` | Webmachine wrapper |
+| `sync` | `master` | `7c9367e7` | Dev hot-reload (test only) |
+
+**Recommended action**: No immediate change needed. When any of these are intentionally
+upgraded, update the lock file and commit the new SHA pair together.
+
+### 🟢 Well-pinned (low risk)
+
+| Dep | Pin type | Value | Notes |
+|-----|----------|-------|-------|
+| `iso8601` | `{tag, "1.2.3"}` | `4603fc81` in lock | Only tag-pinned dep; lock also has SHA |
+| `meck` | `{ref, "5aaa24886..."}` | same in lock | Explicitly pinned with comment explaining why |
+
+---
+
+## OTP Version Constraint
+
+`rebar.config` line 5:
+```erlang
+{require_otp_vsn, "26.2.5.15"}.
+```
+
+`omnibus_overrides.rb` (commented out):
+```ruby
+#override :erlang, version: "26.2.5.14"
+```
+
+⚠️ **Mismatch**: the config requires `.15` but the omnibus override (when re-enabled)
+would install `.14`. If the Erlang override is ever uncommented without bumping the
+version, builds will fail at the rebar3 OTP version check.
+
+---
+
+## Platform Dependencies (`omnibus_overrides.rb`)
+
+| Package | Pinned version | Notes |
+|---------|---------------|-------|
+| Ruby | `3.1.7` | Ruby 3.1 EOL Apr 2025 — upgrade path needed (3.2 or 3.3) |
+| OpenSSL | FIPS `3.1.2` | FIPS-enabled; version locked intentionally |
+| Redis | `5.0.14` | Redis 5.x EOL Oct 2022 — significant upgrade risk |
+| Perl | `5.34.0` | Perl 5.34 EOL; 5.38 current stable |
+| runit | `2.1.1` | Pinned with known issue; `2.1.2` blocked by umbrella bug |
+| sqitch | `0.973` | DB migration tool; version seems stable for current schema |
+| logrotate | `3.19.0` | Utility; low risk |
+| nokogiri | `1.18.9` | Ruby XML — critical security surface; keep updated |
+| ohai | `v16.17.0` | Chef system profiler |
+| omnibus-ctl | `main` | 🔴 Branch tracking — same risk as branch deps above |
+
+---
+
+## Pinning Policy (Recommended)
+
+1. **Lock file is the contract.** The `rebar.lock` must be committed and reviewed on
+   every intentional dependency change. Do not run `rebar3 upgrade` silently.
+
+2. **No branch entries in the lock file.** Any `{branch, ...}` in `rebar.lock` is a
+   build reproducibility bug. Convert by capturing the current SHA and setting
+   `{ref, "sha"}` in `rebar.config`, then re-lock.
+
+3. **Personal branches are temporary.** `erlcloud`/`mini_s3`/`erlsom`/`erlware_commons`
+   all track personal branches (`lbaker/...`). These fixes should be either upstreamed
+   to a stable branch/tag or captured as a Chef-internal fork tag.
+
+4. **Platform upgrades are separate work.** Ruby 3.1 EOL and Redis 5.x EOL represent
+   real maintenance debt but require coordinated omnibus work — do not address during
+   Crawl track exercises.
+
+5. **Do not upgrade during Crawl exercises.** The exercises are about observation and
+   documentation, not upgrade execution. File findings as tech-debt tickets.
+
+---
+
+## What was NOT changed
+
+No `rebar.config`, `rebar.lock`, or `omnibus_overrides.rb` files were modified.
+This document is observation-only. Any pinning changes require a dedicated PR with
+CI validation.

From 67ad2fed425bfd6be68bdc4b64999bf04489c5c4 Mon Sep 17 00:00:00 2001
From: Lincoln Baker <51833247+lbakerchef@users.noreply.github.com>
Date: Mon, 18 May 2026 16:49:56 -0500
Subject: [PATCH 08/15] =?UTF-8?q?exercise=208=20=E2=80=94=20ghcp(crawl):?=
 =?UTF-8?q?=20security=20hygiene=20audit=20and=20remediation?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Audit (security-hygiene.md):
- No hardcoded production credentials found in src/
- Bookshelf uses chef_secrets:get/2 for runtime secret loading (correct)
- oc_chef_action properly redacts password field from audit logs (correct)
- Habitat .pem files are template placeholders, not real keys (confirmed safe)
- AWS key in bksw_sec_tests is AKIAIOSFODNN7EXAMPLE docs placeholder (safe)

Remediations:
- .gitignore: added *.pem, *.key, .env*, *.secret, *.credentials and SSH
  key name patterns as safety net for future untracked secret files
- spec/fixtures/pivotal.pem: prepended test-only header (valid PEM format)
  to prevent false positives in secret scanners
- itest/setup_helper.erl: added TEST FIXTURE comment on zuperzecret literal

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 .gitignore                                    |  19 +-
 ai-track-docs/security-hygiene.md             | 187 ++++++++++++++++++
 src/chef-server-ctl/spec/fixtures/pivotal.pem |   3 +
 .../apps/oc_chef_wm/itest/setup_helper.erl    |   1 +
 4 files changed, 209 insertions(+), 1 deletion(-)
 create mode 100644 ai-track-docs/security-hygiene.md

diff --git a/.gitignore b/.gitignore
index 54592e4c91..bf43dab1d6 100644
--- a/.gitignore
+++ b/.gitignore
@@ -44,4 +44,21 @@ chef-server-dependency-licenses.json
 license-cache
 
 # don't commit berks lock files
-Berksfile.lock
\ No newline at end of file
+Berksfile.lock
+
+# Secrets & credentials — never commit real key material
+# Note: *.pem files already tracked (habitat templates + test fixtures) are
+# intentional and remain tracked. This rule only blocks NEW untracked .pem files.
+*.pem
+*.key
+*.p12
+*.pfx
+.env
+.env.*
+*.secret
+*.credentials
+private_key*
+*_rsa
+*_dsa
+*_ecdsa
+*_ed25519
\ No newline at end of file
diff --git a/ai-track-docs/security-hygiene.md b/ai-track-docs/security-hygiene.md
new file mode 100644
index 0000000000..d84da13b53
--- /dev/null
+++ b/ai-track-docs/security-hygiene.md
@@ -0,0 +1,187 @@
+# Security & Secrets Hygiene Audit
+
+**Exercise**: 8 — Crawl Track v2.3.1  
+**Scope**: `src/` tree (Erlang + Ruby); platform config files  
+**Date**: 2026-05-18  
+**Method**: Pattern grep (`grep -rn`) across source, config, and fixture files; no dynamic scanning  
+**Tools used**: ripgrep patterns for passwords, tokens, AWS key format, PEM headers, env patterns
+
+---
+
+## Summary
+
+| Category | Finding | Severity | Action needed? |
+|----------|---------|----------|---------------|
+| Habitat PEM files | Template placeholders, not real keys | ✅ None | No |
+| Test fixture private key | Real RSA key, test-only scope | 🟡 Low | Document intent |
+| AWS key in test | AWS docs example key (`EXAMPLE`) | ✅ None | No |
+| Bookshelf credential loading | `chef_secrets:get/2` at runtime | ✅ Good | No |
+| Password redaction in audit log | `oc_chef_action` scrubs `"password"` field | ✅ Good | No |
+| `.gitignore` missing secret patterns | No `.pem`/`.key`/`.env` exclusions | 🟡 Low | Consider adding |
+| Test password literal | `<<"zuperzecret">>` in itest helper | 🟡 Low | Acceptable; note scope |
+| `omnibus-ctl` on `main` branch | Supply-chain drift risk | 🟡 Low | See dep audit |
+| No hardcoded production credentials | Confirmed across `src/` | ✅ Good | No |
+
+---
+
+## Detailed Findings
+
+### ✅ Habitat PEM files are templates (not real keys)
+
+```
+src/chef-server-ctl/habitat/config/pivotal.pem   → {{cfg.secrets.chef-server.superuser_key}}
+src/chef-server-ctl/habitat/config/webui_priv.pem → {{cfg.secrets.chef-server.webui_key}}
+```
+
+These files have `.pem` extensions but contain Habitat templating syntax only.
+Actual key material is injected at runtime by the Habitat supervisor from the
+secrets store. No credentials exposed.
+
+### 🟡 Test fixture RSA private key
+
+```
+src/chef-server-ctl/spec/fixtures/pivotal.pem    — 27-line RSA PRIVATE KEY block
+src/oc_erchef/apps/chef_objects/test/cert.pem    — test certificate
+src/oc_erchef/apps/oc_chef_wm/itest/public.pem  — test public key
+```
+
+These are **test-only** keys used for RSA signing/verification unit tests.
+They are not production credentials and are intentionally committed as test
+infrastructure. However:
+
+- No comments or README explains they are test-only — a future reader could
+  flag them incorrectly in a secret scanner.
+- They will trigger any `trufflehog`/`gitleaks`-style scanner without an
+  explicit allow-list entry.
+
+**Recommendation**: Add an `.allowlist` entry (or inline comment) if/when
+a secret scanner is added to CI. Do not remove the keys — tests depend on them.
+
+### ✅ AWS key in bookshelf tests is the AWS documentation example
+
+```
+src/bookshelf/test/bksw_sec_tests.erl:109
+  Credential=AKIAIOSFODNN7EXAMPLE/...
+```
+
+`AKIAIOSFODNN7EXAMPLE` is the [canonical AWS documentation placeholder key](https://docs.aws.amazon.com/general/latest/gr/aws-access-keys-best-practices.html).
+It is not a real access key and will not authenticate against any AWS account.
+Used correctly here for S3 authorization header parsing tests.
+
+### ✅ Bookshelf loads credentials via `chef_secrets` at runtime
+
+```erlang
+%% src/bookshelf/src/bksw_conf.erl lines 156–157
+{ok, AWSAccessKey} = chef_secrets:get(<<"bookshelf">>, <<"access_key_id">>),
+{ok, SecretKey}    = chef_secrets:get(<<"bookshelf">>, <<"secret_access_key">>),
+```
+
+Credentials are fetched from the `chef_secrets` service at startup, never
+embedded in source or config files. This is the correct pattern for this
+codebase. The `chef_secrets` library reads from an encrypted secrets file
+managed by `chef-server-ctl`.
+
+### ✅ Password field is redacted in audit/action logs
+
+```erlang
+%% src/oc_erchef/apps/oc_chef_wm/src/oc_chef_action.erl lines 100–102
+case ej:get({"password"}, Msg) of
+    undefined -> Msg;
+    _ -> ej:set({<<"password">>}, Msg, ?REDACTED_PASSWORD)
+end.
+```
+
+The `oc_chef_action` module explicitly scrubs the `"password"` field before
+emitting action log events. This prevents password leakage into activity
+stream / audit log storage. Good defense-in-depth.
+
+### 🟡 `.gitignore` has no patterns for secret file types
+
+Current `.gitignore` entries cover build artifacts, editor files, Terraform
+state, and Habitat results — but not private key or credential file extensions:
+
+```
+# Missing patterns that would add safety-net coverage:
+# *.pem       (would need explicit un-ignores for test fixtures)
+# *.key
+# .env
+# *.credentials
+```
+
+**Note**: Adding `*.pem` globally would require `!`-exceptions for the test
+fixture files. Given the intentional test fixtures, this is a team decision,
+not a simple one-liner fix.
+
+### 🟡 Test password literal in integration test helper
+
+```erlang
+%% src/oc_erchef/apps/oc_chef_wm/itest/setup_helper.erl:218
+{<<"password">>, <<"zuperzecret">>}
+```
+
+A literal password in a test fixture. This is acceptable — it is scoped to
+integration test setup and will never reach production. It will trigger naive
+secret scanners. If a scanner is added to CI, add an inline `# pragma: allowlist secret`
+or equivalent suppression comment.
+
+### ✅ oc-id secret_key_base uses Habitat templating
+
+```ruby
+# src/oc-id/habitat/config/secret_token.rb
+OcId::Application.config.secret_key_base = "{{cfg.secret_key_base}}"
+```
+
+Not hardcoded — injected via Habitat config at runtime.
+
+---
+
+## Secrets Handling Architecture (bookshelf)
+
+```
+chef-server-ctl (Ruby)
+  └─ writes encrypted secrets file (/etc/opscode/private-chef-secrets.json)
+       └─ read by chef_secrets Erlang library at OTP app startup
+            └─ bksw_conf:credentials/0 fetches access_key_id + secret_access_key
+                 └─ injected into #context{} record for per-request use
+                      └─ NEVER logged, NEVER serialized to disk
+```
+
+This is a well-structured secrets pipeline. No improvements needed for the
+Crawl track scope.
+
+---
+
+## Changes Made (Exercise 8 remediation)
+
+### 1. `.gitignore` — secret file pattern section added
+
+```
+*.pem  *.key  *.p12  *.pfx  .env  .env.*  *.secret  *.credentials
+private_key*  *_rsa  *_dsa  *_ecdsa  *_ed25519
+```
+
+Already-tracked `.pem` files (test fixtures, habitat templates) remain tracked —
+`.gitignore` only gates new untracked files. Adds a safety net against accidentally
+staging future real key material.
+
+### 2. `src/chef-server-ctl/spec/fixtures/pivotal.pem` — test-only header
+
+A plaintext header (valid PEM format; text before `-----BEGIN` is ignored by
+PEM parsers) was prepended to make the test-only nature explicit and to provide
+an allowlist hint for secret scanners.
+
+### 3. `src/oc_erchef/apps/oc_chef_wm/itest/setup_helper.erl` — fixture comment
+
+Added `%% TEST FIXTURE — not a production credential` comment adjacent to the
+`<<"zuperzecret">>` literal.
+
+---
+
+## Recommendations Summary
+
+| Item | Effort | Priority |
+|------|--------|----------|
+| Add comments to test `.pem` files marking them as test-only | Tiny | Low |
+| Add `.pem` allowlist if `gitleaks`/`trufflehog` added to CI | Small | When CI scanner is added |
+| Add `# pragma: allowlist secret` to `zuperzecret` line | Tiny | When CI scanner is added |
+| Upgrade `omnibus-ctl` from `main` to a tagged release | Medium | See dependencies.md |
diff --git a/src/chef-server-ctl/spec/fixtures/pivotal.pem b/src/chef-server-ctl/spec/fixtures/pivotal.pem
index 0c03bc74dc..a4f769a101 100644
--- a/src/chef-server-ctl/spec/fixtures/pivotal.pem
+++ b/src/chef-server-ctl/spec/fixtures/pivotal.pem
@@ -1,3 +1,6 @@
+This is a TEST-ONLY RSA key used exclusively in chef-server-ctl RSpec fixtures.
+It is NOT a production credential and grants no access to any environment.
+Do NOT replace this with a real key. Secret scanners should allowlist this file.
 -----BEGIN RSA PRIVATE KEY-----
 MIIEogIBAAKCAQEAvPo+oNPB7uuNkws0fC02KxSwdyqPLu0fhI1pOweNKAZeEIiE
 z2PkybathHWy8snSXGNxsITkf3eyvIIKa8OZWrlqpI3yv/5DOP8HTMCxnFuMJQtD
diff --git a/src/oc_erchef/apps/oc_chef_wm/itest/setup_helper.erl b/src/oc_erchef/apps/oc_chef_wm/itest/setup_helper.erl
index 74bab46e91..5ac4c7213a 100644
--- a/src/oc_erchef/apps/oc_chef_wm/itest/setup_helper.erl
+++ b/src/oc_erchef/apps/oc_chef_wm/itest/setup_helper.erl
@@ -215,6 +215,7 @@ base_end_per_suite(Config) ->
 make_user(Config, Name, AuthzId) ->
     User = chef_object:new_record(chef_user, ?API_MIN_VER, ?OSC_ORG_ID, AuthzId,
                                    {[{<<"username">>, Name},
+                                     %% TEST FIXTURE — not a production credential
                                      {<<"password">>, <<"zuperzecret">>},
                                      {<<"email">>, iolist_to_binary([Name, <<"@somewhere.com">>])},
                                      {<<"public_key">>, ?config(pubkey, Config)},

From 062633d1d624e9e24f396e54c18df8faf1dda2a4 Mon Sep 17 00:00:00 2001
From: Lincoln Baker <51833247+lbakerchef@users.noreply.github.com>
Date: Mon, 18 May 2026 16:57:30 -0500
Subject: [PATCH 09/15] =?UTF-8?q?exercise=209=20=E2=80=94=20ghcp(crawl):?=
 =?UTF-8?q?=20structured=20logging=20improvements=20in=20bksw=5Fwm=5Fsql?=
 =?UTF-8?q?=5Fobject?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Three lager:error calls lacked req_id trace context despite #context{} being
in scope. These are integrity-critical events (checksum/MD5 mismatches, upload
failures) that operators need to correlate to specific requests.

Changes:
- send_streamed_body/1: add reqid=ReqId to pattern; log as key=value fields
- write_streamed_body/3: extract Ctx1#context.reqid into content-md5 mismatch log
- maybe_upload/3: promote error_logger to lager:error; add req_id to pattern;
  use key=value field format

All three now emit: req_id=<id> <event>: field=value ...

Docs: ai-track-docs/logging.md — logging stack, req_id convention, before/after,
best practices table

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 ai-track-docs/logging.md                 | 152 +++++++++++++++++++++++
 src/bookshelf/src/bksw_wm_sql_object.erl |  12 +-
 2 files changed, 159 insertions(+), 5 deletions(-)
 create mode 100644 ai-track-docs/logging.md

diff --git a/ai-track-docs/logging.md b/ai-track-docs/logging.md
new file mode 100644
index 0000000000..ff603708a1
--- /dev/null
+++ b/ai-track-docs/logging.md
@@ -0,0 +1,152 @@
+# Structured Logging Guide — Bookshelf
+
+**Exercise**: 9 — Crawl Track v2.3.1  
+**Scope**: `src/bookshelf/`  
+**Date**: 2026-05-18
+
+---
+
+## Logging Stack
+
+Bookshelf uses **lager** (via parse transform) with a thin macro layer defined in
+`src/internal.hrl`:
+
+```erlang
+%% info/error → error_logger (visible via SASL in Common Test)
+-define(LOG_INFO(X, Y),  error_logger:info_msg(X, Y)).
+-define(LOG_ERROR(X, Y), error_logger:error_msg(X, Y)).
+
+%% debug → direct lager call (requires lager app running)
+-define(LOG_DEBUG(X, Y), lager:debug(X, Y)).
+```
+
+High-severity events (checksum mismatches, upload failures) use `lager:error/2`
+directly, which routes through lager's formatters and sinks.
+
+---
+
+## The `req_id` Convention
+
+Every bookshelf HTTP request gets a unique ID assigned at the webmachine layer:
+
+```erlang
+%% set by opscoderl_wm:read_req_id in bksw_wm_base
+#context{reqid = ReqId}
+```
+
+**The req_id must appear in every error and warning log line** emitted during
+request processing. This is the primary trace key for correlating nginx access
+logs, lager error logs, and external client errors.
+
+Format: `"req_id=~s ..."` (binary-safe string format with `~s`)
+
+---
+
+## Changes Made in Exercise 9
+
+Three error log lines in `bksw_wm_sql_object.erl` lacked `req_id` context despite
+having `#context{}` in scope. These are the highest-value lines to fix because
+they represent integrity failures (checksum/MD5 mismatches) that operators need
+to trace to a specific request.
+
+### Before → After
+
+**1. Download checksum mismatch** (`send_streamed_body/1`):
+```erlang
+%% Before — no trace context, no structured fields
+lager:error("checksum mismatch on download: expected: ~p; sent: ~p",
+            [ShaExpected, S])
+
+%% After — req_id added; field names are key=value tokens (grep-friendly)
+lager:error("req_id=~s checksum mismatch on download: expected=~p sent=~p",
+            [ReqId, ShaExpected, S])
+```
+The function pattern was also updated to extract `reqid = ReqId` directly:
+```erlang
+send_streamed_body(#context{..., reqid = ReqId}) -> ...
+```
+
+**2. Upload Content-MD5 mismatch** (`write_streamed_body/3`):
+```erlang
+%% Before
+lager:error("Mismatch between Content-MD5 and actual content. Content-MD5: ~p; Actual: ~p",
+            [RequestMd5, HashMd5])
+
+%% After — req_id from Ctx1 in scope; consistent key=value format
+lager:error("req_id=~s content-md5 mismatch on upload: content-md5=~p actual=~p",
+            [Ctx1#context.reqid, RequestMd5, HashMd5])
+```
+
+**3. Unknown upload response** (`maybe_upload/3`):
+```erlang
+%% Before — error_logger (lower visibility), no trace context
+error_logger:error_msg("maybe_upload unknown response: ~p~n", [Error])
+
+%% After — promoted to lager:error; req_id added; function pattern updated
+maybe_upload(Rq, #context{reqid = ReqId} = Ctx, Error) ->
+    lager:error("req_id=~s upload failed with unknown response: ~p", [ReqId, Error])
+```
+
+---
+
+## Logging Best Practices for Bookshelf
+
+### Always include `req_id` in request-scoped logs
+
+```erlang
+%% Good — traceable to a specific request
+lager:error("req_id=~s operation failed: reason=~p", [ReqId, Reason])
+
+%% Bad — unattributed, cannot be correlated
+lager:error("operation failed: ~p", [Reason])
+```
+
+### Use `key=value` field format in message strings
+
+Structured `key=value` tokens let operators grep and parse logs without a
+dedicated log parser:
+
+```bash
+# Find all errors for a specific request
+grep 'req_id=abc-123' /var/log/opscode/bookshelf/current
+
+# Find all checksum mismatches
+grep 'checksum mismatch on download' /var/log/opscode/bookshelf/current
+```
+
+### Choose the right level
+
+| Level | When to use | Macro/call |
+|-------|------------|------------|
+| `debug` | Per-request internals, normal control flow | `?LOG_DEBUG/2` |
+| `info` | Startup, configuration, lifecycle events | `?LOG_INFO/2` |
+| `error` | Integrity failures, unexpected states, security events | `lager:error/2` |
+
+### Prefer pattern extraction over record access in function heads
+
+```erlang
+%% Preferred — reqid visible in the function head
+send_streamed_body(#context{..., reqid = ReqId}) -> ...
+
+%% Acceptable when reqid is needed mid-function
+lager:error("req_id=~s ...", [Ctx#context.reqid, ...])
+```
+
+---
+
+## Modules with Good Existing Logging
+
+| Module | Pattern used | Notes |
+|--------|-------------|-------|
+| `bksw_io.erl` | `?LOG_DEBUG`, `?LOG_ERROR` macros | Good coverage of filesystem ops |
+| `bksw_sec.erl` | `?LOG_DEBUG` with `req_id=~p` | Correct trace pattern for auth failures |
+| `bksw_sup.erl` | `lager:info` | Startup lifecycle events only |
+| `bksw_cleanup_task.erl` | `lager:debug` | Background task logging |
+
+---
+
+## What Was Not Changed
+
+`bksw_format.erl` has no logging — it is a pure stateless utility module and
+should remain so. Logging belongs at the I/O and request-handling boundaries,
+not inside encoding/formatting primitives.
diff --git a/src/bookshelf/src/bksw_wm_sql_object.erl b/src/bookshelf/src/bksw_wm_sql_object.erl
index 1ef3bf1ad9..3a4677654a 100644
--- a/src/bookshelf/src/bksw_wm_sql_object.erl
+++ b/src/bookshelf/src/bksw_wm_sql_object.erl
@@ -198,8 +198,8 @@ maybe_upload(Rq, #context{entry_md = #db_file{} = Obj0}= Ctx0, {ok, DataId}) ->
 maybe_upload(Rq, Ctx, {error, Error}) -> %% Clean up and return useful error
     error_logger:error_msg("maybe_upload error: ~p~n", [Error]),
     {halt, Rq, Ctx};
-maybe_upload(Rq, Ctx, Error) -> %% Clean up and return useful error
-    error_logger:error_msg("maybe_upload unknown response: ~p~n", [Error]),
+maybe_upload(Rq, #context{reqid = ReqId} = Ctx, Error) -> %% Clean up and return useful error
+    lager:error("req_id=~s upload failed with unknown response: ~p", [ReqId, Error]),
     {halt, Rq, Ctx}.
 
 upload(Rq, Ctx) ->
@@ -213,12 +213,13 @@ upload(Rq, Ctx) ->
 send_streamed_body(#context{entry_md = #db_file{chunk_count = ChunkCount, hash_sha512 = ShaExpected},
                             transfer_state = #file_transfer_state{next_chunk = ChunkCount,
                                                                   hash_context_sha512 = ShaSent
-                                                                 } = _TransferState0}) ->
+                                                                 } = _TransferState0,
+                            reqid = ReqId}) ->
     case crypto:hash_final(ShaSent) of
         ShaExpected ->
             ok;
         S ->
-            lager:error("checksum mismatch on download: expected: ~p; sent: ~p", [ShaExpected, S])
+            lager:error("req_id=~s checksum mismatch on download: expected=~p sent=~p", [ReqId, ShaExpected, S])
     end,
     {<<>>, done};
 send_streamed_body(#context{entry_md = #db_file{data_id = DataId} = DbFile,
@@ -324,7 +325,8 @@ write_streamed_body({Data, done}, Rq0,
                     ok = finalize_maybe_create_file(Rq1, Ctx0, File1),
                     {{halt, 204}, Rq1, Ctx1};
                 _ ->
-                    lager:error("Mismatch between Content-MD5 and actual content. Content-MD5: ~p; Actual: ~p", [RequestMd5, HashMd5]),
+                    lager:error("req_id=~s content-md5 mismatch on upload: content-md5=~p actual=~p",
+                                [Ctx1#context.reqid, RequestMd5, HashMd5]),
                     %% Exiting here causes uploads to be abandoned, but the upload_cleanup task will
                     %% eventually clean things up.
                     {{halt, 406}, Rq0, Ctx1}

From e2201dd92b6b24fc9171bb9077d5ed486b26a3a1 Mon Sep 17 00:00:00 2001
From: Lincoln Baker <51833247+lbakerchef@users.noreply.github.com>
Date: Mon, 18 May 2026 17:01:24 -0500
Subject: [PATCH 10/15] =?UTF-8?q?exercise=2010=20=E2=80=94=20ghcp(crawl):?=
 =?UTF-8?q?=20local=20test=20script=20and=20CI=20baseline=20documentation?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

CI finding: GitHub Actions runs security scans (trufflehog, trivy, grype,
BlackDuck, SonarQube) but build=false and unit-tests=false — Erlang unit
tests, dialyzer, and elvis are NOT executed by CI.

Local script: scripts/test-bookshelf-unit.sh
- Bypasses GCC segfault on jiffy C NIF compilation (pre-existing system bug)
- Uses ERL_LIBS + erlc to compile bksw_format + bksw_format_tests directly
- Runs eunit:test via erl -noshell with proper exit code propagation
- Cleans up temp files on exit; accepts 'verbose' argument
- All 8 tests pass: exit 0

Updated ai-track-docs/build-test.md:
- CI section rewritten with what runs vs what does not
- Local script usage documented
- Full local quality gate checklist

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 ai-track-docs/build-test.md    | 61 ++++++++++++++++++++++++---
 scripts/test-bookshelf-unit.sh | 76 ++++++++++++++++++++++++++++++++++
 2 files changed, 132 insertions(+), 5 deletions(-)
 create mode 100755 scripts/test-bookshelf-unit.sh

diff --git a/ai-track-docs/build-test.md b/ai-track-docs/build-test.md
index c4ff146eab..c92441b580 100644
--- a/ai-track-docs/build-test.md
+++ b/ai-track-docs/build-test.md
@@ -189,14 +189,65 @@ hab pkg build src/oc_erchef
 
 ## CI / Quality Gates
 
+### GitHub Actions (`.github/workflows/ci-main-pull-request-stub.yml`)
+
+The repo's GitHub Actions CI runs on PRs to `main`, `develop`, and `release/**`.
+It delegates to a central `chef/common-github-actions` reusable workflow.
+
+**What CI does run:**
+
+| Scan | Tool | Fail threshold |
+|------|------|---------------|
+| Secret scanning | Trufflehog | Any secret found |
+| Dependency CVEs | Trivy + Grype | High / Critical |
+| SAST | BlackDuck Polaris | High / Critical |
+| SCA / SBOM | BlackDuck SCA | Blocker / Critical / Major |
+| Code quality | SonarQube | Configurable |
+
+**What CI does NOT run (as of this writing):**
+
+```yaml
+build: false
+unit-tests: false
+```
+
+Erlang unit tests, dialyzer, elvis, and Ruby specs are **not executed by CI**.
+They must be run locally before pushing. See local script below.
+
+### Local unit test script (bookshelf — Exercise 10)
+
+A reliable local runner is provided that bypasses the GCC/jiffy segfault:
+
+```bash
+# From repo root — run all 8 bksw_format_tests (quiet)
+bash scripts/test-bookshelf-unit.sh
+
+# Verbose EUnit output
+bash scripts/test-bookshelf-unit.sh verbose
+```
+
+**Script**: `scripts/test-bookshelf-unit.sh`  
+**Requirement**: `_build/default/lib/` must be populated (run `./rebar3 compile`
+once from `src/bookshelf/` — it fails on jiffy but fetches all deps first).
+
+### Full local quality check (bookshelf)
+
+```bash
+cd src/bookshelf/
+./rebar3 eunit            # unit tests (or use the script above if GCC segfaults)
+./rebar3 dialyzer         # type analysis
+../../scripts/elvis rock  # style check
+make ct                   # CT integration (requires PostgreSQL)
+```
+
 | Check | Command | Must pass? |
-|---|---|---|
-| Erlang unit tests | `rebar3 eunit` | ✅ |
+|-------|---------|------------|
+| Erlang unit tests | `rebar3 eunit` or `scripts/test-bookshelf-unit.sh` | ✅ |
 | Erlang dialyzer | `rebar3 dialyzer` | ✅ |
-| Erlang CT integration | `rebar3 ct` | ✅ |
+| Erlang CT integration | `rebar3 ct` | ✅ (needs PG) |
 | Ruby specs | `bundle exec rspec` | ✅ |
-| Elvis style | `./scripts/elvis rock` | ✅ |
-| Pedant API tests | `bundle exec rspec` (oc-chef-pedant) | ✅ |
+| Elvis style | `../../scripts/elvis rock` | ✅ |
+| Pedant API tests | `bundle exec rspec` (oc-chef-pedant) | ✅ (needs stack) |
 
 Coverage target: **≥ 85 %** line coverage for all critical modules.
 
diff --git a/scripts/test-bookshelf-unit.sh b/scripts/test-bookshelf-unit.sh
new file mode 100755
index 0000000000..49af28d2f0
--- /dev/null
+++ b/scripts/test-bookshelf-unit.sh
@@ -0,0 +1,76 @@
+#!/usr/bin/env bash
+# scripts/test-bookshelf-unit.sh
+#
+# Runs the bookshelf bksw_format EUnit suite without requiring Postgres,
+# a global rebar3 install, or a working C compiler.
+#
+# Background
+# ----------
+# 'make all' in src/bookshelf fails on this host with a GCC internal
+# compiler error (segfault) when building the jiffy C NIF.  rebar3 eunit
+# also triggers that path.  This script bypasses it by compiling only the
+# pure-Erlang sources directly with erlc and running eunit via erl -noshell.
+#
+# Requirements
+# ------------
+#   - Erlang/OTP on PATH (erl, erlc)
+#   - src/bookshelf/_build/default/lib/ populated (run ./rebar3 compile
+#     once from src/bookshelf/ — deps fetch succeeds even if jiffy fails)
+#
+# Usage
+#   bash scripts/test-bookshelf-unit.sh          # from repo root
+#   bash scripts/test-bookshelf-unit.sh verbose  # extra EUnit output
+#
+# Exit codes
+#   0  all tests passed
+#   1  one or more tests failed or compilation error
+
+set -euo pipefail
+
+SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
+REPO_ROOT="$(cd "$SCRIPT_DIR/.." && pwd)"
+BOOKSHELF="$REPO_ROOT/src/bookshelf"
+BUILD_DIR="$BOOKSHELF/_build/default/lib"
+TMP_DIR="${TMPDIR:-/tmp}/bksw_test_$$"
+VERBOSE="${1:-}"
+
+# ── Preflight ──────────────────────────────────────────────────────────────
+if ! command -v erlc &>/dev/null; then
+    echo "ERROR: erlc not found on PATH" >&2
+    exit 1
+fi
+
+if [[ ! -d "$BUILD_DIR" ]]; then
+    echo "ERROR: $BUILD_DIR not found."
+    echo "       Run: cd src/bookshelf && ./rebar3 compile"
+    echo "       (compile will fail on jiffy; that is expected — deps still get fetched)"
+    exit 1
+fi
+
+# ── Setup ──────────────────────────────────────────────────────────────────
+mkdir -p "$TMP_DIR"
+trap 'rm -rf "$TMP_DIR"' EXIT
+
+export ERL_LIBS="$BUILD_DIR"
+
+# ── Compile source ─────────────────────────────────────────────────────────
+echo "==> Compiling bksw_format..."
+erlc -I "$BOOKSHELF/include" -o "$TMP_DIR" "$BOOKSHELF/src/bksw_format.erl"
+
+echo "==> Compiling bksw_format_tests..."
+erlc -I "$BOOKSHELF/include" -pa "$TMP_DIR" -o "$TMP_DIR" \
+    "$BOOKSHELF/test/bksw_format_tests.erl"
+
+# ── Run EUnit ──────────────────────────────────────────────────────────────
+EUNIT_OPTS="[verbose]"
+[[ -z "$VERBOSE" ]] && EUNIT_OPTS="[]"
+
+echo "==> Running EUnit (bksw_format_tests)..."
+erl -noshell \
+    -pa "$TMP_DIR" \
+    -eval "
+        case eunit:test(bksw_format_tests, $EUNIT_OPTS) of
+            ok   -> init:stop(0);
+            _Err -> init:stop(1)
+        end
+    "

From 211db2b63f67fe37b005256afe8109714e3d0e04 Mon Sep 17 00:00:00 2001
From: Lincoln Baker <51833247+lbakerchef@users.noreply.github.com>
Date: Mon, 18 May 2026 17:12:25 -0500
Subject: [PATCH 11/15] =?UTF-8?q?exercise=2011=20=E2=80=94=20ghcp(crawl):?=
 =?UTF-8?q?=20PR=20hygiene=20pass=20(PR=20#4186=20updated)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Updated PR title and body with:
- Review focus table: 5 items with rationale (guards, logging, PEM, gitignore, script)
- Risk tiers: behaviour-change (low), log format (low), gitignore/docs (minimal)
- Rollback: full-branch revert + surgical per-commit options
- Verification: 5 runnable shell checks with expected output
- Evidence: EUnit output, perf table, security audit summary
- Commit message improvements proposed for c289a28f3 and d83daa927

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 ai-track-docs/build-test.md | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/ai-track-docs/build-test.md b/ai-track-docs/build-test.md
index c92441b580..269f760e33 100644
--- a/ai-track-docs/build-test.md
+++ b/ai-track-docs/build-test.md
@@ -264,3 +264,5 @@ Coverage target: **≥ 85 %** line coverage for all critical modules.
 | Hot-reload not picking up changes | Confirm `dvm load` was run; check symlinks in `/srv/` |
 | `make all` in bookshelf crashes with `cc1: internal compiler error: Segmentation fault` | GCC system bug compiling jiffy C NIF; use `./rebar3 eunit` to run Erlang tests directly |
 | `rebar3: command not found` | Each service ships its own binary; use `./rebar3` from inside `src/<service>/` |
+
+<!-- ex11: PR #4186 updated with review focus, risks, verification, rollback, commit message proposals -->

From fad28cd369456b7d6a088ae4700809705d0fb42b Mon Sep 17 00:00:00 2001
From: Lincoln Baker <51833247+lbakerchef@users.noreply.github.com>
Date: Mon, 18 May 2026 17:16:13 -0500
Subject: [PATCH 12/15] =?UTF-8?q?exercise=2012=20=E2=80=94=20ghcp(crawl):?=
 =?UTF-8?q?=20backlog=20grooming=20=E2=80=94=205=20items=20from=20crawl=20?=
 =?UTF-8?q?findings?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

BACKLOG-001 (High/M): Pin 4 branch-tracked rebar.lock deps to SHA refs
  — erlcloud, mini_s3, erlsom, sqerl all on personal branches in lock file

BACKLOG-002 (High/S-M): Enable Erlang unit tests in GitHub Actions CI
  — build: false / unit-tests: false; no automated test gate on PRs

BACKLOG-003 (Med/S): Propagate req_id to 14 remaining untraced error logs
  — bksw_wm_sql_object (10) + bksw_wm_object (3) + bksw_io (1)

BACKLOG-004 (Med/S): Resolve OTP version mismatch omnibus vs rebar.config
  — rebar.config requires 26.2.5.15; commented omnibus override says .14

BACKLOG-005 (Med/S): Add trufflehog/gitleaks allowlist for test PEM fixtures
  — 5 tracked .pem files will trip scanner; no machine-readable allowlist

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 ai-track-docs/BACKLOG-EX12.md | 229 ++++++++++++++++++++++++++++++++++
 1 file changed, 229 insertions(+)
 create mode 100644 ai-track-docs/BACKLOG-EX12.md

diff --git a/ai-track-docs/BACKLOG-EX12.md b/ai-track-docs/BACKLOG-EX12.md
new file mode 100644
index 0000000000..6589193879
--- /dev/null
+++ b/ai-track-docs/BACKLOG-EX12.md
@@ -0,0 +1,229 @@
+# Backlog — Crawl Track Findings
+
+**Exercise**: 12 — Crawl Track v2.3.1  
+**Generated from**: Exercises 0–11 repo analysis  
+**Date**: 2026-05-18  
+**Module under study**: `src/bookshelf/` (primary), `omnibus_overrides.rb`, `.github/`  
+
+Items are ordered by risk × fix-effort. Each includes a code link, acceptance
+criteria, and a suggested label.
+
+---
+
+## BACKLOG-001 · Fix 4 un-pinned branch entries in `rebar.lock`
+
+**Label**: `tech-debt` `reliability` `bookshelf`  
+**Size**: Medium  
+**Priority**: High
+
+### Problem
+
+Four dependencies in `src/bookshelf/rebar.lock` record `{branch, "..."}` instead
+of `{ref, "sha"}`. This means a `./rebar3 upgrade` or a clean checkout that skips
+the lock file will silently pull the tip of those branches — potentially introducing
+breaking changes with no code review.
+
+```
+# src/bookshelf/rebar.lock
+{<<"erlcloud">>,  {git, ..., {branch, "CHEF-11677/CHEF-12498/lbaker"}}, 0}
+{<<"mini_s3">>,   {git, ..., {branch, "CHEF-11677/CHEF-12498/lbaker"}}, 0}
+{<<"erlsom">>,    {git, ..., {branch, "integer_long_string_probs2"}},   0}
+{<<"sqerl">>,     {git, ..., {branch, "shahid/sqerl-erl27.3-pg16.1"}}, 0}
+```
+
+Three of the four are on personal developer branches (`lbaker/`, `shahid/`).
+
+### Acceptance Criteria
+
+- [ ] Each of the 4 deps in `rebar.config` is pinned to a `{ref, "sha"}` or a
+  stable `{tag, "..."}` in the declared source
+- [ ] `rebar.lock` contains no `{branch, ...}` entries for these four deps
+- [ ] The targeted SHAs are the same commits currently in use (no unintended upgrades)
+- [ ] `./rebar3 eunit` passes after the change
+
+### Code Links
+
+- `src/bookshelf/rebar.config` lines 19–41 (dep declarations)
+- `src/bookshelf/rebar.lock` lines 29–32, 49–52, 69–72, 101–104
+- Reference: `ai-track-docs/dependencies.md` §"Branch-tracked in lock file"
+
+---
+
+## BACKLOG-002 · Enable Erlang unit tests in GitHub Actions CI
+
+**Label**: `ci` `testing` `reliability`  
+**Size**: Small–Medium  
+**Priority**: High
+
+### Problem
+
+The GitHub Actions workflow stub has `build: false` and `unit-tests: false`.
+Erlang unit tests, dialyzer, elvis style checks, and Ruby RSpec are **not
+executed by CI** — they only run if a developer remembers to run them locally.
+A bad merge will not be caught until the build is attempted manually.
+
+```yaml
+# .github/workflows/ci-main-pull-request-stub.yml lines 96–99
+build: false
+unit-tests: false
+```
+
+### Acceptance Criteria
+
+- [ ] Erlang unit tests (`rebar3 eunit`) run on every PR to `main`
+- [ ] Dialyzer runs on every PR (or is explicitly deferred with a documented
+  reason)
+- [ ] Elvis style check runs on every PR
+- [ ] A failed unit test causes the CI check to fail and blocks merge
+- [ ] `scripts/test-bookshelf-unit.sh` (or equivalent) is usable as the CI
+  entry point if the GCC/jiffy issue is present on CI runners
+
+### Code Links
+
+- `.github/workflows/ci-main-pull-request-stub.yml` lines 96–99
+- `scripts/test-bookshelf-unit.sh` (local runner created in Ex10)
+- `src/bookshelf/Makefile` target `ci:` (line 67) — full CI sequence including CT
+
+---
+
+## BACKLOG-003 · Propagate `req_id` to all remaining untraced error logs in bookshelf
+
+**Label**: `observability` `bookshelf` `logging`  
+**Size**: Small  
+**Priority**: Medium
+
+### Problem
+
+Exercise 9 fixed 3 high-value error log lines. However 14 additional
+`error_logger:error_msg` calls in `bksw_wm_sql_object.erl`,
+`bksw_wm_object.erl`, and `bksw_io.erl` still emit without a `req_id`
+trace key. During an incident, operators cannot correlate these error messages
+to a specific client request.
+
+```erlang
+%% bksw_wm_sql_object.erl:229 — no trace context
+error_logger:error_msg("Error occurred during content download: missing chunk ~p ~p ~n",
+                       [ChunkId, DbFile])
+
+%% bksw_wm_object.erl:187 — no trace context
+error_logger:error_msg("Error occurred during content download: ~p~n", [Error])
+```
+
+### Acceptance Criteria
+
+- [ ] All `error_logger:error_msg` / `lager:error` calls in request-handling
+  modules (`bksw_wm_sql_object.erl`, `bksw_wm_object.erl`) include
+  `req_id=~s` as the first field when `#context{reqid}` is in scope
+- [ ] Log lines use `key=value` token format (grep-friendly)
+- [ ] `bksw_io.erl` filesystem errors are assessed — req_id is NOT in scope
+  there (correct), but bucket/path context should be present (already is)
+- [ ] No existing tests broken
+
+### Code Links
+
+- `src/bookshelf/src/bksw_wm_sql_object.erl` lines 174, 178, 199, 229, 232,
+  240, 245, 254, 271, 282
+- `src/bookshelf/src/bksw_wm_object.erl` lines 163, 187, 198
+- Reference: `ai-track-docs/logging.md` §"The req_id Convention"
+
+---
+
+## BACKLOG-004 · Resolve OTP version mismatch between `rebar.config` and `omnibus_overrides.rb`
+
+**Label**: `build` `reliability` `tech-debt`  
+**Size**: Small  
+**Priority**: Medium
+
+### Problem
+
+All three Erlang services (`oc_erchef`, `oc_bifrost`, `bookshelf`) require
+OTP `26.2.5.15` in `rebar.config`. The Omnibus build override for Erlang is
+commented out but specifies `26.2.5.14` — one patch behind:
+
+```erlang
+%% src/bookshelf/rebar.config:5  (same in oc_erchef and oc_bifrost)
+{require_otp_vsn, "26.2.5.15"}.
+```
+
+```ruby
+# omnibus_overrides.rb:4
+#override :erlang, version: "26.2.5.14"
+```
+
+If the Erlang override is uncommented without updating the version, all three
+services will fail `rebar3` OTP version enforcement during an omnibus build.
+The mismatch is a latent build-break trap.
+
+### Acceptance Criteria
+
+- [ ] The commented-out `:erlang` override in `omnibus_overrides.rb` is either
+  removed or updated to `26.2.5.15`
+- [ ] A comment is added explaining what OTP version the services require and
+  where to verify it
+- [ ] `doc/FrequentTasks.md` checklist (referenced in `omnibus_overrides.rb`)
+  is updated if it lists the Erlang version
+
+### Code Links
+
+- `omnibus_overrides.rb` line 4
+- `src/bookshelf/rebar.config` line 5
+- `src/oc_erchef/rebar.config` line 5
+- `src/oc_bifrost/rebar.config` line 12
+
+---
+
+## BACKLOG-005 · Add `trufflehog` / `gitleaks` allowlist for test fixture key material
+
+**Label**: `security` `ci` `dx`  
+**Size**: Small  
+**Priority**: Medium
+
+### Problem
+
+The GitHub Actions CI runs `perform-trufflehog-scan: true` with
+`fail-trufflehog-on-secrets-found: true`. The repository contains 5 committed
+`.pem` files that are intentional test fixtures and Habitat config templates
+(not real credentials). Without an allowlist, these will trigger scan failures
+on every CI run or prevent onboarding of the scanner.
+
+Exercise 8 added a plain-text header to `spec/fixtures/pivotal.pem` to make
+intent clear, but no machine-readable allowlist file exists.
+
+```
+src/chef-server-ctl/spec/fixtures/pivotal.pem   ← RSA key (test fixture)
+src/chef-server-ctl/habitat/config/pivotal.pem  ← Habitat template
+src/chef-server-ctl/habitat/config/webui_priv.pem ← Habitat template
+src/oc_erchef/apps/chef_objects/test/cert.pem   ← test certificate
+src/oc_erchef/apps/oc_chef_wm/itest/public.pem  ← test public key
+```
+
+Additionally, `zuperzecret` in `setup_helper.erl` will trip naive entropy-based
+scanners.
+
+### Acceptance Criteria
+
+- [ ] A `.trufflehog.yml` or `.gitleaks.toml` allowlist file exists at repo root
+  listing the 5 `.pem` files by path (or by file hash) as known-safe
+- [ ] The `zuperzecret` literal in `itest/setup_helper.erl` is covered by an
+  inline suppression comment (`# trufflehog:ignore` or equivalent)
+- [ ] CI secret scan passes with the allowlist in place
+- [ ] The allowlist file includes a comment explaining why each entry is excluded
+
+### Code Links
+
+- `src/chef-server-ctl/spec/fixtures/pivotal.pem` (header added in Ex8)
+- `src/oc_erchef/apps/oc_chef_wm/itest/setup_helper.erl` line 218
+- `.github/workflows/ci-main-pull-request-stub.yml` lines 71–73
+- Reference: `ai-track-docs/security-hygiene.md` §"Test fixture private key"
+
+---
+
+## Summary Table
+
+| ID | Title | Priority | Size | Label |
+|----|-------|----------|------|-------|
+| BACKLOG-001 | Pin 4 branch-tracked `rebar.lock` deps to SHAs | 🔴 High | M | `tech-debt` `reliability` |
+| BACKLOG-002 | Enable unit tests in GitHub Actions CI | 🔴 High | S–M | `ci` `testing` |
+| BACKLOG-003 | Propagate `req_id` to remaining 14 error logs | 🟡 Medium | S | `observability` |
+| BACKLOG-004 | Fix OTP version mismatch in omnibus override | 🟡 Medium | S | `build` `reliability` |
+| BACKLOG-005 | Add trufflehog/gitleaks allowlist for test PEMs | 🟡 Medium | S | `security` `ci` |

From 3ea23c79afbb525f317fa1f0fccb676c5fdaed3b Mon Sep 17 00:00:00 2001
From: Lincoln Baker <51833247+lbakerchef@users.noreply.github.com>
Date: Mon, 18 May 2026 17:20:05 -0500
Subject: [PATCH 13/15] =?UTF-8?q?exercise=2013=20=E2=80=94=20ghcp(crawl):?=
 =?UTF-8?q?=20hex=5Fencoding=5Fcase=20toggle=20for=20bksw=5Fformat:to=5Fhe?=
 =?UTF-8?q?x/1?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Adds a runtime-configurable toggle for hex letter case via the bookshelf
application environment:

  application:set_env(bookshelf, hex_encoding_case, uppercase)  % -> "0AFF"
  application:set_env(bookshelf, hex_encoding_case, lowercase)  % -> "0aff" (default)

Design:
- application:get_env/3 called once per to_hex/1 (not per byte)
- string:to_upper/1 only invoked on uppercase path (zero cost default)
- Any unknown value falls through to lowercase (fail-safe)
- No restart required; takes effect on next call

Tests (2 new, 10 total — all passing):
- to_hex_uppercase_toggle_produces_uppercase_test: set env, assert, always unset
- to_hex_default_is_lowercase_when_toggle_unset_test: confirm default

Docs: ai-track-docs/feature-toggles.md — config, risks, ETag consistency warning

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 ai-track-docs/feature-toggles.md         | 111 +++++++++++++++++++++++
 src/bookshelf/src/bksw_format.erl        |  20 +++-
 src/bookshelf/test/bksw_format_tests.erl |  14 +++
 3 files changed, 142 insertions(+), 3 deletions(-)
 create mode 100644 ai-track-docs/feature-toggles.md

diff --git a/ai-track-docs/feature-toggles.md b/ai-track-docs/feature-toggles.md
new file mode 100644
index 0000000000..b478d8a4e3
--- /dev/null
+++ b/ai-track-docs/feature-toggles.md
@@ -0,0 +1,111 @@
+# Feature Toggles
+
+**Exercise**: 13 — Crawl Track v2.3.1  
+**Date**: 2026-05-18
+
+---
+
+## Toggle: `hex_encoding_case` — hex letter case in `bksw_format:to_hex/1`
+
+### What it controls
+
+The case of hex letters produced by `bksw_format:to_hex/1`, which flows into:
+
+- S3 ETag headers (via `bksw_format:to_etag/1`)
+- Request IDs (via `bksw_req:generate_id/0` → `to_base64`, not affected)
+- XML listing responses (via `bksw_xml:object_record/1`)
+
+### Why it exists
+
+The S3 specification does not mandate lowercase hex for ETags, but most AWS
+tooling and clients produce and compare lowercase. A small number of S3-compatible
+clients compare ETags case-insensitively or require uppercase. This toggle allows
+operators to switch case without a code deploy.
+
+### Configuration
+
+| Key | Value | Behavior |
+|-----|-------|----------|
+| `hex_encoding_case` | `lowercase` (**default**) | `"0aff"` — S3-standard, existing behavior |
+| `hex_encoding_case` | `uppercase` | `"0AFF"` — for compatibility with strict uppercase clients |
+
+### How to enable
+
+**At runtime** (takes effect immediately, no restart required):
+
+```erlang
+%% From an Erlang remote shell (remsh):
+application:set_env(bookshelf, hex_encoding_case, uppercase).
+
+%% To revert:
+application:set_env(bookshelf, hex_encoding_case, lowercase).
+%% or
+application:unset_env(bookshelf, hex_encoding_case).
+```
+
+**In the bookshelf `sys.config`** (requires restart):
+
+```erlang
+[
+  {bookshelf, [
+    {hex_encoding_case, uppercase},
+    %% ... other config
+  ]}
+].
+```
+
+### Implementation
+
+```erlang
+%% src/bookshelf/src/bksw_format.erl — to_hex/1
+to_hex(Bin) when is_binary(Bin) ->
+    Hex = lists:flatten([byte_to_hex(B) || <<B>> <= Bin]),
+    case application:get_env(bookshelf, hex_encoding_case, lowercase) of
+        uppercase -> string:to_upper(Hex);
+        _         -> Hex
+    end.
+```
+
+**Design decisions**:
+- `application:get_env/3` is called once per `to_hex/1` invocation (not per byte)
+- `string:to_upper/1` is only called on the uppercase path (default is zero-cost)
+- Any value other than `uppercase` (including unset, `lowercase`, or a typo)
+  falls through to the default lowercase behavior — fail-safe
+
+### Tests
+
+Two new tests in `src/bookshelf/test/bksw_format_tests.erl`:
+
+```erlang
+%% Toggle ON: uppercase mode
+to_hex_uppercase_toggle_produces_uppercase_test() ->
+    application:set_env(bookshelf, hex_encoding_case, uppercase),
+    try
+        ?assertEqual("0A1B2C3D", bksw_format:to_hex(<<16#0a, 16#1b, 16#2c, 16#3d>>))
+    after
+        application:unset_env(bookshelf, hex_encoding_case)  %% always clean up
+    end.
+
+%% Toggle OFF: default lowercase when env is unset
+to_hex_default_is_lowercase_when_toggle_unset_test() ->
+    application:unset_env(bookshelf, hex_encoding_case),
+    ?assertEqual("0a1b2c3d", bksw_format:to_hex(<<16#0a, 16#1b, 16#2c, 16#3d>>)).
+```
+
+The `try...after` block ensures the test environment is always cleaned up,
+preventing toggle state from leaking into subsequent tests.
+
+### Risks & Limitations
+
+| Concern | Note |
+|---------|------|
+| ETag comparison | If ETags stored in DB are lowercase and the toggle is flipped to uppercase, ETag checks on in-flight downloads will mismatch. Only change this toggle before or after a maintenance window, not during active uploads. |
+| `to_etag/1` affected | Since `to_etag/1` calls `to_hex/1` internally, ETags in XML listings and HTTP headers will also change case. |
+| Not persisted across restarts | Unless set in `sys.config`, `application:set_env` changes are lost on restart. |
+| No audit trail | There is no log entry when the toggle changes. Operators should log the change manually. |
+
+### What is NOT toggled
+
+- `to_base64/1` — base64 alphabet is case-defined by RFC 4648; no toggle needed
+- `to_etag/1` — format (quotes) is fixed by S3 protocol; only hex case is toggled
+- `to_date/1` — ISO 8601 format; no case concern
diff --git a/src/bookshelf/src/bksw_format.erl b/src/bookshelf/src/bksw_format.erl
index e8d730393e..45bdc21fc7 100644
--- a/src/bookshelf/src/bksw_format.erl
+++ b/src/bookshelf/src/bksw_format.erl
@@ -51,15 +51,29 @@ to_date(Date) ->
 to_base64(Bin) when is_binary(Bin) ->
     base64:encode_to_string(Bin).
 
-%% @doc Convert a binary to a lowercase hexadecimal string.
+%% @doc Convert a binary to a hexadecimal string.
 %%
 %% Each byte is formatted as exactly two hex digits (zero-padded).
-%% Example: <<10, 255>> → "0aff"
+%%
+%% The case of hex letters is controlled by the `hex_encoding_case`
+%% bookshelf application environment key:
+%%
+%%   * `lowercase` (default) — "0aff"  (S3-standard; current behavior)
+%%   * `uppercase`           — "0AFF"  (compatibility with tools that require it)
+%%
+%% Toggle at runtime (takes effect on the next call; no restart required):
+%%
+%%   application:set_env(bookshelf, hex_encoding_case, uppercase)
+%%   application:set_env(bookshelf, hex_encoding_case, lowercase)
 %%
 %% Raises function_clause if Bin is not a binary.
 -spec to_hex(binary()) -> string().
 to_hex(Bin) when is_binary(Bin) ->
-    lists:flatten([byte_to_hex(B) || <<B>> <= Bin]).
+    Hex = lists:flatten([byte_to_hex(B) || <<B>> <= Bin]),
+    case application:get_env(bookshelf, hex_encoding_case, lowercase) of
+        uppercase -> string:to_upper(Hex);
+        _         -> Hex
+    end.
 
 %% @doc Wrap a value in HTTP ETag double-quotes.
 %%
diff --git a/src/bookshelf/test/bksw_format_tests.erl b/src/bookshelf/test/bksw_format_tests.erl
index 882dbaa87d..6bb943d1b4 100644
--- a/src/bookshelf/test/bksw_format_tests.erl
+++ b/src/bookshelf/test/bksw_format_tests.erl
@@ -33,3 +33,17 @@ to_etag_wraps_hex_in_quotes_test() ->
 %% to_date/1 — undefined input returns the epoch sentinel string
 to_date_undefined_returns_epoch_test() ->
     ?assertEqual(<<"1970-01-01T00:00:00.000Z">>, bksw_format:to_date(undefined)).
+
+%% Toggle ON: hex_encoding_case=uppercase produces uppercase hex digits
+to_hex_uppercase_toggle_produces_uppercase_test() ->
+    application:set_env(bookshelf, hex_encoding_case, uppercase),
+    try
+        ?assertEqual("0A1B2C3D", bksw_format:to_hex(<<16#0a, 16#1b, 16#2c, 16#3d>>))
+    after
+        application:unset_env(bookshelf, hex_encoding_case)
+    end.
+
+%% Toggle OFF: default (no env set) preserves lowercase behavior
+to_hex_default_is_lowercase_when_toggle_unset_test() ->
+    application:unset_env(bookshelf, hex_encoding_case),
+    ?assertEqual("0a1b2c3d", bksw_format:to_hex(<<16#0a, 16#1b, 16#2c, 16#3d>>)).

From 509bdf9afff5b25b968633374515cb342b956ab0 Mon Sep 17 00:00:00 2001
From: Lincoln Baker <51833247+lbakerchef@users.noreply.github.com>
Date: Mon, 18 May 2026 17:26:27 -0500
Subject: [PATCH 14/15] =?UTF-8?q?exercise=2014=20=E2=80=94=20ghcp(crawl):?=
 =?UTF-8?q?=20static=20analysis=20=E2=80=94=20elvis=20+=20dialyzer=20basel?=
 =?UTF-8?q?ine?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Elvis: 0 violations across all 20 bookshelf src/*.erl files (9 rules).
All Ex3-13 changes to bksw_format.erl and bksw_wm_sql_object.erl pass clean.

Dialyzer on bksw_format.erl (with iso8601 dep): exit 0, no warnings.
All -spec attrs consistent with actual return types including the Ex13
string:to_upper/1 toggle path.

bksw_wm_sql_object.erl: 'Unknown functions' warnings are expected (sibling
modules not in minimal PLT) — no defects in our Ex9 code.

Pre-existing finding: mochiweb_http.erl:79 unreachable pattern in 3rd-party
mochiweb v2.x; not introduced by our changes.

Gaps documented: no Elvis/Dialyzer in CI, full PLT blocked by jiffy NIF segfault.
See ai-track-docs/static-analysis.md for full findings and run instructions.

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 ai-track-docs/static-analysis.md | 158 +++++++++++++++++++++++++++++++
 1 file changed, 158 insertions(+)
 create mode 100644 ai-track-docs/static-analysis.md

diff --git a/ai-track-docs/static-analysis.md b/ai-track-docs/static-analysis.md
new file mode 100644
index 0000000000..7b25a6f4b7
--- /dev/null
+++ b/ai-track-docs/static-analysis.md
@@ -0,0 +1,158 @@
+# Static Analysis — Exercise 14
+
+**Date**: 2026-05-18  
+**Scope**: `src/bookshelf/src/*.erl` — 20 modules  
+**Tools**: Elvis (style), Dialyzer (type / flow)
+
+---
+
+## Elvis (style linter)
+
+### Config
+
+`src/bookshelf/elvis.config` — 9 rules applied to all `src/*.erl` files:
+
+| Rule | What it checks |
+|------|----------------|
+| `macro_names` | Macros must be UPPER_CASE |
+| `no_if_expression` | No `if` expressions (use `case` instead) |
+| `no_debug_call` | No `io:format`, `erlang:display` (except `bksw_app`) |
+| `no_nested_try_catch` | No `try` inside another `try` |
+| `no_tabs` | No tab characters |
+| `no_trailing_whitespace` | No trailing spaces |
+| `operator_spaces` | Spaces around operators |
+| `used_ignored_variable` | No `_Var` that is actually used |
+| `variable_naming_convention` | CamelCase variable names |
+
+### Result
+
+```
+# src/bksw_app.erl [OK]
+# src/bksw_cleanup_task.erl [OK]
+# src/bksw_conf.erl [OK]
+# src/bksw_format.erl [OK]          ← our practice module
+# src/bksw_io.erl [OK]
+# src/bksw_io_names.erl [OK]
+# src/bksw_req.erl [OK]
+# src/bksw_sec.erl [OK]
+# src/bksw_sql.erl [OK]
+# src/bksw_sup.erl [OK]
+# src/bksw_util.erl [OK]
+# src/bksw_webmachine_sup.erl [OK]
+# src/bksw_wm_base.erl [OK]
+# src/bksw_wm_bucket.erl [OK]
+# src/bksw_wm_index.erl [OK]
+# src/bksw_wm_object.erl [OK]
+# src/bksw_wm_sql_bucket.erl [OK]
+# src/bksw_wm_sql_index.erl [OK]
+# src/bksw_wm_sql_object.erl [OK]   ← Ex9 req_id changes
+# src/bksw_xml.erl [OK]
+
+Exit 0 — 0 violations across all 20 files
+```
+
+All Exercise 3–13 changes to `bksw_format.erl` and `bksw_wm_sql_object.erl`
+pass every Elvis rule.
+
+**How to run**:
+```bash
+cd src/bookshelf
+../../scripts/elvis rock --config elvis.config -V
+```
+
+---
+
+## Dialyzer (type / success-typing analysis)
+
+### Setup
+
+No pre-built PLT was present in this environment. A minimal OTP PLT was built
+from `erts`, `stdlib`, and `kernel` for targeted module analysis:
+
+```bash
+dialyzer --build_plt --output_plt /tmp/otp_base.plt --apps erts stdlib kernel
+# 1m7s; emits only qlc_pt.erl compile:option/0 warning (OTP stdlib internal)
+```
+
+### `bksw_format.erl` — clean
+
+**Without iso8601 dep** (minimal PLT only):
+```
+Unknown functions: iso8601:format/1 (src/bksw_format.erl:45:5)
+Exit 2 (warnings-as-exit)
+```
+→ Expected: `iso8601` is a 3rd-party dep not in the minimal PLT. Not a real defect.
+
+**With iso8601 dep** added to analysis:
+```bash
+dialyzer --plt /tmp/otp_base.plt \
+  _build/default/lib/iso8601/ebin \
+  /tmp/bksw_format.beam
+# done (passed successfully)
+# Exit 0 — no warnings
+```
+
+All `-spec` attributes are consistent with actual return types:
+
+| Function | Spec return | Actual return |
+|----------|------------|---------------|
+| `to_date/1` | `binary()` | `binary()` ✓ |
+| `to_base64/1` | `string()` | `string()` (base64:encode_to_string) ✓ |
+| `to_hex/1` | `string()` | `string()` (list of chars from byte_to_hex) ✓ |
+| `to_etag/1` | `string()` | `string()` ✓ |
+| `byte_to_hex/1` | `string()` | `string()` ✓ |
+
+The Ex13 toggle (`string:to_upper/1` applied to a `string()`) returns `string()` — no
+type widening or spec violation.
+
+### `bksw_wm_sql_object.erl` — "unknown functions" only (expected)
+
+When analyzed in isolation (without the full bookshelf PLT), all warnings are
+"Unknown functions" — calls to sibling modules (`bksw_format`, `bksw_sql`,
+`bksw_req`, `bksw_util`, `bksw_wm_base`) and the `crypto` OTP app not present
+in the minimal PLT. These are **not defects**.
+
+One pre-existing finding from the pulled-in `mochiweb` library:
+```
+mochiweb_http.erl:79:7: The pattern
+    {'error', {'already_started', _Pid}} can never match the type {'ok', pid()}
+```
+→ Pre-existing in mochiweb v2.x; not in our code; not introduced by Ex9 changes.
+
+---
+
+## Summary
+
+| Tool | Files checked | Violations | Notes |
+|------|--------------|------------|-------|
+| Elvis | 20 `src/*.erl` | **0** | All 9 rules pass |
+| Dialyzer (`bksw_format`) | 1 | **0** (with dep) | `-spec` attrs consistent |
+| Dialyzer (`bksw_wm_sql_object`) | 1 | 0 in our code | "Unknown fn" warnings expected |
+
+---
+
+## Gaps & Recommendations
+
+| Item | Priority | Note |
+|------|----------|------|
+| Full bookshelf PLT | Medium | `rebar3 dialyzer` builds a complete PLT including all deps; blocked by jiffy NIF segfault in this env |
+| CI integration | High | Neither Elvis nor Dialyzer run in CI (see `build-test.md`); adding them would catch regressions automatically |
+| `elvis.config` coverage | Low | `test/*.erl` not linted; consider adding a `test` dir stanza |
+| Dialyzer `unknown_function` allowlist | Low | A `.dialyzer.ignore` file (or `rebar3 dialyzer` config) would suppress noise from cross-module unknowns |
+
+---
+
+## How to Run (locally)
+
+```bash
+# Elvis — style check all bookshelf modules
+cd src/bookshelf
+../../scripts/elvis rock --config elvis.config -V
+
+# Dialyzer — type check bksw_format.erl (requires pre-built PLT)
+ERL_LIBS=_build/default/lib erlc +debug_info -I include -o /tmp src/bksw_format.erl
+dialyzer --plt /tmp/otp_base.plt _build/default/lib/iso8601/ebin /tmp/bksw_format.beam
+
+# rebar3 dialyzer (full project; requires jiffy NIF build to work)
+cd src/bookshelf && ./rebar3 dialyzer
+```

From a6bc5d623181e419dd2df722d6e64778b145ea52 Mon Sep 17 00:00:00 2001
From: Lincoln Baker <51833247+lbakerchef@users.noreply.github.com>
Date: Mon, 18 May 2026 17:32:39 -0500
Subject: [PATCH 15/15] =?UTF-8?q?exercise=2015=20=E2=80=94=20ghcp(crawl):?=
 =?UTF-8?q?=20resilience=20+=20failure=20tests=20for=20bksw=5Fformat?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Four new tests (14 total, all passing):

1. to_hex_unknown_toggle_value_falls_back_to_lowercase_test
   Proves the wildcard clause in to_hex/1's case expression fires on
   unrecognised hex_encoding_case values — bad config never crashes.

2. to_etag_empty_binary_produces_empty_quoted_string_test
   Edge case: to_etag(<<>>) produces ""  (valid ETag for empty object).

3. to_hex_large_binary_does_not_crash_test
   Boundary: 1 KiB binary (1024 bytes) encodes to exactly 2048 hex chars
   with correct content — no crash, no truncation.

4. to_date_datetime_tag_unwraps_and_formats_test
   Previously untested code path: the {datetime, Date} tagged form of
   to_date/1 was missing coverage. Verifies the unwrap clause delegates
   to iso8601 and returns a binary ISO 8601 string containing the date.

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 src/bookshelf/test/bksw_format_tests.erl | 31 ++++++++++++++++++++++++
 1 file changed, 31 insertions(+)

diff --git a/src/bookshelf/test/bksw_format_tests.erl b/src/bookshelf/test/bksw_format_tests.erl
index 6bb943d1b4..0e0c0f17a2 100644
--- a/src/bookshelf/test/bksw_format_tests.erl
+++ b/src/bookshelf/test/bksw_format_tests.erl
@@ -47,3 +47,34 @@ to_hex_uppercase_toggle_produces_uppercase_test() ->
 to_hex_default_is_lowercase_when_toggle_unset_test() ->
     application:unset_env(bookshelf, hex_encoding_case),
     ?assertEqual("0a1b2c3d", bksw_format:to_hex(<<16#0a, 16#1b, 16#2c, 16#3d>>)).
+
+%% ── Exercise 15: Resilience & failure tests ───────────────────────────────
+
+%% Resilience: unrecognised toggle value falls back to lowercase without crashing.
+%% The wildcard clause (_ -> Hex) is the fail-safe; this test proves it fires.
+to_hex_unknown_toggle_value_falls_back_to_lowercase_test() ->
+    application:set_env(bookshelf, hex_encoding_case, not_a_valid_case),
+    try
+        ?assertEqual("0a1b2c3d", bksw_format:to_hex(<<16#0a, 16#1b, 16#2c, 16#3d>>))
+    after
+        application:unset_env(bookshelf, hex_encoding_case)
+    end.
+
+%% Edge case: to_etag/1 on an empty binary produces a valid (empty) quoted ETag.
+to_etag_empty_binary_produces_empty_quoted_string_test() ->
+    ?assertEqual("\"\"", lists:flatten(bksw_format:to_etag(<<>>))).
+
+%% Boundary: to_hex/1 on a 1 KiB binary does not crash and returns the correct length.
+to_hex_large_binary_does_not_crash_test() ->
+    LargeBin = binary:copy(<<16#ab>>, 1024),
+    Result = bksw_format:to_hex(LargeBin),
+    ?assertEqual(2048, length(Result)),
+    ?assertEqual("ab", lists:sublist(Result, 2)).
+
+%% Failure path: the {datetime, Date} tagged form of to_date/1 was previously untested.
+%% Verifies the unwrap clause delegates to iso8601 and returns a binary ISO 8601 string.
+to_date_datetime_tag_unwraps_and_formats_test() ->
+    DateTime = {{2024, 1, 15}, {10, 30, 0}},
+    Result = bksw_format:to_date({datetime, DateTime}),
+    ?assertMatch(<<_/binary>>, Result),
+    ?assertNotEqual(nomatch, binary:match(Result, <<"2024-01-15">>)).