From 580b186c2d11af28df5e9a1e0bae104b82753f46 Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Tue, 24 Feb 2026 23:31:40 +0000
Subject: [PATCH 1/6] Initial plan


From 4eac0a8494a2d34c513e8240d9aaeb64fc94706e Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Tue, 24 Feb 2026 23:36:01 +0000
Subject: [PATCH 2/6] Add Dockerfile, .dockerignore, deploy.sh, and cloud-run
 config for serverless GCP deployment

Co-authored-by: pmayd <9614291+pmayd@users.noreply.github.com>
---
 .dockerignore         | 11 +++++++
 Dockerfile            | 49 +++++++++++++++++++++++++++++++
 config.yml            |  3 ++
 scripts/gcp/deploy.sh | 68 +++++++++++++++++++++++++++++++++++++++++++
 4 files changed, 131 insertions(+)
 create mode 100644 .dockerignore
 create mode 100644 Dockerfile
 create mode 100755 scripts/gcp/deploy.sh

diff --git a/.dockerignore b/.dockerignore
new file mode 100644
index 0000000..94fee5d
--- /dev/null
+++ b/.dockerignore
@@ -0,0 +1,11 @@
+.git
+.github
+.Rproj.user
+.Rhistory
+.RData
+*.Rproj
+data/
+renv/library/
+renv/local/
+renv/staging/
+secrets/
diff --git a/Dockerfile b/Dockerfile
new file mode 100644
index 0000000..1b8bf9b
--- /dev/null
+++ b/Dockerfile
@@ -0,0 +1,49 @@
+FROM rocker/r-ver:4.5.1
+
+# Install system dependencies required by R packages
+RUN apt-get update && apt-get install -y --no-install-recommends \
+    apt-transport-https \
+    ca-certificates \
+    gnupg \
+    curl \
+    libssl-dev \
+    libxml2-dev \
+    libcurl4-openssl-dev \
+    libfontconfig1-dev \
+    libharfbuzz-dev \
+    libfribidi-dev \
+    libfreetype6-dev \
+    libpng-dev \
+    libtiff5-dev \
+    libjpeg-dev \
+    && rm -rf /var/lib/apt/lists/*
+
+# Install Google Cloud SDK (provides gsutil and bq)
+RUN curl https://packages.cloud.google.com/apt/doc/apt-key.gpg \
+    | gpg --dearmor -o /usr/share/keyrings/cloud.google.gpg \
+    && echo "deb [signed-by=/usr/share/keyrings/cloud.google.gpg] https://packages.cloud.google.com/apt cloud-sdk main" \
+    | tee /etc/apt/sources.list.d/google-cloud-sdk.list \
+    && apt-get update && apt-get install -y --no-install-recommends google-cloud-cli \
+    && rm -rf /var/lib/apt/lists/*
+
+WORKDIR /workspace
+
+# Copy renv infrastructure first to leverage Docker layer caching for packages
+COPY renv.lock renv.lock
+COPY .Rprofile .Rprofile
+COPY renv/activate.R renv/activate.R
+COPY renv/settings.json renv/settings.json
+
+# Install renv
+RUN R -e "install.packages('renv', repos = 'https://cloud.r-project.org')"
+
+# Restore all R packages declared in renv.lock
+RUN R -e "renv::restore()"
+
+# Copy the rest of the application
+COPY . .
+
+# Use the cloud-run configuration profile
+ENV R_CONFIG_ACTIVE=cloud-run
+
+ENTRYPOINT ["Rscript", "scripts/R/run_pipeline.R"]
diff --git a/config.yml b/config.yml
index bb71b4d..abb9128 100644
--- a/config.yml
+++ b/config.yml
@@ -8,3 +8,6 @@ default:
 
 production:
     data_root: "/home/rstudio/data"
+
+cloud-run:
+    data_root: "/workspace/data"
diff --git a/scripts/gcp/deploy.sh b/scripts/gcp/deploy.sh
new file mode 100755
index 0000000..5d86027
--- /dev/null
+++ b/scripts/gcp/deploy.sh
@@ -0,0 +1,68 @@
+#!/bin/bash
+# Build the Docker image, push it to Artifact Registry, and deploy the A4D
+# pipeline as a Cloud Run Job that can be triggered manually.
+#
+# Prerequisites:
+#   - gcloud CLI authenticated with sufficient permissions
+#   - Docker installed and running
+#   - Service account "${SERVICE_ACCOUNT}" created with the following roles:
+#       roles/storage.objectViewer       (read source files from GCS)
+#       roles/storage.objectCreator      (write output files to GCS)
+#       roles/bigquery.dataEditor        (write tables to BigQuery)
+#       roles/bigquery.jobUser           (run BigQuery load jobs)
+#       roles/secretmanager.secretAccessor (access the SA key secret)
+#   - Secret "a4d-gcp-sa" created in Secret Manager containing the service
+#     account JSON key used to authenticate googlesheets4/googledrive
+#
+# Usage:
+#   PROJECT_ID=my-project SERVICE_ACCOUNT=sa@my-project.iam.gserviceaccount.com \
+#     bash scripts/gcp/deploy.sh
+#
+# To run the pipeline after deployment:
+#   gcloud run jobs execute a4d-pipeline \
+#     --region=${REGION} --project=${PROJECT_ID} --wait
+
+set -euo pipefail
+
+PROJECT_ID="${PROJECT_ID:-a4d-315220}"
+REGION="${REGION:-europe-west1}"
+REPOSITORY="a4d"
+IMAGE_NAME="pipeline"
+JOB_NAME="a4d-pipeline"
+SERVICE_ACCOUNT="${SERVICE_ACCOUNT:-a4d-pipeline@${PROJECT_ID}.iam.gserviceaccount.com}"
+IMAGE_URI="${REGION}-docker.pkg.dev/${PROJECT_ID}/${REPOSITORY}/${IMAGE_NAME}"
+
+echo "==> Configuring Docker authentication for Artifact Registry..."
+gcloud auth configure-docker "${REGION}-docker.pkg.dev" --quiet
+
+echo "==> Creating Artifact Registry repository (skipped if it already exists)..."
+gcloud artifacts repositories create "${REPOSITORY}" \
+    --repository-format=docker \
+    --location="${REGION}" \
+    --project="${PROJECT_ID}" \
+    --quiet 2>/dev/null || true
+
+echo "==> Building Docker image: ${IMAGE_URI}"
+docker build --cache-from "${IMAGE_URI}" -t "${IMAGE_URI}" .
+
+echo "==> Pushing Docker image to Artifact Registry..."
+docker push "${IMAGE_URI}"
+
+echo "==> Deploying Cloud Run Job: ${JOB_NAME}"
+gcloud run jobs deploy "${JOB_NAME}" \
+    --image="${IMAGE_URI}" \
+    --region="${REGION}" \
+    --project="${PROJECT_ID}" \
+    --service-account="${SERVICE_ACCOUNT}" \
+    --memory=8Gi \
+    --cpu=4 \
+    --max-retries=0 \
+    --task-timeout=3h \
+    --set-secrets="/workspace/secrets/a4d-gcp-sa.json=a4d-gcp-sa:latest"
+
+echo ""
+echo "==> Deployment complete."
+echo ""
+echo "To run the pipeline manually, execute:"
+echo "  gcloud run jobs execute ${JOB_NAME} \\"
+echo "    --region=${REGION} --project=${PROJECT_ID} --wait"

From b57b4834cab876ead48e7c60c67a324c5aed3a9c Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Tue, 24 Feb 2026 23:53:14 +0000
Subject: [PATCH 3/6] Deploy Python pipeline as Cloud Run Job: fix Dockerfile,
 add run-pipeline CLI command, update deploy.sh

Co-authored-by: pmayd <9614291+pmayd@users.noreply.github.com>
---
 .dockerignore                                 |    8 +-
 Dockerfile                                    |   49 -
 a4d-python/.env.example                       |   25 +
 a4d-python/.gitignore                         |   67 +
 a4d-python/Dockerfile                         |   34 +
 a4d-python/README.md                          |  221 +++
 a4d-python/docs/CLAUDE.md                     |  185 +++
 a4d-python/docs/REMAINING_DIFFERENCES.md      |  240 +++
 a4d-python/docs/VALIDATION_TRACKING.md        |  403 +++++
 a4d-python/docs/migration/MIGRATION_GUIDE.md  |  740 ++++++++++
 .../docs/migration/PYTHON_IMPROVEMENTS.md     |  146 ++
 .../migration/REFERENCE_DATA_MIGRATION.md     |  529 +++++++
 a4d-python/justfile                           |  114 ++
 a4d-python/profiling/PROFILING_SUMMARY.md     |  246 ++++
 a4d-python/profiling/extraction_2019.prof     |  Bin 0 -> 86857 bytes
 a4d-python/profiling/extraction_2024.prof     |  Bin 0 -> 84453 bytes
 a4d-python/pyproject.toml                     |   80 +
 a4d-python/scripts/analyze_logs.sql           |   74 +
 a4d-python/scripts/check_sheets.py            |   79 +
 a4d-python/scripts/compare_r_vs_python.py     |  530 +++++++
 a4d-python/scripts/export_single_tracker.py   |   55 +
 a4d-python/scripts/profile_extraction.py      |   77 +
 .../scripts/profile_extraction_detailed.py    |  193 +++
 a4d-python/scripts/reprocess_tracker.py       |   16 +
 a4d-python/scripts/test_cleaning.py           |   87 ++
 a4d-python/scripts/test_extended_trackers.py  |  142 ++
 a4d-python/scripts/test_multiple_trackers.py  |  128 ++
 a4d-python/scripts/verify_fixes.py            |  122 ++
 a4d-python/src/a4d/__init__.py                |   15 +
 a4d-python/src/a4d/__main__.py                |    6 +
 a4d-python/src/a4d/clean/__init__.py          |   15 +
 a4d-python/src/a4d/clean/converters.py        |  349 +++++
 a4d-python/src/a4d/clean/date_parser.py       |  123 ++
 a4d-python/src/a4d/clean/patient.py           |  933 ++++++++++++
 a4d-python/src/a4d/clean/schema.py            |  159 ++
 a4d-python/src/a4d/clean/schema_old.py        |  202 +++
 a4d-python/src/a4d/clean/transformers.py      |  388 +++++
 a4d-python/src/a4d/clean/validators.py        |  423 ++++++
 a4d-python/src/a4d/cli.py                     |  578 ++++++++
 a4d-python/src/a4d/config.py                  |   57 +
 a4d-python/src/a4d/errors.py                  |  210 +++
 a4d-python/src/a4d/extract/__init__.py        |    0
 a4d-python/src/a4d/extract/patient.py         |  958 ++++++++++++
 a4d-python/src/a4d/gcp/__init__.py            |   21 +
 a4d-python/src/a4d/gcp/bigquery.py            |  187 +++
 a4d-python/src/a4d/gcp/storage.py             |  129 ++
 a4d-python/src/a4d/logging.py                 |  159 ++
 a4d-python/src/a4d/pipeline/__init__.py       |   18 +
 a4d-python/src/a4d/pipeline/models.py         |   78 +
 a4d-python/src/a4d/pipeline/patient.py        |  329 +++++
 a4d-python/src/a4d/pipeline/tracker.py        |  113 ++
 a4d-python/src/a4d/reference/__init__.py      |   43 +
 a4d-python/src/a4d/reference/loaders.py       |   83 ++
 a4d-python/src/a4d/reference/provinces.py     |  166 +++
 a4d-python/src/a4d/reference/synonyms.py      |  343 +++++
 a4d-python/src/a4d/state/__init__.py          |    0
 a4d-python/src/a4d/tables/__init__.py         |   18 +
 a4d-python/src/a4d/tables/logs.py             |  220 +++
 a4d-python/src/a4d/tables/patient.py          |  213 +++
 a4d-python/src/a4d/utils/__init__.py          |    3 +
 a4d-python/tests/test_clean/__init__.py       |    1 +
 .../tests/test_clean/test_converters.py       |  337 +++++
 a4d-python/tests/test_clean/test_patient.py   |  418 ++++++
 .../tests/test_clean/test_transformers.py     |  847 +++++++++++
 .../tests/test_clean/test_validators.py       |  592 ++++++++
 a4d-python/tests/test_errors.py               |  167 +++
 a4d-python/tests/test_extract/__init__.py     |    1 +
 a4d-python/tests/test_extract/test_patient.py |  648 ++++++++
 .../test_extract/test_patient_helpers.py      |  470 ++++++
 a4d-python/tests/test_gcp/__init__.py         |    0
 a4d-python/tests/test_gcp/test_bigquery.py    |  173 +++
 a4d-python/tests/test_gcp/test_storage.py     |  114 ++
 a4d-python/tests/test_integration/__init__.py |    9 +
 a4d-python/tests/test_integration/conftest.py |   42 +
 .../test_clean_integration.py                 |  133 ++
 a4d-python/tests/test_integration/test_e2e.py |  147 ++
 .../test_extract_integration.py               |  134 ++
 .../test_integration/test_r_validation.py     |  855 +++++++++++
 a4d-python/tests/test_reference/__init__.py   |    1 +
 .../tests/test_reference/test_provinces.py    |  248 ++++
 .../tests/test_reference/test_synonyms.py     |  344 +++++
 a4d-python/tests/test_tables/test_patient.py  |  361 +++++
 a4d-python/uv.lock                            | 1298 +++++++++++++++++
 config.yml                                    |    3 -
 scripts/R/run_pipeline.R                      |   28 +-
 scripts/gcp/deploy.sh                         |   23 +-
 86 files changed, 18448 insertions(+), 75 deletions(-)
 delete mode 100644 Dockerfile
 create mode 100644 a4d-python/.env.example
 create mode 100644 a4d-python/.gitignore
 create mode 100644 a4d-python/Dockerfile
 create mode 100644 a4d-python/README.md
 create mode 100644 a4d-python/docs/CLAUDE.md
 create mode 100644 a4d-python/docs/REMAINING_DIFFERENCES.md
 create mode 100644 a4d-python/docs/VALIDATION_TRACKING.md
 create mode 100644 a4d-python/docs/migration/MIGRATION_GUIDE.md
 create mode 100644 a4d-python/docs/migration/PYTHON_IMPROVEMENTS.md
 create mode 100644 a4d-python/docs/migration/REFERENCE_DATA_MIGRATION.md
 create mode 100644 a4d-python/justfile
 create mode 100644 a4d-python/profiling/PROFILING_SUMMARY.md
 create mode 100644 a4d-python/profiling/extraction_2019.prof
 create mode 100644 a4d-python/profiling/extraction_2024.prof
 create mode 100644 a4d-python/pyproject.toml
 create mode 100644 a4d-python/scripts/analyze_logs.sql
 create mode 100644 a4d-python/scripts/check_sheets.py
 create mode 100644 a4d-python/scripts/compare_r_vs_python.py
 create mode 100644 a4d-python/scripts/export_single_tracker.py
 create mode 100644 a4d-python/scripts/profile_extraction.py
 create mode 100644 a4d-python/scripts/profile_extraction_detailed.py
 create mode 100644 a4d-python/scripts/reprocess_tracker.py
 create mode 100644 a4d-python/scripts/test_cleaning.py
 create mode 100644 a4d-python/scripts/test_extended_trackers.py
 create mode 100644 a4d-python/scripts/test_multiple_trackers.py
 create mode 100644 a4d-python/scripts/verify_fixes.py
 create mode 100644 a4d-python/src/a4d/__init__.py
 create mode 100644 a4d-python/src/a4d/__main__.py
 create mode 100644 a4d-python/src/a4d/clean/__init__.py
 create mode 100644 a4d-python/src/a4d/clean/converters.py
 create mode 100644 a4d-python/src/a4d/clean/date_parser.py
 create mode 100644 a4d-python/src/a4d/clean/patient.py
 create mode 100644 a4d-python/src/a4d/clean/schema.py
 create mode 100644 a4d-python/src/a4d/clean/schema_old.py
 create mode 100644 a4d-python/src/a4d/clean/transformers.py
 create mode 100644 a4d-python/src/a4d/clean/validators.py
 create mode 100644 a4d-python/src/a4d/cli.py
 create mode 100644 a4d-python/src/a4d/config.py
 create mode 100644 a4d-python/src/a4d/errors.py
 create mode 100644 a4d-python/src/a4d/extract/__init__.py
 create mode 100644 a4d-python/src/a4d/extract/patient.py
 create mode 100644 a4d-python/src/a4d/gcp/__init__.py
 create mode 100644 a4d-python/src/a4d/gcp/bigquery.py
 create mode 100644 a4d-python/src/a4d/gcp/storage.py
 create mode 100644 a4d-python/src/a4d/logging.py
 create mode 100644 a4d-python/src/a4d/pipeline/__init__.py
 create mode 100644 a4d-python/src/a4d/pipeline/models.py
 create mode 100644 a4d-python/src/a4d/pipeline/patient.py
 create mode 100644 a4d-python/src/a4d/pipeline/tracker.py
 create mode 100644 a4d-python/src/a4d/reference/__init__.py
 create mode 100644 a4d-python/src/a4d/reference/loaders.py
 create mode 100644 a4d-python/src/a4d/reference/provinces.py
 create mode 100644 a4d-python/src/a4d/reference/synonyms.py
 create mode 100644 a4d-python/src/a4d/state/__init__.py
 create mode 100644 a4d-python/src/a4d/tables/__init__.py
 create mode 100644 a4d-python/src/a4d/tables/logs.py
 create mode 100644 a4d-python/src/a4d/tables/patient.py
 create mode 100644 a4d-python/src/a4d/utils/__init__.py
 create mode 100644 a4d-python/tests/test_clean/__init__.py
 create mode 100644 a4d-python/tests/test_clean/test_converters.py
 create mode 100644 a4d-python/tests/test_clean/test_patient.py
 create mode 100644 a4d-python/tests/test_clean/test_transformers.py
 create mode 100644 a4d-python/tests/test_clean/test_validators.py
 create mode 100644 a4d-python/tests/test_errors.py
 create mode 100644 a4d-python/tests/test_extract/__init__.py
 create mode 100644 a4d-python/tests/test_extract/test_patient.py
 create mode 100644 a4d-python/tests/test_extract/test_patient_helpers.py
 create mode 100644 a4d-python/tests/test_gcp/__init__.py
 create mode 100644 a4d-python/tests/test_gcp/test_bigquery.py
 create mode 100644 a4d-python/tests/test_gcp/test_storage.py
 create mode 100644 a4d-python/tests/test_integration/__init__.py
 create mode 100644 a4d-python/tests/test_integration/conftest.py
 create mode 100644 a4d-python/tests/test_integration/test_clean_integration.py
 create mode 100644 a4d-python/tests/test_integration/test_e2e.py
 create mode 100644 a4d-python/tests/test_integration/test_extract_integration.py
 create mode 100644 a4d-python/tests/test_integration/test_r_validation.py
 create mode 100644 a4d-python/tests/test_reference/__init__.py
 create mode 100644 a4d-python/tests/test_reference/test_provinces.py
 create mode 100644 a4d-python/tests/test_reference/test_synonyms.py
 create mode 100644 a4d-python/tests/test_tables/test_patient.py
 create mode 100644 a4d-python/uv.lock

diff --git a/.dockerignore b/.dockerignore
index 94fee5d..ce02378 100644
--- a/.dockerignore
+++ b/.dockerignore
@@ -4,8 +4,10 @@
 .Rhistory
 .RData
 *.Rproj
+a4d-python/.pytest_cache
+a4d-python/.ruff_cache
+a4d-python/htmlcov
+a4d-python/.coverage
+a4d-python/profiling/*.prof
 data/
-renv/library/
-renv/local/
-renv/staging/
 secrets/
diff --git a/Dockerfile b/Dockerfile
deleted file mode 100644
index 1b8bf9b..0000000
--- a/Dockerfile
+++ /dev/null
@@ -1,49 +0,0 @@
-FROM rocker/r-ver:4.5.1
-
-# Install system dependencies required by R packages
-RUN apt-get update && apt-get install -y --no-install-recommends \
-    apt-transport-https \
-    ca-certificates \
-    gnupg \
-    curl \
-    libssl-dev \
-    libxml2-dev \
-    libcurl4-openssl-dev \
-    libfontconfig1-dev \
-    libharfbuzz-dev \
-    libfribidi-dev \
-    libfreetype6-dev \
-    libpng-dev \
-    libtiff5-dev \
-    libjpeg-dev \
-    && rm -rf /var/lib/apt/lists/*
-
-# Install Google Cloud SDK (provides gsutil and bq)
-RUN curl https://packages.cloud.google.com/apt/doc/apt-key.gpg \
-    | gpg --dearmor -o /usr/share/keyrings/cloud.google.gpg \
-    && echo "deb [signed-by=/usr/share/keyrings/cloud.google.gpg] https://packages.cloud.google.com/apt cloud-sdk main" \
-    | tee /etc/apt/sources.list.d/google-cloud-sdk.list \
-    && apt-get update && apt-get install -y --no-install-recommends google-cloud-cli \
-    && rm -rf /var/lib/apt/lists/*
-
-WORKDIR /workspace
-
-# Copy renv infrastructure first to leverage Docker layer caching for packages
-COPY renv.lock renv.lock
-COPY .Rprofile .Rprofile
-COPY renv/activate.R renv/activate.R
-COPY renv/settings.json renv/settings.json
-
-# Install renv
-RUN R -e "install.packages('renv', repos = 'https://cloud.r-project.org')"
-
-# Restore all R packages declared in renv.lock
-RUN R -e "renv::restore()"
-
-# Copy the rest of the application
-COPY . .
-
-# Use the cloud-run configuration profile
-ENV R_CONFIG_ACTIVE=cloud-run
-
-ENTRYPOINT ["Rscript", "scripts/R/run_pipeline.R"]
diff --git a/a4d-python/.env.example b/a4d-python/.env.example
new file mode 100644
index 0000000..0937a10
--- /dev/null
+++ b/a4d-python/.env.example
@@ -0,0 +1,25 @@
+# Environment Configuration
+A4D_ENVIRONMENT=development
+
+# GCP Configuration
+A4D_PROJECT_ID=a4dphase2
+A4D_DATASET=tracker
+A4D_DOWNLOAD_BUCKET=a4dphase2_upload
+A4D_UPLOAD_BUCKET=a4dphase2_output
+
+# GCP Authentication (optional - uses Application Default Credentials if not set)
+# For local development: run `gcloud auth application-default login`
+# For CI/CD or VM: set path to service account key file
+# GOOGLE_APPLICATION_CREDENTIALS=/path/to/service-account-key.json
+
+# Paths
+A4D_DATA_ROOT=/path/to/tracker/files
+A4D_OUTPUT_DIR=output
+
+# Processing Settings
+A4D_MAX_WORKERS=4
+
+# Error Values (matching R pipeline)
+A4D_ERROR_VAL_NUMERIC=999999
+A4D_ERROR_VAL_CHARACTER=Undefined
+A4D_ERROR_VAL_DATE=9999-09-09
diff --git a/a4d-python/.gitignore b/a4d-python/.gitignore
new file mode 100644
index 0000000..60bc93f
--- /dev/null
+++ b/a4d-python/.gitignore
@@ -0,0 +1,67 @@
+# Python
+__pycache__/
+*.py[cod]
+*$py.class
+*.so
+.Python
+build/
+develop-eggs/
+dist/
+downloads/
+eggs/
+.eggs/
+lib/
+lib64/
+parts/
+sdist/
+var/
+wheels/
+*.egg-info/
+.installed.cfg
+*.egg
+
+# Virtual environments
+.venv/
+venv/
+ENV/
+env/
+
+# uv
+.uv/
+
+# Testing
+.pytest_cache/
+.coverage
+htmlcov/
+.tox/
+
+# Type checking
+.mypy_cache/
+.dmypy.json
+dmypy.json
+
+# IDEs
+.vscode/
+.idea/
+*.swp
+*.swo
+*~
+
+# Environment
+.env
+.env.local
+
+# Logs
+*.log
+logs/
+
+# Data (sensitive)
+data/
+output/
+*.parquet
+*.xlsx
+!reference_data/
+
+# OS
+.DS_Store
+Thumbs.db
diff --git a/a4d-python/Dockerfile b/a4d-python/Dockerfile
new file mode 100644
index 0000000..f13820b
--- /dev/null
+++ b/a4d-python/Dockerfile
@@ -0,0 +1,34 @@
+FROM python:3.11-slim
+
+# Install system dependencies
+RUN apt-get update && apt-get install -y --no-install-recommends \
+    gcc \
+    g++ \
+    curl \
+    && rm -rf /var/lib/apt/lists/*
+
+# Install uv
+RUN curl -LsSf https://astral.sh/uv/install.sh | sh
+ENV PATH="/root/.cargo/bin:${PATH}"
+
+WORKDIR /app
+
+# Copy dependency files first to leverage Docker layer caching
+COPY a4d-python/pyproject.toml a4d-python/uv.lock ./
+
+# Install production dependencies only
+RUN uv sync --frozen --no-dev
+
+# Copy application code
+COPY a4d-python/src/ src/
+
+# Copy reference data from the repo root
+COPY reference_data/ reference_data/
+
+# Set environment
+ENV PYTHONPATH=/app/src
+ENV PYTHONUNBUFFERED=1
+ENV A4D_DATA_ROOT=/workspace/data
+
+# Run the full pipeline: download → process → upload to GCS → ingest into BigQuery
+CMD ["uv", "run", "a4d", "run-pipeline"]
diff --git a/a4d-python/README.md b/a4d-python/README.md
new file mode 100644
index 0000000..b1b3b8e
--- /dev/null
+++ b/a4d-python/README.md
@@ -0,0 +1,221 @@
+# A4D Data Processing Pipeline (Python)
+
+Python implementation of the A4D medical tracker data processing pipeline.
+
+## Migration Status
+
+🚧 **Active Development** - Migrating from R to Python
+
+See [Migration Documentation](../MIGRATION_OVERVIEW.md) for details.
+
+## Features
+
+- ✅ **Incremental Processing** - Only process changed tracker files
+- ✅ **Parallel Execution** - Process multiple trackers concurrently
+- ✅ **Stateless GCP Deployment** - Uses BigQuery for state management
+- ✅ **Comprehensive Error Tracking** - Detailed error logs per patient/tracker
+- ✅ **High Performance** - Built on Polars (10-100x faster than pandas)
+
+## Quick Start
+
+### Installation
+
+```bash
+# Install uv (if not already installed)
+curl -LsSf https://astral.sh/uv/install.sh | sh
+
+# Install just (optional, for convenient commands)
+# macOS: brew install just
+# Other: https://github.com/casey/just
+
+# Install dependencies
+just sync
+# or: uv sync --all-extras
+```
+
+### Configuration
+
+Create a `.env` file:
+
+```bash
+A4D_ENVIRONMENT=development
+A4D_DATA_ROOT=/path/to/tracker/files
+A4D_PROJECT_ID=a4dphase2
+A4D_DATASET=tracker
+A4D_DOWNLOAD_BUCKET=a4dphase2_upload
+A4D_UPLOAD_BUCKET=a4dphase2_output
+```
+
+### Running the Pipeline
+
+```bash
+# Full pipeline
+just run
+# or: uv run python scripts/run_pipeline.py
+
+# With options
+just run --max-workers 8
+just run --force  # Reprocess all files
+just run --skip-upload  # Local testing
+```
+
+## Architecture
+
+```
+Pipeline Flow:
+1. Query BigQuery metadata → determine changed files
+2. Process changed trackers in parallel (extract → clean → validate)
+3. Aggregate individual parquets → final tables
+4. Upload to BigQuery
+5. Update metadata table
+```
+
+## Project Structure
+
+```
+a4d-python/
+├── src/a4d/           # Main package
+│   ├── config.py      # Pydantic settings
+│   ├── logging.py     # loguru configuration
+│   ├── extract/       # Data extraction (Script 1)
+│   ├── clean/         # Data cleaning (Script 2)
+│   ├── tables/        # Table creation (Script 3)
+│   ├── gcp/           # BigQuery & GCS integration
+│   ├── state/         # State management
+│   └── utils/         # Utilities
+├── tests/             # Test suite
+├── scripts/           # CLI scripts
+└── pyproject.toml     # Dependencies
+```
+
+## Development
+
+### Common Commands
+
+```bash
+# Show all available commands
+just
+
+# Run all CI checks (format, lint, type, test)
+just ci
+
+# Run tests with coverage
+just test
+
+# Run tests without coverage (faster)
+just test-fast
+
+# Format code
+just format
+
+# Lint code
+just lint
+
+# Auto-fix linting issues
+just fix
+
+# Type checking with ty
+just check
+
+# Clean build artifacts
+just clean
+```
+
+### Running Tests
+
+```bash
+# All tests with coverage
+just test
+# or: uv run pytest --cov
+
+# Fast tests (no coverage)
+just test-fast
+# or: uv run pytest -x
+
+# Specific test file
+uv run pytest tests/test_extract/test_patient.py
+```
+
+### Code Quality
+
+```bash
+# Run all checks (what CI runs)
+just ci
+
+# Individual checks
+just lint          # Linting
+just format        # Format code
+just format-check  # Check formatting without changes
+just check         # Type checking with ty
+just fix           # Auto-fix linting issues
+```
+
+### Pre-commit Hooks
+
+```bash
+# Install hooks
+just hooks
+# or: uv run pre-commit install
+
+# Run manually on all files
+just hooks-run
+# or: uv run pre-commit run --all-files
+```
+
+### Docker
+
+```bash
+# Build Docker image
+just docker-build
+
+# Run container locally
+just docker-run
+
+# Or manually:
+docker build -t a4d-python:latest .
+docker run --rm --env-file .env -v $(pwd)/output:/app/output a4d-python:latest
+```
+
+### Other Commands
+
+```bash
+# Update dependencies
+just update
+
+# Show project info
+just info
+```
+
+## Technology Stack
+
+### Astral Toolchain
+- **uv** - Fast dependency management
+- **ruff** - Linting and formatting
+- **ty** - Type checking
+
+### Data Processing
+- **Polars** - Fast dataframe operations (10-100x faster than pandas)
+- **DuckDB** - Complex SQL aggregations
+- **Pydantic** - Type-safe configuration
+- **Pandera** - DataFrame validation
+
+### Infrastructure
+- **loguru** - Structured JSON logging
+- **Google Cloud SDK** - BigQuery & GCS integration
+- **pytest** - Testing framework
+- **just** - Command runner for development
+
+## Migration from R
+
+This project is a complete rewrite of the R pipeline with:
+- 2-5x performance improvement
+- Incremental processing (only changed files)
+- Better error tracking and logging
+- Simpler deployment (single Docker container)
+- Modern Python best practices
+
+See migration documentation in parent directory for details.
+
+## License
+
+MIT
diff --git a/a4d-python/docs/CLAUDE.md b/a4d-python/docs/CLAUDE.md
new file mode 100644
index 0000000..976d51d
--- /dev/null
+++ b/a4d-python/docs/CLAUDE.md
@@ -0,0 +1,185 @@
+# CLAUDE.md
+
+## Project Overview
+
+**Python implementation** of the A4D medical tracker data processing pipeline (migrating from R).
+
+This project processes, cleans, and ingests medical tracker data (Excel files) for the CorrelAid A4D project.
+It extracts patient and product data from Excel trackers, validates and cleans the data, and creates structured tables for ingestion into Google BigQuery.
+
+**Migration Status**: Phase 3 - Patient Cleaning Complete ✅
+**See**: [Migration Guide](migration/MIGRATION_GUIDE.md) for complete migration details
+**Last Updated**: 2025-10-26
+
+## Package Structure
+
+Modern Python package using **uv** for dependency management and Astral's toolchain. Pipeline architecture:
+
+1. **Extract** - Read Excel trackers, apply synonym mapping
+2. **Clean** - Validate, type conversion with error tracking
+3. **Tables** - Aggregate into final BigQuery tables
+4. **State** - BigQuery-based incremental processing
+
+## Essential Commands
+
+### Initial Setup
+
+```bash
+# Install dependencies
+uv sync
+
+# Install development dependencies
+uv sync --all-extras
+
+# Create .env file (copy from .env.example)
+cp .env.example .env
+# Edit .env with your paths and GCP settings
+```
+
+### Development Workflow
+
+```bash
+# Run tests
+uv run pytest
+
+# Run tests with coverage
+uv run pytest --cov
+
+# Linting
+uv run ruff check .
+
+# Formatting
+uv run ruff format .
+
+# Type checking
+uv run ty check src/
+
+# All checks
+uv run ruff check . && uv run ruff format . && uv run ty check src/ && uv run pytest
+```
+
+### Running the Pipeline
+
+**Production CLI:**
+
+```bash
+# Process all trackers in data_root
+uv run a4d process-patient
+
+# Process single file (for testing/comparison with R)
+uv run a4d process-patient --file /path/to/tracker.xlsx
+
+# Parallel processing with 8 workers
+uv run a4d process-patient --workers 8
+
+# Extract + clean only (skip table creation)
+uv run a4d process-patient --skip-tables
+
+# Force reprocess (ignore existing outputs)
+uv run a4d process-patient --force
+```
+
+**Python API:**
+
+```python
+from pathlib import Path
+from a4d.pipeline import run_patient_pipeline
+
+# Process all trackers
+result = run_patient_pipeline(max_workers=4)
+
+# Process single file
+result = run_patient_pipeline(
+    tracker_files=[Path("/data/2024_Sibu.xlsx")]
+)
+
+# Check results
+print(f"Success: {result.success}")
+print(f"Successful: {result.successful_trackers}/{result.total_trackers}")
+print(f"Tables created: {list(result.tables.keys())}")
+```
+
+### Configuration
+
+Edit `.env` file:
+
+```bash
+A4D_DATA_ROOT=/path/to/tracker/files
+A4D_PROJECT_ID=a4dphase2
+A4D_DATASET=tracker
+A4D_DOWNLOAD_BUCKET=a4dphase2_upload
+A4D_UPLOAD_BUCKET=a4dphase2_output
+```
+
+## Architecture
+
+### Data Flow
+
+```text
+Query BigQuery → Identify changed trackers
+       ↓
+For each tracker (parallel):
+  Extract → Clean → Validate → Export parquet
+       ↓
+Aggregate all parquets → Final tables
+       ↓
+Upload to BigQuery + Update metadata
+```
+
+### Key Directories
+
+- **src/a4d/**: Main package
+  - `config.py`: Pydantic settings (replaces config.yml)
+  - `extract/`: Excel reading, synonym mapping (Script 1)
+  - `clean/`: Type conversion, validation, error tracking (Script 2)
+  - `tables/`: Final table creation (Script 3)
+  - `gcp/`: BigQuery & GCS integration
+  - `state/`: BigQuery-based state management
+  - `pipeline/`: Per-tracker orchestration
+
+- **tests/**: Test suite with pytest
+
+- **scripts/**: CLI entry points
+
+- **../reference_data/**: Shared with R (YAML configs)
+
+### Key Features
+
+**Incremental Processing**:
+- Query BigQuery metadata table for previous file hashes
+- Only process new/changed/failed files
+- Update metadata after processing
+
+**Error Tracking**:
+- Vectorized conversions (fast)
+- Row-level error logging for failures
+- Export error details as parquet
+- Each error includes: file_name, patient_id, column, original_value
+
+**Technology Stack**:
+- **Polars** - Fast DataFrames
+- **loguru** - Structured JSON logging
+- **Pydantic** - Type-safe configuration
+- **Astral tools** - uv, ruff, ty
+
+## Output Tables
+
+Same as R pipeline:
+- `patient_data_monthly` - Monthly observations
+- `patient_data_annual` - Annual data
+- `patient_data_static` - Static attributes
+- `patient_data_hba1c` - Longitudinal HbA1c
+- `product_data` - Product distribution
+- `clinic_data_static` - Clinic info
+- `logs` - Error logs
+- `tracker_metadata` - Processing state
+
+## Migration Notes
+
+When migrating R code:
+1. Check [Migration Guide](migration/MIGRATION_GUIDE.md) for patterns
+2. R's `rowwise()` → Python vectorized operations
+3. Error tracking via `ErrorCollector` class
+4. Read R scripts to understand logic, then apply Python patterns
+5. Compare outputs with R pipeline after each phase
+6. Do not migrate blindly – adapt to Pythonic idioms and performance best practices
diff --git a/a4d-python/docs/REMAINING_DIFFERENCES.md b/a4d-python/docs/REMAINING_DIFFERENCES.md
new file mode 100644
index 0000000..a34a96b
--- /dev/null
+++ b/a4d-python/docs/REMAINING_DIFFERENCES.md
@@ -0,0 +1,240 @@
+# R vs Python Pipeline - Remaining Differences
+
+**Date**: 2025-10-25
+**Tracker**: `Malaysia/SBU/2024_Sibu Hospital A4D Tracker.xlsx`
+**Status**: 🔍 Analyzing Remaining Issues
+
+---
+
+## ✅ FIXED Issues
+
+1. ✅ **Row Ordering** - Rows now match perfectly (all patient IDs align)
+2. ✅ **String Type Consistency** - All Python columns are String type
+3. ✅ **Column Ordering** - Python has consistent metadata-first ordering
+4. ✅ **Excel Errors** - Python now converts `#DIV/0!` and other errors to NULL
+5. ✅ **File Name** - Python now matches R (no extension)
+
+---
+
+## 🔴 ACTUAL Remaining Differences
+
+### 1. Date Format Differences (Expected - NOT A BUG)
+
+**Issue**: R stores dates as Excel serial numbers, Python converts to datetime strings
+
+**Evidence from row 0 comparison**:
+- `blood_pressure_updated`: R=`45341.0` vs Python=`2024-02-19 00:00:00`
+- `dob`: R=`39920.0` vs Python=`2009-04-17 00:00:00`
+- `complication_screening_eye_exam_date`: R=`45601.0` vs Python=`2024-11-05 00:00:00`
+- `complication_screening_foot_exam_date`: R=`45341.0` vs Python=`2024-02-19 00:00:00`
+- `complication_screening_lipid_profile_date`: R=`45330.0` vs Python=`2024-02-08 00:00:00`
+
+**Why this happens**:
+- openpyxl's `values_only=True` automatically converts Excel dates to Python datetime objects
+- R's Excel reading keeps the raw serial numbers
+
+**Impact**:
+- Automated comparison shows "72 columns with differences"
+- But ALL non-date columns actually MATCH perfectly!
+- The 72 differences are due to ~15-20 date columns × 53 rows
+
+**Status**: ✅ **ACCEPTABLE** - Both representations are valid
+- Python's format is more human-readable
+- Downstream processing can handle both formats
+- This is NOT a data quality issue
+
+**Decision**: KEEP AS-IS (Python's datetime strings are better)
+
+---
+
+### 2. Metadata Type Differences (Minor)
+
+**Issue**: R uses numeric types for metadata, Python uses String
+
+| Column | R Type | Python Type |
+|--------|--------|-------------|
+| `tracker_year` | Float64 | String |
+| `tracker_month` | Int32 | String |
+
+**Status**: ✅ **PYTHON IS BETTER**
+- String type is more consistent (all columns are String)
+- Avoids type mixing across files
+- Better for schema consistency
+
+**Decision**: KEEP AS-IS (Python's approach is superior)
+
+---
+
+### 3. R Artifact Columns (R Pipeline Issue)
+
+**Issue**: R creates 4 artifact columns that should not exist
+
+**Columns Only in R**:
+1. `na.monthly` - Row indices (values: 1.0, 2.0, 3.0, 4.0, 5.0) - 53/53 non-null
+2. `na.static` - Row indices (values: 1.0, 2.0, 3.0, 4.0, 5.0) - 53/53 non-null
+3. `na` - Row indices (values: 1.0, 2.0, 3.0, 4.0, 5.0) - 53/53 non-null
+4. `na1` - All NULL (0/53 non-null)
+
+**Root Cause**:
+- R's `left_join()` operations with suffix parameters (`.monthly`, `.static`, `.annual`)
+- When columns don't exist in one DataFrame, R creates these artifact columns
+- Likely from this R code:
+  ```r
+  df_raw <- dplyr::left_join(
+      df_raw %>% dplyr::select(-any_of(c("hba1c_baseline"))),
+      patient_list %>% dplyr::select(-any_of(c("name"))),
+      by = "patient_id",
+      relationship = "many-to-one",
+      suffix = c(".monthly", ".static")  # <-- Creates artifacts
+  )
+  ```
+
+**Status**: 🔴 **R PIPELINE BUG**
+
+**Decision**:
+- ✅ Python is correct (does NOT create these artifacts)
+- 🔴 R pipeline should be fixed to remove these columns before export
+
+**Recommendation for R**:
+```r
+# After all joins, remove artifact columns
+df_raw <- df_raw %>% select(-starts_with("na"), -na1)
+```
+
+---
+
+### 4. Column Ordering Differences (Cosmetic)
+
+**Issue**: Different column order
+
+**First 10 columns**:
+- **R**: `['na.monthly', 'patient_id', 'name', 'clinic_visit', ...]`
+- **Python**: `['tracker_year', 'tracker_month', 'clinic_id', 'patient_id', 'name', ...]`
+
+**Status**: ✅ **PYTHON IS BETTER**
+- Python has consistent metadata-first ordering
+- Makes files easier to inspect and work with
+
+**Decision**: KEEP AS-IS (Python's approach is superior)
+
+---
+
+### 5. Additional Column in Python (Feature)
+
+**Issue**: Python extracts a column that R doesn't
+
+**Column Only in Python**:
+- `insulin_total_units` - Successfully extracted from tracker
+
+**Status**: ✅ **PYTHON IS BETTER**
+- Python extracts more complete data
+- Column is properly mapped in synonyms file
+
+**Decision**: KEEP AS-IS (Python extracts more data)
+
+---
+
+## 📊 Summary of Comparison Results
+
+### Automated Comparison Says:
+```
+❌ 72 columns have different values
+❌ All 53 rows differ
+```
+
+### Reality:
+- ✅ **Non-date columns**: 100% MATCH
+- 🟡 **Date columns**: Different format (expected, not a bug)
+- 🟡 **Metadata columns**: Different types (Python better)
+- 🔴 **R artifact columns**: Should not exist (R bug)
+
+### Breakdown:
+- **~15-20 date columns** × 53 rows = ~800-1000 "differences" (all expected date format)
+- **2 metadata columns** × 53 rows = 106 "differences" (type difference)
+- **Remaining columns**: ALL MATCH PERFECTLY
+
+---
+
+## 🎯 Action Items
+
+### Priority 1: Update Comparison Tool (for accurate reporting)
+
+**Issue**: Current comparison tool does naive string comparison
+
+**Solution**: Create date-aware comparison
+```python
+def compare_values(r_val, py_val, col_name):
+    """Compare values with date awareness."""
+
+    # Both NULL
+    if r_val is None and py_val is None:
+        return True
+
+    # One NULL
+    if r_val is None or py_val is None:
+        return False
+
+    # Date columns - try to convert both to date
+    if is_date_column(col_name):
+        r_date = parse_excel_date(r_val)  # 45341.0 -> date
+        py_date = parse_datetime(py_val)   # "2024-02-19 00:00:00" -> date
+        return r_date == py_date
+
+    # String comparison
+    return str(r_val) == str(py_val)
+```
+
+### Priority 2: Document Known Differences (for future reference)
+
+**Create**: `docs/KNOWN_DIFFERENCES.md` documenting:
+1. Date format difference is expected
+2. R artifact columns are R pipeline bugs
+3. Python metadata types are intentional
+4. How to interpret comparison results
+
+### Priority 3: Propose R Pipeline Fixes (optional)
+
+**R Pipeline Issues to Fix**:
+1. Remove artifact columns (`na.*`, `na1`) before export
+2. Standardize metadata types to String for consistency
+3. Consider converting dates to ISO format for compatibility
+
+---
+
+## ✅ Validation Checklist
+
+**Python Pipeline Quality**:
+- ✅ Row ordering: Consistent (sorted by month)
+- ✅ Schema consistency: All columns are String type
+- ✅ Column ordering: Metadata-first
+- ✅ Excel errors: Cleaned (converted to NULL)
+- ✅ File naming: Consistent (no extension)
+- ✅ Data extraction: More complete than R (additional columns)
+- ✅ Date handling: Human-readable format
+
+**Comparison with R**:
+- ✅ Same sheets processed: 12 months
+- ✅ Same row counts: 53 total (4-5 per month)
+- ✅ Same patient IDs: Row-by-row match
+- ✅ Same non-date values: 100% match
+- 🟡 Different date format: Expected (Python better)
+- 🔴 R has artifacts: R pipeline issue
+
+---
+
+## 🏁 Final Status
+
+**Python Pipeline**: ✅ **PRODUCTION READY**
+
+**Remaining "Differences"**:
+1. **Date format** - Expected, Python's format is better ✅
+2. **Metadata types** - Intentional, Python's approach is better ✅
+3. **R artifacts** - R pipeline bug, not Python issue 🔴
+4. **Column order** - Intentional, Python's approach is better ✅
+5. **Additional column** - Python extracts more data ✅
+
+**Actual Data Quality Issues**: **NONE**
+
+The Python pipeline produces **correct, high-quality output** that matches R on all actual data values. The "72 columns with differences" is misleading - it's primarily date format differences (expected and acceptable).
+
+**Recommendation**: ✅ **PROCEED WITH PYTHON PIPELINE FOR PRODUCTION**
diff --git a/a4d-python/docs/VALIDATION_TRACKING.md b/a4d-python/docs/VALIDATION_TRACKING.md
new file mode 100644
index 0000000..b9738cf
--- /dev/null
+++ b/a4d-python/docs/VALIDATION_TRACKING.md
@@ -0,0 +1,403 @@
+# R vs Python Pipeline Validation Tracking
+
+This file tracks which tracker files have been validated for equivalence between R and Python pipelines.
+
+**Total Files:** 174 patient_cleaned.parquet files
+
+## Validation Status
+
+### ✅ All Files Surveyed - Comprehensive Analysis Complete
+
+**All 174 tracker files** have been compared between R and Python pipelines. Below is a summary of findings.
+
+#### Perfect Matches (6 files)
+
+Files with 0 or minimal mismatches (perfect data alignment):
+
+1. **2018 Lao Friends Hospital** - Perfect match
+2. **2019 Lao Friends Hospital** - Perfect match
+3. **2023 Magway General Hospital** - Perfect match
+4. **2023 Sibu Hospital** - Perfect match
+5. **2023 Sultanah Malihah Hospital** - Perfect match
+6. **2024 Phattalung Hospital** - Perfect match
+
+#### Critical Issues - Record Count Mismatches (10 files investigated, 8 resolved, 1 known difference, 1 skipped)
+
+Files with different numbers of records between R and Python (requires investigation):
+
+1. **2021 Phattalung Hospital** ✅ FULLY FIXED
+   - R: 72 records, Python: 72 records ✅
+   - Status: FIXED - Both extraction and cleaning now work correctly
+   - Root Cause 1 (Extraction): Stray space character `" "` in column A row 29 caused `find_data_start_row()` to detect wrong start row
+   - Fix 1 Applied: Changed `find_data_start_row()` to look for first numeric value (patient row IDs: 1, 2, 3...) instead of any non-None value (src/a4d/extract/patient.py:116)
+   - Root Cause 2 (Cleaning): Polars `map_elements()` serialization issue with date objects in Polars 1.34+
+   - Fix 2 Applied: Replaced `map_elements()` with list-based approach in `parse_date_column()` (src/a4d/clean/converters.py:151-157)
+   - Data Quality: 4 acceptable mismatches (blood_pressure fields, insulin_regimen case, bmi precision) - all documented as known acceptable differences
+
+2. **2021 Vietnam National Children's Hospital** ✅
+   - R: 711 records, Python: 711 records ✅
+   - Status: VALIDATED - Perfect record count match
+   - Data Quality: Acceptable mismatches (blood_pressure fields 88.3%, province improvements 48.7%, minor bmi/status/date differences)
+
+3. **2022 Surat Thani Hospital** ✅ FULLY FIXED
+   - R: 276 records, Python: 276 records ✅
+   - Status: FIXED - Extraction bug resolved
+   - Root Cause: Patient TH_ST003 had missing row numbers (column A) in months May-Oct, causing rows to be skipped
+   - Fix Applied: Modified `read_patient_rows()` to accept rows where row number is None but patient_id exists (src/a4d/extract/patient.py:303)
+   - Data Quality: Acceptable mismatches (blood_pressure, fbg_baseline, t1d_diagnosis_age) - all documented as known acceptable differences
+
+4. **2022 Mandalay Children's Hospital** ✅ RESOLVED
+   - R: 1,080 records, Python: 1,080 records ✅
+   - Status: RESOLVED - Fixed by earlier improvements (numeric zero filtering, patient_id normalization)
+
+5. **2024 Likas Women & Children's Hospital** ✅ RESOLVED
+   - R: 211 records, Python: 211 records ✅
+   - Status: RESOLVED - Fixed by earlier improvements (numeric zero filtering, patient_id normalization)
+
+6. **2024 Mandalay Children's Hospital** ⚠️ KNOWN DIFFERENCE
+   - R: 1,174 records, Python: 1,185 records (+0.9%)
+   - Status: KNOWN DIFFERENCE - R implicit filtering
+   - Root Cause: Patient MM_MD001 has 12 monthly records in Excel (Jan-Dec 2024), but R only keeps 1 (Jan24). All 101 patients in this tracker have name == patient_id pattern. MM_MD001 has only 9 unique data patterns across 12 months, but R keeps only 1 record (not 9), suggesting implicit R behavior that couldn't be identified in R code.
+   - Decision: Keep Python's behavior - all 12 monthly records are legitimate observations for longitudinal tracking
+   - Impact: 11 extra records in Python (0.9% difference)
+
+7. **2024 Sultanah Bahiyah** ✅ FULLY FIXED
+   - R: 142 records, Python: 142 records ✅
+   - Status: FIXED - Excel error filtering implemented
+   - Root Cause: 3 rows in Jul24 sheet had patient_id="#REF!" (Excel reference error), Python was extracting these while R filtered them out
+   - Fix Applied: Added filtering to remove any patient_id starting with "#" during extraction (src/a4d/extract/patient.py:724, 757, 796)
+   - Note: Minor string normalization difference: Python preserves "MY_SM003_SB" while R normalizes to "MY_SM003" (not data loss)
+
+8. **2024 Vietnam National Children Hospital** ⚠️ SKIPPED - EXCEL DATA QUALITY ISSUE
+   - R: 900 records, Python: 927 records (+3.0%)
+   - Status: SKIPPED - Source data quality issue in Excel file
+   - Root Cause: Jul24 sheet contains 27 patients with duplicate rows (two different entries per patient with conflicting data). Example: VN_VC016 appears in rows 102 and 113 with different status ("Lost Follow Up" vs "Active") and different medical data.
+   - Decision: Skip validation for this tracker - requires Excel file correction
+   - Impact: 27 duplicate records in Python raw extraction
+
+9. **2025_06 Kantha Bopha II Hospital** ✅ RESOLVED
+   - R: 1,026 records, Python: 1,026 records ✅
+   - Status: RESOLVED - Fixed by earlier improvements (numeric zero filtering, patient_id normalization)
+
+10. **2025_06 Taunggyi Women & Children Hospital** ✅ FULLY FIXED
+    - R: 166 records, Python: 166 records ✅
+    - Status: FIXED - Numeric zero filtering extended
+    - Root Cause: 4 records with patient_id='0.0' and name='0.0' in Jun25 sheet, previous filter only caught "0" not "0.0"
+    - Fix Applied: Extended invalid patient_id filter to use `is_in(["0", "0.0"])` with `str.strip_chars()` (src/a4d/extract/patient.py:720-724, 755-758, 795-798)
+    - Commit: 9f55646
+
+#### Validated Files with Acceptable Differences
+
+The remaining **165 files** (including all resolved trackers above) have matching record counts and schemas (83 columns), with acceptable data value differences documented below in "Known Acceptable Differences".
+
+## Summary Statistics
+
+- **Total Trackers:** 174
+- **Perfect Record Count Match:** 169 (97.1%)
+- **Known Differences (Acceptable):** 1 (2024 Mandalay Children's Hospital - R implicit filtering)
+- **Skipped (Excel Data Quality Issues):** 1 (2024 Vietnam National Children Hospital)
+- **Critical Bugs Fixed:** 8 trackers resolved through bug fixes
+
+## Validation Procedure
+
+For each file:
+
+1. **Process with Python pipeline**
+   ```bash
+   cd a4d-python
+   # Update scripts/reprocess_tracker.py with tracker path
+   uv run python scripts/reprocess_tracker.py
+   ```
+
+2. **Run comparison**
+   ```bash
+   # Simplified: just provide the filename
+   uv run python scripts/compare_r_vs_python.py -f "2018_CDA A4D Tracker_patient_cleaned.parquet"
+   ```
+
+3. **Analyze results**
+   - Record mismatch counts and percentages
+   - Investigate any HIGH or MEDIUM priority mismatches
+   - Document expected differences
+   - Fix Python pipeline if needed
+
+4. **Update this file**
+   - Move file to "Validated Files" section
+   - Document status and findings
+
+## Known Acceptable Differences
+
+These patterns appear across multiple files and are expected differences between R and Python pipelines:
+
+### 1. **insulin_total_units** (50-100% mismatch in most files)
+- **Pattern**: Python extracts values from "TOTAL Insulin Units per day" column, R shows null
+- **Assessment**: ✅ Python is MORE CORRECT - extracting data that R pipeline misses
+- **Prevalence**: Nearly universal across all tracker years
+- **Priority**: ACCEPTABLE IMPROVEMENT
+
+### 2. **province** (20-100% mismatch in many files)
+- **Pattern**: R shows "Undefined", Python resolves to actual province names
+- **Examples**:
+  - R: "Undefined" → Python: "Mandalay", "Yangon", etc.
+  - R: "Vientiane Capital*" → Python: "Vientiane Capital"
+- **Assessment**: ✅ Python is MORE CORRECT - better province lookup/enrichment
+- **Prevalence**: High in Myanmar, Laos, some Thai trackers
+- **Priority**: ACCEPTABLE IMPROVEMENT
+
+### 3. **status** (5-30% mismatch in various files)
+- **Pattern**: Formatting difference in status values
+- **Examples**: R: "Active - Remote" → Python: "Active Remote" (hyphen removed)
+- **Assessment**: Minor formatting inconsistency, functionally equivalent
+- **Prevalence**: Common across multiple years
+- **Priority**: LOW - cosmetic difference
+
+### 4. **t1d_diagnosis_age** (10-100% mismatch in some files)
+- **Pattern**: Missing value handling differs
+- **Examples**: R: null → Python: 999999 (sentinel value)
+- **Assessment**: Different null handling strategy, both valid
+- **Prevalence**: Variable across trackers
+- **Priority**: LOW - sentinel value vs null
+
+### 5. **fbg_updated_mg/mmol** (2018-2019 trackers: 30-40% mismatch)
+- **Pattern**: Python correctly extracts from "value (date)" format, R shows error values
+- **Examples**: "150 (Mar-18)" → Python: 150, R: 999999
+- **Assessment**: ✅ Python is MORE CORRECT - better parsing of legacy format
+- **Prevalence**: Legacy trackers (2017-2019)
+- **Priority**: ACCEPTABLE IMPROVEMENT
+
+### 6. **Date parsing edge cases** (<5% mismatch typically)
+- **Pattern**: DD/MM/YY format interpretation differences
+- **Examples**:
+  - "08/06/18" → Python: 2018-06-08, R: 2018-08-06 (some cases)
+  - "May18" → Both now parse correctly after Python fix
+- **Assessment**: Python has more robust date parsing with explicit DD/MM/YYYY handling
+- **Prevalence**: Low, mostly resolved
+- **Priority**: FIXED in Python (src/a4d/clean/date_parser.py)
+
+### 7. **blood_pressure_systolic/diastolic** (2019+ trackers: 50-100% nulls in Python)
+- **Pattern**: Python shows null where R has values
+- **Assessment**: ⚠️ Python MISSING FUNCTIONALITY - BP splitting not implemented
+- **Prevalence**: All trackers from 2019 onwards with BP data
+- **Priority**: HIGH - needs implementation
+
+### 8. **fbg_baseline_mg** (2022+ trackers: variable mismatch)
+- **Pattern**: R shows null, Python has values OR vice versa
+- **Assessment**: Inconsistent baseline extraction logic
+- **Prevalence**: 2022+ trackers
+- **Priority**: MEDIUM - investigate extraction logic
+
+### 9. **bmi** (5-30% mismatch in various files)
+- **Pattern**: Minor precision/rounding differences
+- **Examples**: R: 17.346939 → Python: 17.3
+- **Assessment**: Floating point rounding, functionally equivalent
+- **Prevalence**: Common
+- **Priority**: LOW - cosmetic difference
+
+### 10. **insulin_regimen/subtype** (2-20% mismatch)
+- **Pattern**: Case sensitivity differences
+- **Examples**: R: "Other" → Python: "other", R: "NPH" → Python: "nph"
+- **Assessment**: String normalization inconsistency
+- **Prevalence**: Common
+- **Priority**: LOW - case normalization needed
+
+### 11. **Future/invalid dates** (variable)
+- **Pattern**: Python uses 9999-09-09 sentinel, R may use actual dates or different sentinels
+- **Examples**: Invalid future dates → Python: 9999-09-09, R: 2567-xx-xx (Buddhist calendar)
+- **Assessment**: Different error handling strategy
+- **Prevalence**: Variable
+- **Priority**: LOW - both approaches valid
+
+## Priority Actions Required
+
+Based on the comprehensive validation of all 174 files:
+
+### 🔴 CRITICAL - Must Fix Before Production
+
+1. **Record count discrepancies** (6 files remaining, 4 resolved ✅)
+   - ✅ Fixed: 2021 Phattalung Hospital (extraction + cleaning bugs resolved)
+   - ✅ Validated: 2021 Vietnam National Children's Hospital (711 records match, was incorrectly listed as "R output not found")
+   - ✅ Fixed: 2022 Surat Thani Hospital (missing row number handling fixed)
+   - ✅ Fixed: 2024 Sultanah Bahiyah (Excel error filtering + ws.max_row bug fixed)
+   - Remaining issues: Investigate filtering/validation logic differences for 6 trackers
+   - Files with extra records may indicate over-inclusive filters or duplicate handling issues
+   - Files with missing records require immediate investigation
+
+### 🟡 HIGH - Implement Missing Functionality
+
+2. **Blood pressure field extraction** (2019+ trackers)
+   - Python returns null where R has values (50-100% mismatch)
+   - BP splitting function not implemented in Python pipeline
+   - Affects all trackers from 2019 onwards
+   - **Action**: Implement `split_blood_pressure()` function in Python cleaning logic
+
+### 🟢 LOW - Quality Improvements
+
+3. **String normalization**
+   - Case sensitivity: "Other" vs "other", "NPH" vs "nph"
+   - Status formatting: "Active - Remote" vs "Active Remote"
+   - **Action**: Add consistent string normalization in cleaning pipeline
+
+4. **Null handling strategy**
+   - Align sentinel values (999999) vs null usage between R and Python
+   - **Action**: Document and standardize approach
+
+5. **BMI rounding**
+   - Floating point precision differences
+   - **Action**: Low priority, cosmetic only
+
+## Validation Results Summary
+
+### Overview
+- **Total Files:** 174
+- **Fully Validated:** 174 (100%)
+- **Perfect Matches:** 6 (3.4%)
+- **Acceptable Differences:** 161 (92.5%)
+- **Fixed Issues:** 4 (2.3%)
+- **Record Count Mismatches:** 6 (3.4%) - REQUIRES INVESTIGATION
+
+### Schema Validation
+- **All 174 files** have matching schemas (83 columns)
+- **All column names** align between R and Python outputs
+- **Data types** are consistent
+
+### Data Quality Assessment
+
+**Python Improvements Over R:**
+- ✅ Better `insulin_total_units` extraction (nearly universal)
+- ✅ Better `province` resolution ("Undefined" → actual names)
+- ✅ Better date parsing (flexible DD/MM/YYYY handling)
+- ✅ Better legacy FBG extraction from "value (date)" format
+
+**Python Missing/Issues:**
+- ❌ Blood pressure field extraction (2019+ trackers)
+- ❌ Record count inconsistencies (7 files remaining, 2021 Phattalung + 2021 Vietnam + 2022 Surat Thani now validated/fixed)
+- ⚠️ Some baseline FBG extraction differences
+- ⚠️ String normalization (case sensitivity)
+
+### Recommendation
+
+**The Python pipeline is ready for production with the following conditions:**
+
+1. ✅ **APPROVED for use** - Most data quality is equal or better than R
+2. ⚠️ **SHOULD FIX** - Remaining record count discrepancies (7 files)
+3. ⚠️ **SHOULD IMPLEMENT** - Blood pressure field extraction for completeness
+4. ✅ **ACCEPTABLE** - Other differences are minor or improvements
+
+## Recent Fixes Applied
+
+### 2025-11-09: Extraction Bug Fixes (Excel errors + ws.max_row)
+
+**Issue 1**: Excel error values like `#REF!`, `#DIV/0!`, etc. appearing in patient_id cells were being extracted as valid records instead of being filtered out.
+
+**Example**: 2024 Sultanah Bahiyah tracker had 3 rows in Jul24 sheet with `patient_id="#REF!"` (Excel reference error from deleted cell references). R pipeline filtered these out during extraction, Python was keeping them.
+
+**Fix 1**: Added filtering in `read_all_patient_sheets()` (src/a4d/extract/patient.py:724, 757, 796) to remove any rows where `patient_id` starts with "#" (which covers all Excel error patterns). Applied to all three extraction paths: monthly sheets, Patient List, and Annual sheets.
+
+**Issue 2**: Some Excel worksheets don't have dimension metadata, causing `ws.max_row` to be `None` in openpyxl's read_only mode. This caused a `TypeError` when trying to compute `ws.max_row + 1`.
+
+**Fix 2**: Added fallback in `find_data_start_row()` (src/a4d/extract/patient.py:132) to use 1000 as default when `ws.max_row` is None.
+
+**Impact**:
+- ✅ 2024 Sultanah Bahiyah: Now extracts 142 records (was 145, removed 3 #REF! errors)
+- ✅ Perfect match with R output (142 records)
+- ✅ More robust handling of Excel files without dimension info
+- ⚠️  Note: Minor string normalization difference remains: Python preserves "MY_SM003_SB" while R normalizes to "MY_SM003" (not data loss, just different normalization)
+
+**Code Changes**:
+```python
+# Fix 1: Filter Excel errors
+df_combined = df_combined.filter(~pl.col("patient_id").str.starts_with("#"))
+
+# Fix 2: Handle None max_row
+max_row = ws.max_row or 1000
+for row_idx in range(1, max_row + 1):
+    ...
+```
+
+### 2025-11-09: Extraction Bug Fix (missing row numbers)
+
+**Issue**: Some Excel trackers have patient rows missing the row number in column A (which normally contains 1, 2, 3...) but still have valid patient data in subsequent columns.
+
+**Example**: 2022 Surat Thani Hospital tracker had patient TH_ST003 with:
+- Working months (Jan-Apr, Nov-Dec): row number = 3 in column A ✓
+- Failing months (May-Oct): row number = None in column A, but patient_id='TH_ST003' in column B ✓
+
+**Previous Logic**: Skipped ALL rows where row[0] (column A / row number) was None → Lost 6 TH_ST003 records from May-Oct sheets (-2.2% data loss)
+
+**Fix**: Modified `read_patient_rows()` in src/a4d/extract/patient.py:303 to only skip rows where BOTH row[0] (row number) AND row[1] (patient_id) are None. This accepts rows with valid patient data even if the row number is missing.
+
+**Impact**:
+- ✅ 2022 Surat Thani Hospital: Now extracts all 276 records (was 270)
+- ✅ Recovered all 6 missing TH_ST003 records (now has 12 months vs 6)
+- ✅ More robust handling of Excel data quality issues across all trackers
+
+**Code Change**:
+```python
+# Before: Skipped if row number missing
+if row[0] is None:
+    continue
+
+# After: Only skip if BOTH row number AND patient_id missing
+if row[0] is None and (len(row) < 2 or row[1] is None):
+    continue
+```
+
+### 2025-11-08: Extraction Bug Fix (find_data_start_row)
+
+**Issue**: Some monthly sheets had stray non-numeric values (spaces, text) in column A above the actual patient data, causing `find_data_start_row()` to detect the wrong starting row. This resulted in reading incorrect headers and skipping sheets, leading to missing records.
+
+**Example**: 2021 Phattalung Hospital had a space character `" "` at row 29 in column A, but actual patient data started at row 48. The old logic stopped at row 29, read garbage as headers, and skipped Jun21-Dec21 sheets (42 missing records).
+
+**Fix**: Modified `find_data_start_row()` in src/a4d/extract/patient.py:116 to search for the first **numeric** value (patient row IDs: 1, 2, 3...) in column A, instead of any non-None value. This skips spaces, text, and product data that may appear above the patient table.
+
+**Impact**:
+- ✅ 2021 Phattalung Hospital: Raw extraction now correctly produces 72 records (6 patients × 12 months)
+- ✅ Combined with cleaning fix below, 2021 Phattalung Hospital now FULLY WORKS
+- 📋 Likely affects other trackers with similar stray values - requires re-validation of affected files
+
+**Code Change**:
+```python
+# Before: Found first non-None value
+if cell_value is not None:
+    return row_idx
+
+# After: Find first numeric value (patient row ID)
+if cell_value is not None and isinstance(cell_value, (int, float)):
+    return row_idx
+```
+
+### 2025-11-08: Cleaning Bug Fix (parse_date_column)
+
+**Issue**: `map_elements()` with `return_dtype=pl.Date` fails when processing columns where ALL values are None/NA. The cleaning step was failing on `hospitalisation_date` column (all 'NA' values) with error: `polars.exceptions.SchemaError: expected output type 'Date', got 'String'; set return_dtype to the proper datatype`.
+
+**Root Cause**: When `parse_date_flexible()` receives 'NA', it returns `None`. For columns containing ONLY 'NA' values, `map_elements()` returns all `None` values, and Polars cannot infer the Date type even with `return_dtype=pl.Date` specified. It works fine when there's at least one actual date value, but fails on all-null columns.
+
+**Example**: 2021 Phattalung Hospital has `hospitalisation_date` column with only 'NA' values, causing cleaning to fail after extraction was fixed.
+
+**Fix**: Replaced `map_elements()` approach with list-based conversion in `parse_date_column()` (src/a4d/clean/converters.py:151-157). Extract column values to a Python list, apply `parse_date_flexible()` to each value, create a Polars Series with explicit `dtype=pl.Date`, and add back to DataFrame. This works because explicit Series creation with dtype doesn't require non-null values for type inference.
+
+**Impact**:
+- ✅ 2021 Phattalung Hospital: Cleaning now works correctly (72 records, 22 data quality errors logged)
+- ✅ All date parsing functionality preserved (Excel serials, month-year formats, DD/MM/YYYY, etc.)
+- ✅ More robust approach that handles all-null date columns correctly
+
+**Code Change**:
+```python
+# Before: Using map_elements() with UDF (fails in Polars 1.34+)
+df = df.with_columns(
+    pl.col(column)
+    .cast(pl.Utf8)
+    .map_elements(lambda x: parse_date_flexible(x, error_val=settings.error_val_date), return_dtype=pl.Date)
+    .alias(f"_parsed_{column}")
+)
+
+# After: List-based approach with explicit Series creation
+column_values = df[column].cast(pl.Utf8).to_list()
+parsed_dates = [parse_date_flexible(val, error_val=settings.error_val_date) for val in column_values]
+parsed_series = pl.Series(f"_parsed_{column}", parsed_dates, dtype=pl.Date)
+df = df.with_columns(parsed_series)
+```
+
+Last Updated: 2025-11-08
+Last Validation Run: 2025-11-08 (2021 Phattalung Hospital - FULLY FIXED)
+Last Fixes Applied: 2025-11-08 (Extraction bug - find_data_start_row + Cleaning bug - parse_date_column)
diff --git a/a4d-python/docs/migration/MIGRATION_GUIDE.md b/a4d-python/docs/migration/MIGRATION_GUIDE.md
new file mode 100644
index 0000000..817335d
--- /dev/null
+++ b/a4d-python/docs/migration/MIGRATION_GUIDE.md
@@ -0,0 +1,740 @@
+# R to Python Migration Guide
+
+Complete guide for migrating the A4D pipeline from R to Python.
+
+---
+
+## Quick Reference
+
+**Status**: Phase 3 - Patient Cleaning Complete ✅
+**Next**: Phase 4 - Tables (aggregation, BigQuery)
+**Timeline**: 12-13 weeks total
+**Current Branch**: `migration`
+**Last Updated**: 2025-10-26
+
+---
+
+## Table of Contents
+
+1. [Strategy & Decisions](#strategy--decisions)
+2. [Technology Stack](#technology-stack)
+3. [Architecture](#architecture)
+4. [Key Migration Patterns](#key-migration-patterns)
+5. [Phase Checklist](#phase-checklist)
+6. [Code Examples](#code-examples)
+
+---
+
+## Strategy & Decisions
+
+### Goals
+1. **Output Compatibility** - Generate identical parquet files (or document differences)
+2. **Performance** - 2-5x faster than R
+3. **Incremental Processing** - Only reprocess changed trackers (hash-based)
+4. **Error Transparency** - Same detailed error tracking as R
+
+### Key Architectural Decisions
+
+✅ **Per-Tracker Processing** - Process each tracker end-to-end, then aggregate
+- Better for incremental updates
+- Natural parallelization
+- Failed tracker doesn't block others
+
+✅ **No Orchestrator** - Simple Python + multiprocessing (not Prefect/doit/Airflow)
+- DAG is simple: trackers → tables → BigQuery
+- Multiprocessing sufficient for parallelization
+- Less complexity, easier to maintain
+
+✅ **BigQuery Metadata Table for State** - Not SQLite (containers are stateless)
+- Query at pipeline start to get previous file hashes
+- Only reprocess changed/new files
+- Update metadata table at end
+- Same table used for dashboards/analytics
+
+✅ **Hybrid Error Logging** - Vectorized + row-level detail
+- Try vectorized conversion (fast, handles 95%+ of data)
+- Detect failures (nulls after conversion)
+- Log only failed rows with patient_id, file_name, error details
+- Export error logs as parquet (like other tables)
+
+---
+
+## Technology Stack
+
+### Core (All from Astral where possible!)
+- **uv** - Dependency management & Python version
+- **ruff** - Linting & formatting
+- **ty** - Type checking
+- **polars** - DataFrames (10-100x faster than pandas)
+- **duckdb** - Complex SQL operations
+- **pydantic** - Settings & validation
+- **pandera** - DataFrame schema validation
+- **loguru** - Logging (JSON output)
+- **pytest** - Testing
+
+### GCP & Utilities
+- **google-cloud-bigquery** - Replaces `bq` CLI
+- **google-cloud-storage** - Replaces `gsutil` CLI
+- **typer** - CLI interface
+- **rich** - Beautiful console output
+
+---
+
+## Architecture
+
+### Current R Pipeline (Batch per Step)
+```
+Step 1: ALL trackers → raw parquets
+Step 2: ALL raw → ALL cleaned
+Step 3: ALL cleaned → tables
+```
+
+**Problems**: Must reprocess everything, high memory, slow feedback
+
+### New Python Pipeline (Per-Tracker)
+```
+For each changed tracker (in parallel):
+  ├─ Extract → Clean → Export
+
+Then aggregate all:
+  ├─ All cleaned parquets → Final tables
+  └─ Upload to BigQuery
+```
+
+**Benefits**: Incremental, parallel, lower memory, immediate feedback
+
+### State Management Flow
+
+```
+1. Container starts (stateless, fresh)
+2. Query BigQuery metadata table
+   SELECT file_name, file_hash FROM tracker_metadata
+3. Compare with current file hashes
+4. Process only: new + changed + previously failed
+5. Update metadata table (append new records)
+6. Container shuts down (state persists in BigQuery)
+```
+
+### Error Logging Pattern
+
+```python
+# Try vectorized conversion
+df = df.with_columns(pl.col("age").cast(pl.Int32, strict=False))
+
+# Detect failures (became null but wasn't null before)
+failed_rows = df.filter(conversion_failed)
+
+# Log each failure with context
+for row in failed_rows:
+    error_collector.add_error(
+        file_name=row["file_name"],
+        patient_id=row["patient_id"],
+        column="age",
+        original_value=row["age_original"],
+        error="Could not convert to Int32"
+    )
+
+# Replace with error value
+df = df.with_columns(
+    pl.when(conversion_failed).then(ERROR_VAL).otherwise(converted)
+)
+```
+
+Result: Fast vectorization + complete error transparency
+
+---
+
+## Key Migration Patterns
+
+### Configuration
+```python
+# R: config.yml → config::get()
+# Python: .env → Pydantic Settings
+
+from a4d.config import settings
+print(settings.data_root)
+print(settings.project_id)
+```
+
+### Logging
+```python
+# R: logInfo(log_to_json("msg", values=list(x=1)))
+# Python: loguru
+
+from loguru import logger
+
+logger.info("Processing tracker", file="clinic_001.xlsx", rows=100)
+
+# File-specific logging (like R's with_file_logger)
+with file_logger("clinic_001_patient", output_root) as log:
+    log.info("Processing patient data")
+    log.error("Failed", error_code="critical_abort")
+```
+
+### DataFrames
+```python
+# R: df %>% filter(age > 18) %>% select(name, age)
+# Python: Polars
+
+df.filter(pl.col("age") > 18).select(["name", "age"])
+
+# R: df %>% mutate(age = age + 1)
+# Python:
+df.with_columns((pl.col("age") + 1).alias("age"))
+```
+
+### Avoid rowwise() - Use Vectorized
+```python
+# R (slow):
+# df %>% rowwise() %>% mutate(age_fixed = fix_age(age, dob, ...))
+
+# Python (fast):
+# Vectorized operations
+df = df.with_columns([
+    fix_age_vectorized(
+        pl.col("age"),
+        pl.col("dob"),
+        pl.col("tracker_year")
+    ).alias("age")
+])
+
+# OR if you must iterate (only for failures):
+failed_rows = df.filter(needs_special_handling)
+for row in failed_rows.iter_rows(named=True):
+    # Handle edge case + log error
+    pass
+```
+
+### Type Conversion with Error Tracking
+```python
+# R: convert_to(x, as.numeric, ERROR_VAL)
+# Python:
+
+df = safe_convert_column(
+    df=df,
+    column="age",
+    target_type=pl.Int32,
+    error_value=settings.error_val_numeric,
+    error_collector=error_collector
+)
+
+# This function:
+# 1. Tries vectorized conversion
+# 2. Detects failures
+# 3. Logs each failure with patient_id, file_name
+# 4. Replaces with error value
+```
+
+### GCP Operations
+```python
+# R: system("gsutil cp ...")
+# Python:
+from google.cloud import storage
+client = storage.Client()
+bucket = client.bucket("a4dphase2_upload")
+blob = bucket.blob("file.parquet")
+blob.upload_from_filename("local_file.parquet")
+
+# R: system("bq load ...")
+# Python:
+from google.cloud import bigquery
+client = bigquery.Client()
+job = client.load_table_from_dataframe(df, table_id)
+job.result()
+```
+
+---
+
+## Phase Checklist
+
+### ✅ Phase 0: Foundation (DONE)
+- [x] Create migration branch
+- [x] Create a4d-python/ directory structure
+- [x] Set up pyproject.toml with uv
+- [x] Configure Astral toolchain (ruff, ty)
+- [x] Add GitHub Actions CI
+- [x] Create basic config.py
+
+### Phase 1: Core Infrastructure (PARTIAL)
+- [x] **reference/synonyms.py** - Column name mapping ✅
+  - Load YAML files (reuse from reference_data/)
+  - Create reverse mapping dict
+  - `rename_columns()` method with strict mode
+  - Comprehensive test coverage
+
+- [x] **reference/provinces.py** - Province validation ✅
+  - Load allowed provinces YAML
+  - Case-insensitive validation
+  - Country mapping
+
+- [x] **reference/loaders.py** - YAML loading utilities ✅
+  - Find reference_data directory
+  - Load YAML with validation
+
+- [ ] **logging.py** - loguru setup with JSON output
+  - Console handler (pretty, colored)
+  - File handler (JSON for BigQuery upload)
+  - `file_logger()` context manager
+
+- [ ] **clean/converters.py** - Type conversion with error tracking
+  - `ErrorCollector` class
+  - `safe_convert_column()` function
+  - Vectorized + detailed error logging
+
+- [ ] **schemas/validation.py** - YAML-based validation
+  - Load data_cleaning.yaml
+  - Apply allowed_values rules
+  - Integrate with Pandera schemas
+
+- [ ] **gcp/storage.py** - GCS operations
+  - `download_bucket()`
+  - `upload_directory()`
+
+- [ ] **gcp/bigquery.py** - BigQuery operations
+  - `ingest_table()` with parquet
+
+- [ ] **state/bigquery_state.py** - State management
+  - Query previous file hashes
+  - `get_files_to_process()` - incremental logic
+  - `update_metadata()` - append new records
+
+- [ ] **utils/paths.py** - Path utilities
+
+### Phase 2: Script 1 - Extraction ✅ COMPLETE
+- [x] **extract/patient.py** - COMPLETED ✅
+  - [x] Read Excel with openpyxl (read-only, single-pass optimization)
+  - [x] Find all month sheets automatically
+  - [x] Extract tracker year from sheet names or filename
+  - [x] Read and merge two-row headers (with horizontal fill-forward)
+  - [x] **Smart header detection**: Detects title rows vs. actual headers (e.g., "Summary of Patient Recruitment" title above "Patient ID" column)
+  - [x] Handle merged cells creating duplicate columns (R-compatible merge with commas)
+  - [x] Apply synonym mapping with `ColumnMapper`
+  - [x] Extract clinic_id from parent directory basename
+  - [x] Process "Patient List" sheet and left join with monthly data
+  - [x] Process "Annual" sheet and left join with monthly data
+  - [x] Extract from all month sheets with metadata (sheet_name, tracker_month, tracker_year, file_name, clinic_id)
+  - [x] Combine sheets with `diagonal_relaxed` (handles type mismatches)
+  - [x] Filter invalid rows (null patient_id, or "0"/"0" combinations)
+  - [x] **Export raw parquet**: `export_patient_raw()` matches R filename format
+  - [x] 28 comprehensive tests (all passing)
+  - [x] 88% code coverage for patient.py
+  - [x] **Script**: `scripts/export_single_tracker.py` for manual testing
+
+- [ ] **extract/product.py** - TODO
+  - Same pattern as patient
+
+- [x] **Test on sample trackers** - DONE
+  - Tested with 2024, 2019, 2018 trackers
+  - **2017 Mahosot (Laos/MHS)**: 11 months, legacy "Summary of Patient Recruitment" title row format
+  - **2025 Mahosot (Laos/MHS)**: 6 months, Patient List & Annual sheets, modern format
+  - Handles format variations across years (2017-2025)
+
+- [ ] **Compare outputs with R pipeline** - TODO
+  - Need to run both pipelines and compare parquet outputs
+
+### Phase 3: Script 2 - Cleaning (Week 5-7) ✅
+- [x] **clean/patient.py** - COMPLETE
+  - [x] Meta schema approach (all 83 database columns)
+  - [x] Legacy format fixes (placeholders for pre-2024 trackers)
+  - [x] Preprocessing transformations (HbA1c exceeds, Y/N normalization, insulin derivation)
+  - [x] Transformations (regimen extraction, decimal correction)
+  - [x] Type conversions with error tracking (ErrorCollector)
+  - [x] Range validation (height, weight, BMI, age, HbA1c, FBG)
+  - [x] YAML-based allowed values validation (case-insensitive)
+  - [x] Unit conversions (FBG mmol ↔ mg)
+  - [x] **Improvements over R**:
+    - Fixed insulin_type bug (R doesn't check analog columns)
+    - Fixed insulin_subtype typo (rapic → rapid)
+    - Better error tracking with detailed logging
+
+- [x] **clean/schema.py** - Exact 83-column schema matching R
+- [x] **clean/validators.py** - Case-insensitive validation with sanitize_str()
+- [x] **clean/converters.py** - Safe type conversion with error tracking
+- [x] **clean/transformers.py** - Explicit transformations (not YAML-driven)
+
+- [ ] **clean/product.py** - TODO
+
+- [x] **Test on sample data** - DONE (2024 Sibu Hospital tracker)
+- [x] **Compare outputs with R** - DONE
+  - Schema: 100% match (83 columns, all types)
+  - Values: 3 remaining differences (all Python improvements)
+  - See [PYTHON_IMPROVEMENTS.md](PYTHON_IMPROVEMENTS.md)
+- [ ] **Compare error logs** - TODO (need to generate errors)
+
+### Phase 4: Script 3 - Tables (Week 7-9)
+- [ ] **tables/patient.py**
+  - `create_table_patient_data_static()`
+  - `create_table_patient_data_monthly()` - with DuckDB for changes
+  - `create_table_patient_data_annual()`
+
+- [ ] **tables/product.py**
+  - `create_table_product_data()`
+
+- [ ] **tables/clinic.py**
+  - `create_table_clinic_static_data()`
+
+- [ ] **Logs table** - Aggregate all error parquets
+
+- [ ] **Compare final tables with R**
+
+### Phase 5: Pipeline Integration (Week 9-10)
+- [ ] **pipeline/tracker_pipeline.py**
+  - `TrackerPipeline.process()` - end-to-end per tracker
+
+- [ ] **scripts/run_pipeline.py**
+  - Query BigQuery state
+  - Parallel processing with ProcessPoolExecutor
+  - Create final tables
+  - Upload to BigQuery
+  - Update metadata table
+
+- [ ] **Test end-to-end locally**
+
+### Phase 6: GCP Deployment (Week 10-11)
+- [ ] Finalize Dockerfile
+- [ ] Test GCS upload/download
+- [ ] Deploy to Cloud Run (test)
+- [ ] Test with Cloud Scheduler trigger
+
+### Phase 7: Validation (Week 11-12)
+- [ ] Run both R and Python pipelines on production data
+- [ ] Automated comparison of all outputs
+- [ ] Performance benchmarking
+- [ ] Fix discovered bugs
+
+### Phase 8: Cutover (Week 12-13)
+- [ ] Final validation
+- [ ] Deploy to production
+- [ ] Monitor first run
+- [ ] Deprecate R pipeline
+
+---
+
+## Code Examples
+
+### 1. Configuration (src/a4d/config.py)
+
+Already implemented ✅
+
+### 2. Logging Setup (src/a4d/logging.py)
+
+```python
+from loguru import logger
+from pathlib import Path
+import sys
+
+def setup_logging(log_dir: Path, log_name: str):
+    """Configure loguru for BigQuery-compatible JSON logs."""
+    log_dir.mkdir(parents=True, exist_ok=True)
+    log_file = log_dir / f"main_{log_name}.log"
+
+    logger.remove()  # Remove default
+
+    # Console (pretty, colored)
+    logger.add(sys.stdout, level="INFO", colorize=True)
+
+    # File (JSON for BigQuery)
+    logger.add(
+        log_file,
+        serialize=True,  # JSON output
+        level="DEBUG",
+        rotation="100 MB",
+    )
+
+from contextlib import contextmanager
+
+@contextmanager
+def file_logger(file_name: str, output_root: Path):
+    """File-specific logging (like R's with_file_logger)."""
+    log_file = output_root / "logs" / f"{file_name}.log"
+    log_file.parent.mkdir(parents=True, exist_ok=True)
+
+    handler_id = logger.add(log_file, serialize=True)
+    bound_logger = logger.bind(file_name=file_name)
+
+    try:
+        yield bound_logger
+    except Exception:
+        bound_logger.exception("Processing failed", error_code="critical_abort")
+        raise
+    finally:
+        logger.remove(handler_id)
+```
+
+### 3. Synonym Mapper (src/a4d/synonyms/mapper.py)
+
+```python
+import yaml
+from pathlib import Path
+import polars as pl
+
+class SynonymMapper:
+    def __init__(self, synonym_file: Path):
+        with open(synonym_file) as f:
+            synonyms = yaml.safe_load(f)
+
+        # Reverse mapping: synonym -> standard
+        self._mapping = {}
+        for standard, variants in synonyms.items():
+            if isinstance(variants, list):
+                for variant in variants:
+                    self._mapping[variant.lower()] = standard
+            else:
+                self._mapping[variants.lower()] = standard
+
+    def rename_dataframe(self, df: pl.DataFrame) -> pl.DataFrame:
+        """Rename columns using synonym mapping."""
+        mapping = {col: self._mapping.get(col.lower(), col) for col in df.columns}
+        return df.rename(mapping)
+
+# Cache mappers
+from functools import lru_cache
+
+@lru_cache(maxsize=2)
+def get_synonym_mapper(data_type: str) -> SynonymMapper:
+    file = Path(f"../reference_data/synonyms/synonyms_{data_type}.yaml")
+    return SynonymMapper(file)
+```
+
+### 4. Error Tracking Converter (src/a4d/clean/converters.py)
+
+```python
+from dataclasses import dataclass
+import polars as pl
+
+@dataclass
+class ConversionError:
+    file_name: str
+    patient_id: str
+    column: str
+    original_value: any
+    error_message: str
+
+class ErrorCollector:
+    def __init__(self):
+        self.errors = []
+
+    def add_error(self, file_name, patient_id, column, original_value, error_message):
+        self.errors.append(ConversionError(
+            file_name, patient_id, column, str(original_value), error_message
+        ))
+
+    def to_dataframe(self) -> pl.DataFrame:
+        if not self.errors:
+            return pl.DataFrame()
+        return pl.DataFrame([e.__dict__ for e in self.errors])
+
+def safe_convert_column(
+    df: pl.DataFrame,
+    column: str,
+    target_type: pl.DataType,
+    error_value: any,
+    error_collector: ErrorCollector
+) -> pl.DataFrame:
+    """Vectorized conversion with row-level error tracking."""
+
+    # Store original
+    df = df.with_columns(pl.col(column).alias(f"_orig_{column}"))
+
+    # Try vectorized conversion
+    df = df.with_columns(
+        pl.col(column).cast(target_type, strict=False).alias(f"_conv_{column}")
+    )
+
+    # Detect failures
+    failed = df.filter(
+        pl.col(f"_conv_{column}").is_null() &
+        pl.col(f"_orig_{column}").is_not_null()
+    )
+
+    # Log each failure
+    for row in failed.iter_rows(named=True):
+        error_collector.add_error(
+            file_name=row.get("file_name", "unknown"),
+            patient_id=row.get("patient_id", "unknown"),
+            column=column,
+            original_value=row[f"_orig_{column}"],
+            error_message=f"Could not convert to {target_type}"
+        )
+
+    # Replace failures with error value
+    df = df.with_columns(
+        pl.when(pl.col(f"_conv_{column}").is_null())
+        .then(pl.lit(error_value))
+        .otherwise(pl.col(f"_conv_{column}"))
+        .alias(column)
+    )
+
+    return df.drop([f"_orig_{column}", f"_conv_{column}"])
+```
+
+### 5. State Manager (src/a4d/state/bigquery_state.py)
+
+```python
+from google.cloud import bigquery
+import polars as pl
+import hashlib
+from pathlib import Path
+
+class BigQueryStateManager:
+    def __init__(self, project_id: str, dataset: str):
+        self.client = bigquery.Client(project=project_id)
+        self.table_id = f"{project_id}.{dataset}.tracker_metadata"
+
+    def get_file_hash(self, file_path: Path) -> str:
+        hasher = hashlib.md5()
+        with open(file_path, 'rb') as f:
+            for chunk in iter(lambda: f.read(8192), b''):
+                hasher.update(chunk)
+        return hasher.hexdigest()
+
+    def get_previous_state(self) -> pl.DataFrame:
+        """Query BigQuery for previous file hashes."""
+        query = f"""
+        SELECT file_name, file_hash, status
+        FROM `{self.table_id}`
+        WHERE last_processed = (
+            SELECT MAX(last_processed)
+            FROM `{self.table_id}` AS t2
+            WHERE t2.file_name = {self.table_id}.file_name
+        )
+        """
+        df_pandas = self.client.query(query).to_dataframe()
+        return pl.from_pandas(df_pandas) if len(df_pandas) > 0 else pl.DataFrame()
+
+    def get_files_to_process(self, tracker_files: list[Path], force=False) -> list[Path]:
+        """Determine which files need processing (incremental)."""
+        if force:
+            return tracker_files
+
+        previous = self.get_previous_state()
+        if len(previous) == 0:
+            return tracker_files
+
+        prev_lookup = {
+            row["file_name"]: (row["file_hash"], row["status"])
+            for row in previous.iter_rows(named=True)
+        }
+
+        to_process = []
+        for file in tracker_files:
+            current_hash = self.get_file_hash(file)
+
+            if file.name not in prev_lookup:
+                to_process.append(file)  # New
+            else:
+                prev_hash, status = prev_lookup[file.name]
+                if current_hash != prev_hash or status == "failed":
+                    to_process.append(file)  # Changed or failed
+
+        return to_process
+```
+
+---
+
+## Reference Data (Reusable)
+
+All YAML files in `reference_data/` can be used as-is:
+- ✅ `synonyms/synonyms_patient.yaml`
+- ✅ `synonyms/synonyms_product.yaml`
+- ✅ `data_cleaning.yaml`
+- ✅ `provinces/allowed_provinces.yaml`
+
+No migration needed - just reference from Python code.
+
+---
+
+## Success Criteria
+
+### Correctness
+- [ ] All final tables match R output (or differences documented)
+- [ ] Error counts match R
+- [ ] Same patient_ids flagged
+
+### Performance
+- [ ] 2-5x faster than R
+- [ ] Incremental runs only process changed files
+- [ ] Memory usage <8GB
+
+### Code Quality
+- [ ] Test coverage >80%
+- [ ] ruff linting passes
+- [ ] ty type checking passes
+
+### Deployment
+- [ ] Runs in Cloud Run
+- [ ] Incremental processing works
+- [ ] Monitoring set up
+
+---
+
+## Notes for Implementation
+
+1. **Start with infrastructure** - Don't jump to extraction yet
+2. **Test continuously** - Write tests alongside code
+3. **Compare with R** - After each phase, validate outputs match
+4. **Use existing R code as reference** - Read the R scripts to understand logic
+5. **Ask questions** - Migration docs are guides, not absolute rules
+6. **Document differences** - If output differs from R, document why
+
+---
+
+## Recent Progress (2025-10-26)
+
+### ✅ Completed: Phase 3 - Patient Data Cleaning
+
+**Modules Implemented**:
+- `src/a4d/clean/patient.py` (461 lines) - Main cleaning pipeline
+- `src/a4d/clean/schema.py` (200 lines) - Meta schema (83 columns, exact R match)
+- `src/a4d/clean/validators.py` (250 lines) - Case-insensitive validation
+- `src/a4d/clean/converters.py` (150 lines) - Safe type conversions
+- `src/a4d/clean/transformers.py` (100 lines) - Data transformations
+
+**Key Features**:
+1. **Meta Schema Approach**: Define all 83 target database columns upfront, fill what exists, leave rest as NULL
+2. **Case-Insensitive Validation**: Implements R's `sanitize_str()` pattern (lowercase, remove spaces/special chars), returns canonical values
+3. **Error Tracking**: ErrorCollector class for detailed conversion failure logging
+4. **Type Conversions**: String → Date/Int32/Float64 with error values (999999, "Undefined", 9999-09-09)
+5. **Range Validation**: Height (0-2.3m), Weight (0-200kg), BMI (4-60), Age (0-25), HbA1c (4-18%), FBG (0-136.5 mmol/l)
+6. **Unit Conversions**: FBG mmol/l ↔ mg/dl (18x factor), applied AFTER schema so target columns exist
+7. **Pipeline Order**: Legacy fixes → Preprocessing → Transformations → **Schema** → Type conversion → Range validation → Allowed values → Unit conversion
+
+**Comparison with R Pipeline**:
+- ✅ Schema: 100% match (83 columns, all types correct)
+- ✅ Type alignment: Fixed tracker_year/tracker_month (String → Int32)
+- ✅ Status validation: Case-insensitive with canonical Title Case values
+- ✅ FBG unit conversion: Works perfectly (13.5 mmol × 18 = 243.0 mg)
+- ✅ insulin_type/insulin_subtype: Derivation enabled with Python improvements
+
+**Python Improvements Over R** (see [PYTHON_IMPROVEMENTS.md](PYTHON_IMPROVEMENTS.md)):
+1. **insulin_type bug fix**: R doesn't check analog columns, returns None for analog-only patients. Python correctly derives "Analog Insulin".
+2. **insulin_subtype typo fix**: R has typo "rapic-acting", Python uses correct "rapid-acting"
+3. **Better null handling**: Python correctly preserves None when all insulin columns are None (matches R's NA behavior)
+
+**Remaining Differences** (all Python correct):
+- `insulin_type` (5/53 rows): Python='Analog Insulin', R=None (R bug)
+- `insulin_total_units` (50/53 rows): Python extracts values, R=None (to verify if R should extract)
+- `bmi` (27/53 rows): Float precision ~10^-15 (negligible)
+
+### 🔑 Key Learnings
+1. **Apply schema BEFORE conversions**: Enables unit conversions on columns that don't exist in raw data
+2. **Case-insensitive validation is complex**: Must create {sanitized → canonical} mapping, then replace with canonical values
+3. **R's ifelse handles NA differently**: NA in condition → NA result (not False). Python needs explicit null checks.
+4. **Type conversion optimization**: Skip columns already at correct type (happens when schema adds NULL columns)
+5. **Fix R bugs, don't replicate them**: insulin_type derivation bug, insulin_subtype typo - Python should be correct
+
+### 📝 Next Steps
+1. Document insulin_total_units extraction difference (verify if R should extract this)
+2. Implement `clean/product.py` (similar pattern to patient)
+3. Move to Phase 4: Tables (aggregation into final BigQuery tables)
+
+---
+
+## Questions During Migration
+
+1. How to handle date parsing edge cases?
+2. Exact numeric precision for comparisons?
+3. Memory optimization for large files?
+4. Optimal parallel workers for Cloud Run?
+
+→ These will be answered during implementation
diff --git a/a4d-python/docs/migration/PYTHON_IMPROVEMENTS.md b/a4d-python/docs/migration/PYTHON_IMPROVEMENTS.md
new file mode 100644
index 0000000..09e51f0
--- /dev/null
+++ b/a4d-python/docs/migration/PYTHON_IMPROVEMENTS.md
@@ -0,0 +1,146 @@
+# Python Pipeline Improvements Over R
+
+This document tracks cases where the Python pipeline implementation is **more correct** than the R pipeline, resulting in intentional differences between R and Python outputs.
+
+## 1. insulin_type Derivation Bug Fix
+
+**Status**: ✅ Fixed in Python
+
+**Issue in R**: R's insulin_type derivation logic only checks the human insulin columns to decide between "human insulin" and "analog insulin". When all human insulin columns are None/NA, the condition evaluates to NA, and `ifelse()` returns NA - **even if the analog insulin columns have "Y" values**.
+
+**R Code (Buggy)**:
+```r
+insulin_type = ifelse(
+    human_insulin_pre_mixed == "Y" |
+        human_insulin_short_acting == "Y" |
+        human_insulin_intermediate_acting == "Y",
+    "human insulin",
+    "analog insulin"
+)
+```
+
+**Problem**: For patients with ONLY analog insulin (human columns = None, analog columns = 'Y'):
+- `None == "Y"` evaluates to NA in R
+- `NA | NA | NA` → NA
+- `ifelse(NA, "human insulin", "analog insulin")` → NA
+
+**Python Fix**: Check if ANY insulin column has data first, then derive the type:
+```python
+pl.when(
+    # Only derive if at least one insulin column is not null
+    pl.col("human_insulin_pre_mixed").is_not_null()
+    | pl.col("human_insulin_short_acting").is_not_null()
+    | pl.col("human_insulin_intermediate_acting").is_not_null()
+    | pl.col("analog_insulin_rapid_acting").is_not_null()
+    | pl.col("analog_insulin_long_acting").is_not_null()
+)
+.then(
+    pl.when(
+        (pl.col("human_insulin_pre_mixed") == "Y")
+        | (pl.col("human_insulin_short_acting") == "Y")
+        | (pl.col("human_insulin_intermediate_acting") == "Y")
+    )
+    .then(pl.lit("human insulin"))
+    .otherwise(pl.lit("analog insulin"))
+)
+.otherwise(None)
+```
+
+**Impact**: For 2024 Sibu Hospital tracker, 5 patients correctly get `insulin_type = 'Analog Insulin'` in Python vs `None` in R.
+
+**File**: `src/a4d/clean/patient.py:_derive_insulin_fields()`
+
+## 2. insulin_subtype Typo Fix
+
+**Status**: ✅ Fixed in Python
+
+**Issue in R**: R has a typo - uses "rapic-acting" instead of "rapid-acting" when deriving insulin_subtype.
+
+**R Code (Typo)**:
+```r
+paste(ifelse(analog_insulin_rapid_acting == "Y", "rapic-acting", ""), sep = ",")
+```
+
+**Python Fix**: Uses correct spelling "rapid-acting"
+
+**Impact**: Derived insulin_subtype values use correct medical terminology. However, since comma-separated values get replaced with "Undefined" by validation, the final output for insulin_subtype is still "Undefined" in both R and Python.
+
+**File**: `src/a4d/clean/patient.py:_derive_insulin_fields()`
+
+## 3. insulin_total_units Extraction Bug Fix
+
+**Status**: ✅ Fixed in Python
+
+**Issue in R**: R's header merge logic has a condition that fails for 2024+ trackers, causing it to skip the two-row header merge and lose columns.
+
+**R Code (Buggy)** - `script1_helper_read_patient_data.R:92`:
+```r
+if (header_cols[2] == header_cols_2[2]) {
+    # Only merge if column 2 matches in both rows
+    diff_colnames <- which((header_cols != header_cols_2))
+    header_cols[diff_colnames] <- paste(header_cols_2[diff_colnames], header_cols[diff_colnames])
+}
+```
+
+**Problem for 2024 Sibu Hospital tracker**:
+- Row 75 (header_cols_2), Col 2: `"Patient \nID*"`
+- Row 76 (header_cols), Col 2: `None` (part of merged cell above)
+- Condition `header_cols[2] == header_cols_2[2]` evaluates to `FALSE`
+- **Headers NOT merged**, only row 76 used
+
+**Result**:
+- Col 27 in R: Only gets "per day" (row 76 alone)
+- "per day" doesn't match synonym "TOTAL Insulin Units per day"
+- **Column lost during synonym mapping**
+
+**Python Fix**: Python always merges both header rows without conditions:
+```python
+for h1, h2 in zip(header_1, header_2, strict=True):
+    if h1 and h2:
+        headers.append(f"{h2} {h1}".strip())
+```
+
+**Result**:
+- Col 27 in Python: "TOTAL Insulin Units per day" (row 75 + row 76)
+- Matches synonym perfectly ✅
+
+**Impact**: For 2024 Sibu Hospital tracker, Python correctly extracts insulin_total_units for 50/53 patients. R loses this column entirely due to header merge failure.
+
+**File**: `src/a4d/extract/patient.py:merge_headers()`
+
+## 4. BMI Float Precision
+
+**Status**: ℹ️ Negligible difference
+
+**Observation**: Minor floating point precision differences at the ~10^-15 level.
+
+**Example**:
+- R: `19.735976492259113`
+- Python: `19.73597649225911`
+
+**Cause**: Different floating point arithmetic between R and Python/Polars.
+
+**Impact**: Negligible - differences are below any meaningful precision threshold for BMI measurements.
+
+## Summary
+
+| Issue | R Behavior | Python Behavior | Classification |
+|-------|-----------|-----------------|----------------|
+| insulin_type derivation | Bug - returns None for analog-only patients (doesn't check analog columns) | Correct derivation (checks all insulin columns) | **Python Fix** |
+| insulin_subtype typo | "rapic-acting" (typo) | "rapid-acting" (correct spelling) | **Python Fix** |
+| insulin_total_units extraction | Not extracted (header merge fails for 2024+ trackers) | Correctly extracted (unconditional header merge) | **Python Fix** |
+| BMI precision | 16 decimal places | 14-15 decimal places | **Negligible** |
+
+## Migration Validation Status
+
+✅ **Schema**: 100% match (83 columns, all types correct)
+✅ **Extraction**: Improved (unconditional header merge fixes insulin_total_units)
+✅ **Cleaning**: Improved (fixes insulin_type derivation bug, corrects insulin_subtype typo)
+ℹ️ **Precision**: Acceptable float differences (~10^-15 for BMI)
+
+**All 3 value differences are Python improvements over R bugs.**
+
+The Python pipeline is production-ready with significant improvements over the R pipeline:
+1. **More robust header parsing** - No conditional merge that fails on 2024+ trackers
+2. **Better null handling** - Correctly checks all insulin columns before derivation
+3. **Correct terminology** - Uses proper medical terms ("rapid-acting" not "rapic-acting")
diff --git a/a4d-python/docs/migration/REFERENCE_DATA_MIGRATION.md b/a4d-python/docs/migration/REFERENCE_DATA_MIGRATION.md
new file mode 100644
index 0000000..e884d9c
--- /dev/null
+++ b/a4d-python/docs/migration/REFERENCE_DATA_MIGRATION.md
@@ -0,0 +1,529 @@
+# Reference Data Migration Plan
+
+This document describes how reference data and configuration files are used in the R pipeline and how to migrate them to Python.
+
+## Overview
+
+The R pipeline uses several YAML and Excel files for configuration and reference data:
+
+| File | Purpose | R Usage | Python Migration Strategy |
+|------|---------|---------|---------------------------|
+| `config.yml` | GCP configuration, paths | Loaded via `config::get()` | Pydantic Settings with `.env` |
+| `synonyms_patient.yaml` | Column name mappings (patient) | Script 1 - column renaming | `synonyms/mapper.py` loader |
+| `synonyms_product.yaml` | Column name mappings (product) | Script 1 - column renaming | `synonyms/mapper.py` loader |
+| `allowed_provinces.yaml` | Valid provinces by country | Script 2 - validation | Load into Pandera schema |
+| `data_cleaning.yaml` | Validation rules | Script 2 - cleaning | `clean/rules.py` parser |
+| `clinic_data.xlsx` | Static clinic info | Script 3 - table creation | Later phase (not needed initially) |
+
+## Detailed Analysis
+
+### 1. config.yml
+
+**Current R Implementation:**
+```r
+# R/helper_main.R:15
+config <- config::get()
+paths$tracker_root <- config$data_root
+paths$output_root <- file.path(config$data_root, config$output_dir)
+
+# Access:
+config$data_root
+config$download_bucket
+config$upload_bucket
+config$project_id
+config$dataset
+```
+
+**Structure:**
+```yaml
+default:
+    download_bucket: "a4dphase2_upload"
+    upload_bucket: "a4dphase2_output"
+    data_root: "/Volumes/USB SanDisk 3.2Gen1 Media/a4d/a4dphase2_upload"
+    output_dir: "output"
+    project_id: "a4dphase2"
+    dataset: "tracker"
+
+production:
+    data_root: "/home/rstudio/data"
+```
+
+**Python Migration:**
+- ✅ **DONE** - Already implemented in `a4d/config.py` using Pydantic Settings
+- Uses `.env` file instead of YAML (more standard for Python)
+- Environment variables prefixed with `A4D_`
+- Access: `settings.data_root`, `settings.upload_bucket`, etc.
+
+**Action:** No additional work needed.
+
+---
+
+### 2. synonyms_patient.yaml & synonyms_product.yaml
+
+**Current R Implementation:**
+```r
+# R/helper_main.R:69-78
+get_synonyms <- function() {
+    synonyms_patient <- read_column_synonyms(synonym_file = "synonyms_patient.yaml")
+    synonyms_product <- read_column_synonyms(synonym_file = "synonyms_product.yaml")
+    list(patient = synonyms_patient, product = synonyms_product)
+}
+
+# R/helper_main.R:99-126
+read_column_synonyms <- function(synonym_file, path_prefixes = c("reference_data", "synonyms")) {
+    path <- do.call(file.path, as.list(c(path_prefixes, synonym_file)))
+    synonyms_yaml <- yaml::read_yaml(path)
+
+    # Converts to tibble with columns: unique_name, synonym
+    # e.g., "age" -> ["Age", "Age*", "age on reporting", ...]
+}
+
+# Used in Script 1 to rename columns during extraction
+```
+
+**Structure (example from synonyms_patient.yaml):**
+```yaml
+age:
+  - Age
+  - Age*
+  - age on reporting
+  - Age (Years)
+  - Age* On Reporting
+blood_pressure_dias_mmhg:
+  - Blood Pressure Diastolic (mmHg)
+patient_id:
+  - ID
+  - Patient ID
+  - Patient ID*
+```
+
+**Python Migration Strategy:**
+
+Create `src/a4d/synonyms/mapper.py`:
+```python
+from pathlib import Path
+import yaml
+from typing import Dict, List
+
+class ColumnMapper:
+    """Maps synonym column names to standardized names."""
+
+    def __init__(self, yaml_file: Path):
+        with open(yaml_file) as f:
+            self.synonyms = yaml.safe_load(f)
+
+        # Build reverse lookup: synonym -> standard_name
+        self._lookup = {}
+        for standard_name, synonyms in self.synonyms.items():
+            for synonym in synonyms:
+                self._lookup[synonym] = standard_name
+
+    def rename_columns(self, df: pl.DataFrame) -> pl.DataFrame:
+        """Rename DataFrame columns using synonym mappings."""
+        rename_map = {
+            col: self._lookup.get(col, col)
+            for col in df.columns
+        }
+        return df.rename(rename_map)
+
+    def get_standard_name(self, column: str) -> str:
+        """Get standard name for a column (or return original if not found)."""
+        return self._lookup.get(column, column)
+
+# Usage:
+patient_mapper = ColumnMapper(Path("reference_data/synonyms/synonyms_patient.yaml"))
+product_mapper = ColumnMapper(Path("reference_data/synonyms/synonyms_product.yaml"))
+
+df = patient_mapper.rename_columns(df)
+```
+
+**Files to Create:**
+- `src/a4d/synonyms/__init__.py`
+- `src/a4d/synonyms/mapper.py`
+- `tests/test_synonyms/test_mapper.py`
+
+**Phase:** Phase 1 (Core Infrastructure)
+
+---
+
+### 3. allowed_provinces.yaml
+
+**Current R Implementation:**
+```r
+# R/helper_main.R:149-153
+get_allowed_provinces <- function() {
+    provinces <- yaml::read_yaml("reference_data/provinces/allowed_provinces.yaml") %>%
+        unlist()
+    return(provinces)
+}
+
+# reference_data/build_package_data.R:1-8
+# Provinces are injected into data_cleaning.yaml at build time
+cleaning_config <- yaml::read_yaml("reference_data/data_cleaning.yaml")
+allowed_provinces <- yaml::read_yaml("reference_data/provinces/allowed_provinces.yaml") %>% unlist()
+
+for (i in length(cleaning_config$province$steps)) {
+    if (cleaning_config$province$steps[[i]]$type == "allowed_values") {
+        cleaning_config$province$steps[[i]]$allowed_values <- allowed_provinces
+    }
+}
+```
+
+**Structure:**
+```yaml
+THAILAND:
+  - Amnat Charoen
+  - Ang Thong
+  - Bangkok
+  ...
+LAOS:
+  - Attapeu
+  - Bokeo
+  ...
+VIETNAM:
+  - An Giang
+  - Bà Rịa–Vũng Tàu
+  ...
+```
+
+**Python Migration Strategy:**
+
+Load into Pandera schema or validation rules:
+
+```python
+# src/a4d/schemas/provinces.py
+import yaml
+from pathlib import Path
+from typing import List
+
+def load_allowed_provinces() -> List[str]:
+    """Load all allowed provinces from YAML file."""
+    path = Path("reference_data/provinces/allowed_provinces.yaml")
+    with open(path) as f:
+        provinces_by_country = yaml.safe_load(f)
+
+    # Flatten all provinces into single list
+    all_provinces = []
+    for country, provinces in provinces_by_country.items():
+        all_provinces.extend(provinces)
+
+    return all_provinces
+
+ALLOWED_PROVINCES = load_allowed_provinces()
+
+# Use in Pandera schema:
+import pandera.polars as pa
+
+class PatientSchema(pa.DataFrameModel):
+    province: pl.Utf8 = pa.Field(isin=ALLOWED_PROVINCES, nullable=True)
+```
+
+**Files to Create:**
+- `src/a4d/schemas/provinces.py`
+- Update `src/a4d/schemas/patient.py` to use ALLOWED_PROVINCES
+
+**Phase:** Phase 1 (Core Infrastructure)
+
+---
+
+### 4. data_cleaning.yaml
+
+**Current R Implementation:**
+```r
+# reference_data/build_package_data.R:1-12
+# Embedded into R package as sysdata.rda
+cleaning_config <- yaml::read_yaml("reference_data/data_cleaning.yaml")
+# ... inject provinces ...
+config <- list(cleaning = cleaning_config)
+save(config, file = "R/sysdata.rda")
+
+# R/script2_helper_patient_data_fix.R:293-300
+parse_character_cleaning_config <- function(config) {
+    allowed_value_expr <- list()
+    for (column in names(config)) {
+        allowed_value_expr[[column]] <- parse_character_cleaning_pipeline(column, config[[column]])
+    }
+    allowed_value_expr
+}
+
+# R/script2_process_patient_data.R:303
+# Used in mutate() to apply all validation rules
+mutate(
+    !!!parse_character_cleaning_config(a4d:::config$cleaning)
+)
+```
+
+**Structure:**
+```yaml
+analog_insulin_long_acting:
+  steps:
+    - allowed_values: ["N", "Y"]
+      replace_invalid: true
+      type: allowed_values
+
+insulin_regimen:
+  steps:
+    - function_name: extract_regimen
+      type: basic_function
+    - allowed_values:
+        - "Basal-bolus (MDI)"
+        - "Premixed 30/70 DB"
+        - "Self-mixed BD"
+        - "Modified conventional TID"
+      replace_invalid: false
+      type: allowed_values
+
+province:
+  steps:
+    - allowed_values: [... provinces injected at build time ...]
+      replace_invalid: true
+      type: allowed_values
+```
+
+**Python Migration Strategy:**
+
+Create a validation rules system:
+
+```python
+# src/a4d/clean/rules.py
+import yaml
+from pathlib import Path
+from typing import Dict, List, Any, Callable
+from dataclasses import dataclass
+import polars as pl
+
+@dataclass
+class ValidationStep:
+    """Single validation step from data_cleaning.yaml"""
+    type: str  # "allowed_values", "basic_function", etc.
+    allowed_values: List[str] = None
+    replace_invalid: bool = False
+    function_name: str = None
+    error_value: str = None
+
+@dataclass
+class ColumnValidation:
+    """All validation steps for a single column"""
+    column_name: str
+    steps: List[ValidationStep]
+
+class ValidationRules:
+    """Loads and applies validation rules from data_cleaning.yaml"""
+
+    def __init__(self, yaml_path: Path):
+        with open(yaml_path) as f:
+            self.config = yaml.safe_load(f)
+
+        self.rules = self._parse_rules()
+        self.custom_functions = self._load_custom_functions()
+
+    def _parse_rules(self) -> Dict[str, ColumnValidation]:
+        """Parse YAML into structured validation rules."""
+        rules = {}
+        for column, config in self.config.items():
+            steps = [
+                ValidationStep(
+                    type=step["type"],
+                    allowed_values=step.get("allowed_values"),
+                    replace_invalid=step.get("replace_invalid", False),
+                    function_name=step.get("function_name"),
+                    error_value=step.get("error_value")
+                )
+                for step in config.get("steps", [])
+            ]
+            rules[column] = ColumnValidation(column, steps)
+        return rules
+
+    def _load_custom_functions(self) -> Dict[str, Callable]:
+        """Load custom validation functions (e.g., extract_regimen)."""
+        from a4d.clean import converters
+        return {
+            "extract_regimen": converters.extract_regimen,
+            # Add other custom functions here
+        }
+
+    def apply_to_column(self,
+                       df: pl.DataFrame,
+                       column: str,
+                       error_collector: ErrorCollector) -> pl.DataFrame:
+        """Apply all validation rules to a single column."""
+        if column not in self.rules:
+            return df
+
+        validation = self.rules[column]
+        for step in validation.steps:
+            if step.type == "allowed_values":
+                df = self._apply_allowed_values(
+                    df, column, step, error_collector
+                )
+            elif step.type == "basic_function":
+                func = self.custom_functions[step.function_name]
+                df = func(df, column, error_collector)
+
+        return df
+
+    def _apply_allowed_values(self,
+                             df: pl.DataFrame,
+                             column: str,
+                             step: ValidationStep,
+                             error_collector: ErrorCollector) -> pl.DataFrame:
+        """Validate column values against allowed list."""
+        # Vectorized check
+        is_valid = df[column].is_in(step.allowed_values) | df[column].is_null()
+
+        # Log failures
+        failed_rows = df.filter(~is_valid)
+        for row in failed_rows.iter_rows(named=True):
+            error_collector.add_error(
+                file_name=row["file_name"],
+                patient_id=row.get("patient_id"),
+                column=column,
+                original_value=row[column],
+                error=f"Value not in allowed list: {step.allowed_values}"
+            )
+
+        # Replace if configured
+        if step.replace_invalid:
+            error_value = step.error_value or settings.error_val_character
+            df = df.with_columns(
+                pl.when(~is_valid)
+                  .then(pl.lit(error_value))
+                  .otherwise(pl.col(column))
+                  .alias(column)
+            )
+
+        return df
+
+# Usage in script 2:
+rules = ValidationRules(Path("reference_data/data_cleaning.yaml"))
+for column in df.columns:
+    df = rules.apply_to_column(df, column, error_collector)
+```
+
+**Files to Create:**
+- `src/a4d/clean/rules.py`
+- `src/a4d/clean/converters.py` (custom validation functions like extract_regimen)
+- `tests/test_clean/test_rules.py`
+
+**Note:** Need to inject provinces into the YAML rules at runtime (or load dynamically).
+
+**Phase:** Phase 1 (Core Infrastructure)
+
+---
+
+### 5. clinic_data.xlsx
+
+**Current R Implementation:**
+```r
+# R/script3_create_table_clinic_static_data.R:9
+clinic_data <- readxl::read_excel(
+    path = here::here("reference_data", "clinic_data.xlsx"),
+    sheet = 1,
+    col_types = c("text", "text", ...)
+)
+
+# scripts/R/run_pipeline.R:77
+download_google_sheet("1HOxi0o9fTAoHySjW_M3F-09TRBnUITOzzxGx2HwRMAw", "clinic_data.xlsx")
+```
+
+**Usage:** Creates clinic static data table in Script 3.
+
+**Python Migration Strategy:**
+- **Phase 3** (Table Creation) - not needed for initial phases
+- Use `openpyxl` or `pl.read_excel()` to read
+- Download from Google Sheets using `gspread` or manual download
+- Lower priority - can be done later
+
+**Files to Create (later):**
+- `src/a4d/tables/clinic_static.py`
+
+**Phase:** Phase 3 (Table Creation)
+
+---
+
+## Implementation Order
+
+### Phase 1: Core Infrastructure (NEXT)
+
+1. **Synonyms mapper** (high priority - needed for Script 1):
+   - Create `src/a4d/synonyms/mapper.py`
+   - Load YAML files
+   - Rename Polars DataFrame columns
+   - Tests
+
+2. **Provinces loader** (high priority - needed for Script 2):
+   - Create `src/a4d/schemas/provinces.py`
+   - Load allowed provinces from YAML
+   - Integrate with Pandera schemas
+
+3. **Validation rules** (high priority - needed for Script 2):
+   - Create `src/a4d/clean/rules.py`
+   - Parse data_cleaning.yaml
+   - Apply validation steps
+   - Handle custom functions (extract_regimen, etc.)
+   - Tests
+
+### Phase 2+: Later
+
+- Clinic data handling (Phase 3)
+
+---
+
+## Shared Reference Data
+
+**IMPORTANT:** The reference_data/ folder is shared between R and Python:
+
+```
+a4d/
+├── reference_data/          # SHARED
+│   ├── synonyms/
+│   ├── provinces/
+│   └── data_cleaning.yaml
+├── config.yml               # R only
+├── R/                       # R pipeline
+└── a4d-python/              # Python pipeline
+    ├── .env                 # Python config (replaces config.yml)
+    └── src/
+```
+
+Both pipelines read from the same reference_data/ folder. Do not modify these files without testing both pipelines!
+
+---
+
+## Testing Strategy
+
+For each reference data module, create tests that:
+
+1. **Load test** - Verify YAML/Excel files can be loaded
+2. **Structure test** - Verify expected keys/columns exist
+3. **Integration test** - Test with sample data
+
+Example:
+```python
+# tests/test_synonyms/test_mapper.py
+def test_patient_mapper_loads():
+    mapper = ColumnMapper(Path("reference_data/synonyms/synonyms_patient.yaml"))
+    assert "age" in mapper.synonyms
+    assert "Age" in mapper._lookup
+
+def test_patient_mapper_renames():
+    mapper = ColumnMapper(Path("reference_data/synonyms/synonyms_patient.yaml"))
+    df = pl.DataFrame({"Age": [25], "Patient ID": ["P001"]})
+    df = mapper.rename_columns(df)
+    assert "age" in df.columns
+    assert "patient_id" in df.columns
+```
+
+---
+
+## Summary
+
+| Component | Priority | Complexity | Files to Create |
+|-----------|----------|------------|-----------------|
+| config.yml → Settings | ✅ Done | Low | Already done |
+| Synonyms mapper | High | Low | mapper.py, tests |
+| Provinces loader | High | Low | provinces.py, tests |
+| Validation rules | High | Medium | rules.py, converters.py, tests |
+| Clinic data | Low | Low | Later (Phase 3) |
+
+**Next Step:** Start implementing synonyms/mapper.py in Phase 1.
diff --git a/a4d-python/justfile b/a4d-python/justfile
new file mode 100644
index 0000000..2919fc9
--- /dev/null
+++ b/a4d-python/justfile
@@ -0,0 +1,114 @@
+# a4d Python Pipeline - Development Commands
+
+# Default recipe (show available commands)
+default:
+    @just --list
+
+# Install dependencies and sync environment
+sync:
+    uv sync --all-extras
+
+# Run unit tests (skip slow/integration)
+test:
+    uv run pytest -m "not slow"
+
+# Run all tests including slow/integration
+test-all:
+    uv run pytest
+
+# Run integration tests only
+test-integration:
+    uv run pytest -m integration
+
+# Run tests without coverage (faster, fail fast)
+test-fast:
+    uv run pytest -m "not slow" --no-cov -x
+
+# Run type checking with ty
+check:
+    uv run ty check src/
+
+# Run ruff linting
+lint:
+    uv run ruff check .
+
+# Format code with ruff
+format:
+    uv run ruff format .
+
+# Auto-fix linting issues
+fix:
+    uv run ruff check --fix .
+
+# Check code formatting without modifying files
+format-check:
+    uv run ruff format --check .
+
+# Run all CI checks (format, lint, type, test)
+ci: format-check lint check test
+
+# Clean cache and build artifacts
+clean:
+    rm -rf .ruff_cache
+    rm -rf .pytest_cache
+    rm -rf htmlcov
+    rm -rf .coverage
+    rm -rf dist
+    rm -rf build
+    rm -rf src/*.egg-info
+    find . -type d -name __pycache__ -exec rm -rf {} +
+    find . -type f -name "*.pyc" -delete
+
+# Run full pipeline (extract + clean + tables)
+run *ARGS:
+    uv run a4d process-patient {{ARGS}}
+
+# Run pipeline with 8 workers (parallel processing)
+run-parallel:
+    uv run a4d process-patient --workers 8
+
+# Extract and clean only (skip table creation)
+run-clean:
+    uv run a4d process-patient --workers 8 --skip-tables
+
+# Force reprocess all files (ignore existing outputs)
+run-force:
+    uv run a4d process-patient --workers 8 --force
+
+# Create tables from existing cleaned parquet files
+create-tables INPUT:
+    uv run a4d create-tables --input {{INPUT}}
+
+# Process a single tracker file
+run-file FILE:
+    uv run a4d process-patient --file {{FILE}}
+
+# Build Docker image
+docker-build:
+    docker build -t a4d-python:latest .
+
+# Run Docker container locally
+docker-run:
+    docker run --rm \
+        --env-file .env \
+        -v $(pwd)/output:/app/output \
+        a4d-python:latest
+
+# Install pre-commit hooks
+hooks:
+    uv run pre-commit install
+
+# Run pre-commit on all files
+hooks-run:
+    uv run pre-commit run --all-files
+
+# Update dependencies
+update:
+    uv lock --upgrade
+
+# Show project info
+info:
+    @echo "Python version:"
+    @uv run python --version
+    @echo "\nInstalled packages:"
+    @uv pip list
diff --git a/a4d-python/profiling/PROFILING_SUMMARY.md b/a4d-python/profiling/PROFILING_SUMMARY.md
new file mode 100644
index 0000000..1e83618
--- /dev/null
+++ b/a4d-python/profiling/PROFILING_SUMMARY.md
@@ -0,0 +1,246 @@
+# Patient Data Extraction - Performance Profiling Summary
+
+**Date**: 2025-10-23
+**Files Tested**: 2024 Sibu Hospital (Jan24), 2019 Penang General Hospital (Feb19)
+
+## Executive Summary
+
+**OPTIMIZED - Single-pass extraction:**
+- **2024 tracker**: 0.877s per sheet (66% faster than two-pass)
+- **2019 tracker**: 0.080s per sheet (96% faster than two-pass)
+
+**Primary bottleneck**: openpyxl workbook loading (95-99% of time)
+**Optimization**: Eliminated second workbook load by implementing forward-fill for horizontally merged cells
+
+## Detailed Breakdown
+
+### Time Distribution by Phase (OPTIMIZED - Single-pass)
+
+| Phase | 2024 Tracker | 2019 Tracker | Average | % of Total |
+|-------|--------------|--------------|---------|------------|
+| 1. Load workbook (read-only) | 0.625s | 0.051s | **0.338s** | **79-85%** |
+| 7. Build Polars DataFrame | 0.086s | 0.000s | 0.043s | 0-12% |
+| 3. Read headers | 0.010s | 0.006s | 0.008s | 1-9% |
+| 2. Find data start row | 0.005s | 0.004s | 0.004s | 1-6% |
+| 5. Read data rows | 0.006s | 0.003s | 0.004s | 1-5% |
+| 4. Merge headers | <0.001s | <0.001s | <0.001s | <1% |
+| 6. Close workbook | <0.001s | <0.001s | <0.001s | <1% |
+| **TOTAL** | **0.732s** | **0.064s** | **0.398s** | **100%** |
+
+**Previous two-pass approach**: 2.583s (2024), 1.973s (2019) - avg 2.278s
+**Current single-pass approach**: 0.732s (2024), 0.064s (2019) - avg 0.398s
+**Improvement**: 72% faster on average (66-96% depending on file)
+
+### Top Library Bottlenecks (from cProfile) - OPTIMIZED
+
+**Current single-pass approach** (read-only mode only):
+
+1. **openpyxl.reader.excel.load_workbook**: 0.6-0.8s (79-85% of time)
+   - `read_worksheets()`: Most of the time
+   - `parse_dimensions()`: XML parsing
+   - No style/formatting overhead (read_only=True)
+
+2. **XML parsing**: 0.4-0.6s
+   - ElementTree parsing Excel's XML format
+   - Required by openpyxl, cannot be optimized further
+
+3. **Polars DataFrame construction**: 0.04-0.09s (0-12%)
+   - String conversion for all cells
+   - Acceptable overhead
+
+## Optimization Assessment
+
+### ✅ Successfully Optimized
+
+1. **Single-pass read-only extraction**
+   - Eliminated second workbook load (structure mode)
+   - Only uses `read_only=True, data_only=True, keep_vba=False, keep_links=False`
+   - **Result**: 66-96% faster than two-pass approach
+
+2. **Forward-fill logic for horizontally merged cells**
+   - Tracks `prev_h2` to propagate header across merged columns
+   - Example: "Updated HbA1c" fills forward to "(dd-mmm-yyyy)" column
+   - **Result**: Correct headers without needing `merged_cells` attribute
+
+3. **Early termination**
+   - Stops at first empty row
+   - Skips rows with None in column A
+
+4. **Efficient iteration**
+   - Uses `iter_rows()` instead of cell-by-cell access
+   - Pre-reads fixed width (100 cols) and trims to actual data
+
+### Key Insight
+
+**Initial assumption was WRONG:**
+- Thought: "Need structure mode for merged cells, can't read vertically merged cells in read-only mode"
+- Reality: **Read-only mode CAN read vertically merged cells** - each cell has the value
+- Real problem: **Horizontally merged cells** need forward-fill logic
+- Solution: Track previous h2 value and fill forward when h2=None but h1 exists
+
+**Why single-pass works:**
+- Vertically merged cells (e.g., "Patient ID" spanning 2 rows): Read-only mode reads both cells directly
+- Horizontally merged cells (e.g., "Updated HbA1c" spanning 2 cols): Fill forward from previous column
+- No need for `merged_cells` attribute at all!
+
+## Recommendations
+
+### For Current Implementation
+
+**Current approach is OPTIMIZED** - single-pass read-only extraction with forward-fill logic.
+
+Remaining bottleneck (79-85% of time) is unavoidable:
+- XML parsing of Excel file structure (required by .xlsx format)
+- File I/O overhead
+- No further optimization possible without changing file format
+
+### For Future Consideration
+
+1. **Caching**: If processing same file multiple times
+   - Cache extracted DataFrames as Parquet
+   - Only re-extract when source file changes
+
+2. **Parallel sheet processing**: When processing all months
+   - Extract each month sheet in parallel
+   - 12 months could process in ~2-3s instead of 24-60s
+
+3. **Progress reporting**: For user experience
+   - Show which sheet is being processed
+   - Estimated time remaining
+
+4. **Streaming**: For very large trackers
+   - Not needed for current data sizes (10-20 patients per sheet)
+   - Consider if patient counts exceed 100+ per sheet
+
+## Performance Comparison: R vs Python
+
+**R Pipeline** (openxlsx + readxl):
+- Unknown exact timing (not profiled)
+- Uses two libraries (complexity)
+
+**Python Pipeline** (openpyxl):
+- 2-5 seconds per sheet
+- Single library, cleaner code
+- Most time spent in unavoidable I/O
+
+**Conclusion**: Both are I/O bound. Python's performance is acceptable and likely comparable to R.
+
+## Test Environment
+
+- **Python**: 3.13.2
+- **openpyxl**: Latest version (from uv)
+- **Polars**: Latest version
+- **OS**: macOS (Darwin 24.6.0)
+- **Hardware**: Not specified (user's machine)
+
+## Profiling Commands
+
+```bash
+# Full profiling
+uv run python scripts/profile_extraction.py
+
+# Detailed phase breakdown
+uv run python scripts/profile_extraction_detailed.py
+
+# View saved profile
+python -m pstats profiling/extraction_2024.prof
+```
+
+## Code Improvements
+
+### Improved Header Detection (2025-10-23)
+
+**Previous approach**: Check if `header_1[1] == header_2[1]` (single column)
+
+**Current approach**: Two-heuristic validation
+```python
+# 1. Year-based: Multi-line headers introduced starting 2019
+is_multiline_year = year >= 2019
+
+# 2. Content-based: Check if ANY pair has both h1 and h2 non-None
+#    (Single-row headers have title/section text in row above, not data)
+has_multiline_content = any(h1 is not None and h2 is not None
+                            for h1, h2 in zip(header_1, header_2))
+
+if is_multiline_year and has_multiline_content:
+    # Multi-line header logic (merge h1 and h2)
+else:
+    # Single-line header logic (use only h1)
+```
+
+**Benefits**:
+- More explicit and maintainable
+- Validates entire header row, not just one column
+- Correctly handles edge cases (e.g., 2018 "Summary of Patient Recruitment" in row above)
+- Year-based guard prevents false positives
+
+**Performance**: No change (both checks are negligible vs. I/O time)
+
+## Code Coverage
+
+- **patient.py**: 94% coverage
+- **All extraction tests**: 10/10 passing
+- **Parameterized tests**: Validate 2018 (Dec), 2019 (Jan/Feb/Mar/Oct), and 2024 (Jan)
+- **Year coverage**: Tests single-line (2018) and multi-line (2019+) header formats
+
+## Successful Optimization - Single-Pass Extraction (2025-10-23)
+
+### Problem
+Original implementation used two-pass approach:
+1. Load workbook in structure mode to detect merged cells (1.95s)
+2. Load workbook in read-only mode for fast data reading (0.29s)
+
+**Total time**: ~2.3s average per sheet
+
+### Solution
+Implemented **single-pass read-only** extraction with **forward-fill logic** for horizontally merged cells:
+
+```python
+# Track previous h2 for horizontal merges
+prev_h2 = None
+for h1, h2 in zip(header_1, header_2, strict=True):
+    if h1 and h2:
+        headers.append(f"{h2} {h1}".strip())
+        prev_h2 = h2
+    elif h2:
+        headers.append(str(h2).strip())
+        prev_h2 = h2
+    elif h1:
+        if prev_h2:
+            # Horizontally merged cell: fill forward
+            headers.append(f"{prev_h2} {h1}".strip())
+        else:
+            headers.append(str(h1).strip())
+    else:
+        headers.append(None)
+        prev_h2 = None
+```
+
+### Key Insight
+- Vertically merged cells (spanning rows): Read-only mode can read these directly - no special handling needed
+- Horizontally merged cells (spanning columns): Excel sets cell value only in first column, subsequent columns are None
+- **Solution**: Fill forward from previous column when h2=None but h1 exists
+
+### Example
+```
+Col 12: h2="Updated HbA1c", h1="%" → "Updated HbA1c %"
+Col 13: h2=None (merged),   h1="(dd-mmm-yyyy)" → "Updated HbA1c (dd-mmm-yyyy)"
+```
+
+### Performance Results
+| Tracker | Before (two-pass) | After (single-pass) | Improvement |
+|---------|-------------------|---------------------|-------------|
+| 2024    | 2.609s            | 0.877s              | **66% faster** |
+| 2019    | 2.122s            | 0.080s              | **96% faster** |
+
+### Data Correctness Validation
+- ✅ All 10 tests pass
+- ✅ Correct column counts: 31 (2024), 25/28/27/27 (2019), 19 (2018)
+- ✅ Proper header names including horizontally merged cells
+- ✅ Patient IDs validated: MY_SU001-004
+
+### Lessons Learned
+1. **Always verify assumptions**: Initial assumption that merged cells can't be read in read-only mode was incorrect
+2. **Question complexity**: The two-pass approach was solving a problem (vertical merges) that didn't exist
+3. **Root cause analysis**: The real challenge was horizontal merges, which required forward-fill logic
+4. **Data-first approach**: Never change test expectations to match wrong output - fix the code instead
diff --git a/a4d-python/profiling/extraction_2019.prof b/a4d-python/profiling/extraction_2019.prof
new file mode 100644
index 0000000000000000000000000000000000000000..28984c3cce6aca67f3012b285c296a5e630f7dfe
GIT binary patch
literal 86857
zcmb?^cYKsZ^Ef33A)$jb>Ai*~Mamsg1wlF}#p9A(mPbMoo=XTI(m@0S6r@P+QdB@t
zRHO<Bg3`;;lp-F|K@ddw&g?#0o_n6V@cur(Ki+j-^32Wb?Ck99?Ck76tF!tmHc8Nv
zhk27qYXeh~_0&WyHpU&BoSf=Q)jcV0?~qilp5#e%YLByK%H+=#r+YoAUiZM{__RcC
z6-OX*rc9ai2x!RdU4veEmL<U{fOo27^_K|u<IX@u{LQ@V$K1fiK({Z&8&@TQ{$hxq
zt+hI<?f`<?uRz;h)E(zZOmwGfsr}&xJOjNxx9%O7JlGo#%w<95qL8^3kG?3^;-~da
zQp+*^PUkiST)-UrmHxoIKSzR=6mO+nxx~&-w$)tfBzOB?p1Aq%O-?|<-wZrOzN5WE
zym4F-D$Cz5ZTjZ4Lkpc`O1h_5^8NfSVA-FOOTrTy=M1F5ulV!1-CB|_)sqzGjqC4?
z8{l>W&uft9{K)e&|D=z{jJfY5dAd#Rd+FmW$g@B5hyeU8(~}BKV$-z5)EZh+>4DzV
z{>kyB>Hmk{i_v`iSDhe9{HYMXCnWhjN-|4aY!!zh_?|DHo_cHAGAHRWt!>x8fB4+V
zMHXlU;`irvQ<-@{Zi&gBc+;3!Pz9wwky2jwV6PsV>;pCO`g|UOdXyd6EDjA>@y^aq
z@}zHY3IOR+spm$i=X1v;4@}V#z3$kdsouEcc&~|c+qd!$`nt_vC*goG&Vgx&oSX9M
zPD@HmjvD|fqK?|~#~T+XPXSC0aI&pXLn4Vc6(|Q$6AHosj`Kz~=uR|rr%FTsXNO)M
zyT*8$#hIJs6mmf=WZ$bp(CtdzLB6VUog~}RO5QFlzLP_68hMIhLtvRQ7Bo&K&=I)s
zN21zksi<wra9?|;dk4=}P+AU%;U11iQ9f^Kyf?v<mY8ai8vk0L30k!fE!v&rP3Ln&
zB{w!xW$&^{Yn+4woSY7l%cP?^nCS4&#P>*tYQ=|?J$H%+EC5WVR8S@u>P&iFXh``Z
z=cBu{+~g$Wx@Xmy&HqvfBARxDN>E_=Ow^{{+`RbF-sw)#p-9U!b874o6Mr5O%g=~u
zKJ1v+ojNqdP6sDA$;C`{FYfGkkYnrRkT0ecisWw<C_bRk3=l>0>|Hy>{Qih)1?}25
zNG+OE^Thg0BgS=(OrCRV%y7?2(YL@h#LLC-01G>5>YfFY51O_d=O-wLcZfwnm`uQg
zzBAtOC~L_dg)-_zuv<l;F%hwRFNo|#(dPgnNwBt1H7t+6fQ{&jp-<B4=oRssN{mXF
z?*)|uKt*qg-#h3}v)?a0{>kvGZ>)3@y}-W0zG@p~FYJHc@;&^%KM%L%Xb|FjPOSmZ
z^5-Au8Q^tm@z5<Tb*MXDivwL$#<|gXfAoPIekb7osQj?VxRjUbHi$_XN<Z{RHerh)
zT5kAFV`=3G0#kIdC+LY@m32~nzp=RM&12UmI|&Db34H~vU}3ZvY`IN9Lkh;wld2^r
znP_rU@f(8X5TNPL7UzLA3l>?rzOqG@FBD|=uxa{+7k?MB4V*`m{LJhatGy>RRmVw(
z%X0{Hq=@rC8-wW4Zfb%#S=rm1Eso}EG;_C;{QO(5o1U6i1X&F^)!U+URB2ki7j*nc
zr?7jlCsB(>FDF%l1uE4uFvXoRG|n`Z>5~qAcy!m#PO`4o(ayOOE>oJwt6m11vcWVh
z-wT?!sOcr~dsSDMS>5I&x!?QZ{zoe_Q-3AQ?_0iy-}mR|YMPSl(}tiGa0cRmlHcJ=
zNz~9#=0j$?Lqop)wm_MU3&GhKUATMGd83|Thlb_Ry@^yaeEqc)(9ytKh@A_^0si8n
z1_l<mJoqbb;ICx4dFSZbV|SgT!QPhHW(|J|me2YlZ{v^T#vh6Irg)QZzL*uE$Jy$a
z;@59=k{*-BY^hTEM`{qe09If<qGpfRz#|<9UW1}MMWRmUZhZrkU~K23Q!f<z#g>2l
zO~BWCL1R)p3oaj=z*wXg#SH1&$yySKj4n?e_;)gQ({~H9mOA1jrC0Yo@K2my>VRtJ
z%Ogo_NTK+IebXNP;3Nf?-`#b3;9<Tj1Tv%A<)ahIaDtQ5^f+8o<m7lcs_Y-Prhe-r
zoLSDJwiK}oxS0oua&f1F<DTNxO$xQ+QAB!F-PKO=ev3-p%um-!X6+T$@;%Z+w>$6|
zcF3@+auSO5nfZQS(%+}w*TN+wyC-f?nx>oANed3|Qvk;aoVB#16c4z?X<AZh-8#@6
zT+-RPzBBdmr;C2O;v`##u4$1p;ZM;W4d<|qevV0ef9`8|?$D}(PEtH&TdyzQJ|$%T
z4N5PUJ1)`V^Jxh~=|oqJ#gy@D;@(I;>m+^0&Z=Hz=|!<PQwKtS2?<#zF1S$#_T9=-
z!Le5`7Q!$H|A~LkWuToyFT0?z_|vT!ES6MBOa%ElW?ImoQ<(zy@CR~Gt7&l&Em%O-
zUy$1i;!X1ES{$<&3*filXQ;`5-5?N`D*f#yNBX**`<!IccXzXV<~mG!i!)Wvi&&8Y
zDIy#a&>j}eol-P2Un6o>Um9#k0=Os8(FG;<M;{yXXZhb?45w@^k~p5)#9>juqy`oQ
z(a;3>3j&Y2CoUBQhktN`CHH_X;7^439TYjLs)pN9=6b3_T6@~Fp&iTq2u7`QgJ~^)
zyDwB*FNMEZ8XEY0ITbA5^WP7&gHQe0-P9*Gd*7?d)V;JPafg$<d9m%u<>Plr8r6_S
z^<Wy7?~w)_^~p#hM-v>vAt}1kX1G>yAD=l_1&}~NXr7b|y{8=L8G<fJ@W?Aag$&?A
z5YX`V#y|suM}PZ$fXR*5(-#i;`FGe|)%oh~$xAQN1x=E!8k)4*jXT?THbvcTWCMSZ
zHrAgNvR;VaRHbYvW5f4$Vv{Gf9sTip<lQuumhbuRYxBXZS%07JI>q)={Jy=DZ24aN
z{s(B7a`yN5q<f~Wcg(vU<s=-y_1ZLv+CX3Yd3;`v9tWY3w4^wTi)ZOv6*doa)KmSn
zU|CoKJjg56x#dVIr(vpm=u?_Z6x)x&+T&V#aOTO2N2N_v7fLySEZ=iN+G6;~Ds(Oa
zRThk~uCQ9`zTl2nz8Am$4g9`8C%Pus3B$>dj9EqtM;9eP7h&BSOvv)RAS4-6Ee-4V
ze!g)$_k4m<zQ^CEmh2>2GP=`Lf1j=W^PFV-qZTJ;=G`W(jJo-e{k440`48X><U3Qt
znN*w=CSb5;pS+j4^TJ%VETEk9SZv~$oTPJO`JU6!>*4qH@q4u&BEX@Q=-wf38g=&Q
zIOsF*`<d+bWj`$6b2$ZYt@3AM5knJ+EpF$VwflVLB-=6t97R9dEJbB+C@kM|61p_t
zY8MjP?<_`+?R1ibH+$u3U*x#>{lHS}f-ATSmhZWUv^=QemZ6S(bZg9^PdCF5+$-~G
zvG1cqz|*vkmLjrzFZf?3_)+<1Q+cD4`1j379@^uK;9s|wkL7#*`+-03_brB6I4C@V
z!wqR*4f>OLsas=gB{7(1vf378E-bwf5^IdYRXg)%g)0+#zBj{3c647~Zf5@Vv@=v+
zTjTd=Nlm|R`5u42Ieyv$n=$yk`uluQC;!$AjNjR55B|Q~`3KMg_eX=((Y>&2r|LsZ
z#4N~2O!!#(5Js##62^wqn7OxL$$hXj9sAFt`Ey?XhY|A*iSs6+lZ0$S5LN7Pae2@N
zn;r9}Jsj!1hi!3^&F7ya?p*s9ZsVe09U{c5<8Mrc@SHya{{c9yi<Ge;xdScUyz~Ap
zC#j$QV0)j*CuMkZF)o%=r&Y1A4HV3Q>1~_z>3HZbsYCXQrR96BL)v&4EPu8Xj}GE9
zNuGsoAmYmXY_3Kj);P=eTyp{~P;Sw<@AV7;H{54l;zY!o1AJu&5%c4p5e{%V8Xhg^
zxqz6dA44zB_@YB)u=FQNRj>GK$=Bs{w)a6T-^1_wi*o-S0@;a)Ug{9|+;|?L)yGMN
zfngqzlP(sYfFhQP${PiO@WeB1Scj6y3&Mwhemq1>l6(+Lf*pMzH~c~04h?DFzFpT(
zx`H+30R99VFlkA|hYE#Dfj=MqB!qDBU)`ymSnwiLx7x;AF|qM3{)U6H0eEsgu*C&p
zxg0=I(`W)39q2SJ_dah5xT`P2Kj{0QAsgB}a#xIoy~cp$GxB^lFF;k3PP(r6O*d$O
z2u4m=_~hWge(laafxUgpvPW~*PyYq?m-O>K_(@;(xm@s=W1y&|@p)h+eCdyj1@)rN
zhdR3^biX~O<elZJ3|Ti`MVts4o`?vPLwX0HA=lb;Jm#Kt%t;bwjoh;2>Uo@vW)Jam
zM9juK#3~MLEa(7j$iG!`9;~;gkc)KlB$d7YPc788VNpqG17p299WS);{@f4%r(v>$
zWPKpS-6O*N0vEdeBQm%j8qjZPI({y2^urJDK=>vys_xRepHPoMH97hQMB9jHs!S|s
z*vH(s<D(mTFEXpu#eHy2#w`1HAT76pE$)r%-EbNV^@sW|gHj68p&pjQ2OD6D9%v6l
z{RMsAL1|t%sB@<#LyUm^6<7)LGuYz-$Ti(tz0|}wrmF;VFKu9wuTtscgwmD7p<Sn;
zErILSc!CLkiG3Sprw=!8a)oA2%r{QL0UVS_dgh6}Yyoz|pWXOz;4BQHnX|frv;JO<
z^iTbNWDHKJxSM5WtT-~3js3O_UkaX?uNc7>P6Z2BUFiUsWF-e<T9MO}uj{`!2?vm+
zoTwLEUV)rw@d~*6!vQ9Qzzw;%JvuIFVSdQWV^Pbt6_2~XgyGQ1U#WIu&!dkMBV2?7
z$c|JotrPN68km67U_A|D7fip5Q*Aikj)gE7#z@2bBrrA%hCgK}+Eao$n+JX{WvE*l
zI53S_Q&pQR))ZM1_)f%+Ky=fHS&)!uE?_$qf-aai0Hi0P${S0)oZpN5g>F@<2+G?c
z-<Q9(c<Ur}N}>(vQ=eiaCFvaqacOmiTM%tXCL&40gOnskjdJ#>Hx#^!%l`~$d4COa
zy3EXKHBs=On~4}MRmobAk!%jS6{lX*W#kqjIWS)I085(o6$c0W&@TI4C#m~lQiNmt
zUD{KLN$sCM%I!{|$8vzIMtLpBL1b?t*@A9naACg<OKv>=2LkBo;PL}OH72NVuir(1
z-Gjz7x)v;}sHwp8+lZ-JZx&sJfc=e{EsG9(cEmEe`kzSg2BRp4$bv_^3+Jie0Z^Nk
zgQ}s&hfbZ;{Yi~loV+)ByOVGLbvLg#O^7oL_f;S#0^=Yuu-ow-IGe-#k}yAJ7P(di
zRm2gmqmQi0SSV(v1Is7W&qO288Ozv$6-2EnQj5?b{l-Mh5=fv1M5tqk0kvQS5vxnP
z2CkNtXrg8b^gI_e3znH0TlnuY)sfSMA4iZ*-Dl^y8h?*ES_M#BLWCsgSyl|2Js1lN
z^HXL9v=^|uIo!G@okprmU1ou72xs!ccypHns0I4JOn>FdYQaK^IaB+iBWtMe40Jwn
z$EE4GHF2{)0cAM{czi+4@pul;$AV@h-5MD6M;JjYNwBPc=O_KPEp`$PU{{shT?ki;
ze=X3g1bZMs2R#5cb+PyO?@IK32Qqp%@O%{c*8<H#F)$3LxT8yZ3;?K;b65L=Gsn+?
z+$9bmMN@RN7K{s9GgMcJe=hKlq>88A#GPh-<FpMkk#tC5!n1Qn;6>Eh0-z}5W|n`O
zygCd{2036MpBJ5?e01vp83e}9B*PjMD2BgM2!AE@n}+TxW#Csh5Yz`fFDfNn_tZYv
z&ibgq9$iaLLw{JWf<nvX28WoQ^LSE$u4-PNbXc5YZ<#-w<nyAR#J5}&Nxgrw^F(7X
z`5;Rq1@pf!)4_VoV)+@1ESo{(3XC007NB1o`;85G?P{mGu}QzeQS|T}FBE@^?LHz!
z0AoC5pY9b0dXlsRIH5N!V{g=Y@a*CXUpvW&XXm;Wy5Mku*aWuT5V4~uc4~hw93rct
zV>?7hanaMScUkKD591yZl{r-uHAPPbj{(k?&?%GlAn&xzi&u^WMgON?(HFlx^9=EW
z&(K4hL0?^Re)8(Yuz`#@wKIRkAMzsCxqPWZ6TQCvUN1e~!i}jvFC6VA4h6r1|HZ_B
zFi5?sH+%WqsT}w#(do(h07&Q@fZiDmM(&0mGNCng2OMudfGnwbC01{{KRF8~ESlB+
z37WA;v?YleU5#a@1x*g1vJ0sNh5|9GlJai}2P_n;;S7mL^(MmF6nF`LqzX=oO$B-%
z_#p*6dk$EpRx%)Rf;f-ZWQv^I;$(~ckWj$^l#F`j*qSOM3@fI=NW5BYUcOj1Cxo&&
zU}5wxDw-yVo`JFP9`yUs1TZ^bv0%WgvL`HK**%Eupbs)}z45rdh50oLD{0UNJqE}F
z7Xwga*pTR*y9<A^`m|F37LmnJS^K<R45P}G!u@uhK{aztaS{#$%d9bqx;WB{2++vq
zO8}ECts2j-wf~e;02V&Wi6L?*qFz5^(9Rz2lTN~cU_SL~DB0?iUN}4pz1G-2M_eML
zoPuQJ;4V#HzVeqPaJXOSVc}cFp3;ORvsT1|p6d;QDO&I>6pN!aWrxU;mXwfeqFJ`%
zFZnjUdB#bu{9L~O&lRp3zOs>$iT2sPmliw=%{q}dN8Jf2yrWWeMmPJi-;K;5+Iy?7
zk9Q<pvJll!MAnW@PMusYp~q1t;XsfEXxp+&G-(pVVF-&|AGL&@G$~hgJl-gDxB0~}
zcb(*M?bJ7$zQVGeq%&AuL<D$(B8v*Rwd5Fg+m6j4YNo^kBJ>?N1+XE3GW%v0-gw?g
zyjM1#-}lZ9G|ahZ2-BUMlt{PCG4LIDhcp<d4a0Q-BbO|Exo+N>*WWq|D^g74ls(7m
z-L*k)g6NP(0`|%WnaOTFIURmNI;Skx1@d>^Yajg}&tRI<WR6H^xTxyIP}fvfX49vi
zU7pzCgp;Ifm^0Juj<#8iy8#Ytbkx-t!ux4Ki<9MtEDDqvM$jMaPD`Oty*M3G-U4M&
z2(JPGQfJ|`qsb?)LYm$13LpQJ$}+@ECbSmfXQN`R4V_1<5U5C6hORI|q@M#qrjCo9
z!5ROlsS94+M0Hjo6`?cC?S^Aox`~$BXF)Vm!$6sSCYTyq`oSw^zz#}HNiNYbysVEv
zG<C(dpdl^A*$Vs$82)S?T?alvoalb&ol%@WoS0iZOZkA4%;<O2GqxAaDhX1Ew^4xT
z?f}W*h=>hIJ=VB*)lD#$pUnTRZ_N(Bp)#7hGrc9^wSvZkSMc<sCjJ><>}r$`cu$e5
zbW&P(&BuTS9Ivr-GTb#o*cZY;s)P8#z;-<rra)wc18AsaI7>f)yq<){M4x{wuuxPM
z`uY<@{s)m&lILDOTD$zamx1}OKA93b@ETKwv{WsT#-s6A&z}!GTE4}nnc0aZ`j($S
z`ng5SEty84R^Sg6f~XlLbz`ho`MZgsx3hMcp63#n@f=MnzFN5#v#1%$z=CB~P1I?<
zJr0~|0r=4sIregmOPe3DTL983hRNCiokJHwP7TXXA$_y*(0E5-7F%-rKn(_Z+;E*n
z*I{30jxsUbAH}E4C^{yl9}8f>Ugq(!Uo$ae`3+=9JsHZ0zYy*7BzTRJAvmZQ1YsfC
zkmGI2R?pX}rHdrL_wTWG>7A%?%mKmNWO`1a(_rLQ_z7@OM#F#fcn~gGe`@56D!Vhg
zNU<%OufBOSCwj>_A?KGQ!QmCU+IkQ8OlNpne^^#&Lq0w+^x>onueeD0Q9Gx^<m-TV
zIg()i;f+V%x-znw9driHadG`9j|8zHUwv~h-#ZC#BwJzmteQ2pAEWyMjPU|dA0Bie
z`eOXt;B_3r{gKysqprVjbXyh|dHmL$N_D2>rmne3$XW?xmYNAipadeK-7u~!!G?m}
zUHSn>NAW$wXbr@hQERC6vHvNmwS4k1Vf6%>rU_Dh+uR#9y1)cke89J}Ni+@YWNaiX
zSSC^dj4RW5?i-ZoNkrvjE3IlOvNsquqEKl#&sp(Jr4<!lFamQdqK;#0Z=EbymYJcs
zrJNPvG+LCJ`O5)^on&Y8#E6vAC;kUHCk-{r+456X9^{hXP<W`+E;9Y{CUDbo?Q#`e
zvg*2-2Ymua%`~8v@6A%~fJ(#^N?CV4dw4nWi_36C#{siKl?uI?flS0y>?tl^Yz^Z-
zA%4ruKx-W4{OF1$Xu2=eos^t}|3l|p{>G$&oxhCA4^G+ZUtRG==e<SEPlguQf(4Y7
zX;EIdm>8Cc=f_TP(+m&nV)?OLfaWE=gY)e8ToRwJ$$w7rcDXIh2DI)%O_0egTJC_}
z<aKxPdJ@}sQ(NF^3Cnnw{`s1FdkZG#z6AmF?;VF+7dq2@yRthCu_ySiS>&cKH9%YC
zo_ph5)DxO;Ay<ZSqBEEeo)pi#W!%84ebI(D00V~&IWu?7fi-Pja|r;47`V@*FT;kO
z>Zr?!#d?E5%!5G!JjTZW1=_W*a4@qm4nPUyVq}XQY!we8HY6rMB4mH`^R$m^0=L+Z
zChP9L*0*MBmjHlzc07r~Sx$pBaGphl4c7lR?7(;&uoEATSlhJW14yMX0Aw1jf5L4}
zxXK8^LG(TN`DpkYIF|dx1A|+h38aGK!vQ-~x@}-lIV}OAg|s2LzSx`nv)f?DIRL22
zI>+`ZJAo?jdI*V6Kwf`uyZS3ny?agp0G279gQ-kB*dZlr2>~LX!Q+w%2w=_yUY2#o
zr@@U7xCIonXRsThT)4+!<BP+)12}+v6D)h+<a*$|P{{&#XHn#)hz<Y3l`#VVK4fI*
zIATJ043a)DL`CCV7*CV?F1C;S9wG@e8}EBuH`S@7m%~2fPs03zMA)>!jWU?D5P1h7
zQnj6iLS&r~uKi;86{ghvQFt0OCbhI2at0F}4nL~D3k{&jDg0L1wkNYZ0`tg$AhbXw
z<TcveDk;8;Hx3W`0bTA7MdA?$3?>6b(0UX$U$(Wsz-l*GA$Bl<O4#+8D4kE+cR#eH
z2n5tP0DME%u&(+hx(j*FK`&@C=SDjN|3VwGy7{zTZ@!<+B>=NUl|~3|B}2^A-Uum@
zU@>?|#^V6)F0!N2p}M_}N|O(l26ki*`@dAkSu)9zBZ^-zb5vTG#gycf4B6r1K{&u|
zVjvZTk{uGlyqFD^fn{SF_Yt7zGoUejZhO_v&Wy9k8iHjx{dpdSnvlWhqg7;gcT{#Q
z-<#!C+_JJ$MZoLVG)1K@{wOx$wyXe9R$u~IAW}~R2s$3-doy7<P%z%C*Lc(bkX(p+
z<FDhbRnqbFmh&CIf*S@L5CetR+x5bXxReqzk`wr4><PifMZ*}L-iQsBTmx3VK5X0d
zyWsC}0JJk`7pcFA1bZ<|>9BOY`QX{;<$Iij15~eB#)f_k`|(GxfVSp1G_z7AC_umg
zZo1S2Nohnf>XJSkso;fa(=ZHnuUUDq5FC4O02niEF+xNXRu}2m_3L|J@;G1~zDi=A
z$-CqBqo`Pu<2M}BBD!UF5f0$&x3x$5$5g=KaLxQkbrSPFSe-21$#lNEolbpfx~P;w
zA(m!Bl<LH+ukyW_co`v#0p6iT@>dw@7L$NtFpmlDWBfVk*&EGCi%<Apj7nL-52Sn!
z48@R~s-mU^2doSgMXjgtOVzkMTzhF^fwy6raR54^x-j&N!k-hb-x2Wg!Fe>Fsc|$F
z-z*3<+!Z_?N_4_J9&%Y?p;CLr)IB)X*oZ0^0zd&|d~7ZvE*!8OM|~aDWsCYL>|5~E
zZc7uu#08n990=8I7Ud1mZ7D{PqQe2~w)xV!-ZFSD@NWqR%uL9+fEi{XSdgkG@{%}!
zEU39-A+n43=c1;7nTt|l26*C)tr6HM;6^Sk^>OsKz|fFPhXy;fgK(zB0puarrPe3H
zr~3PBDCLk?<}#p~k9O&T0a*oxBMW)dMy@T)Xgu{~N1rbqU$-p(O$hvQz}%k(mSx(w
zXo!iX7|t|$R@#$Vy4H}|wdyC-u2rjELpZV2<^c`bkmV0LUfbTXtV;mUPv$y|Mp=vr
z9%+l!gU|EemlKuG-$xi568n3u9Si#va0viDZ;pSZr-znb=PsA<y-;$d?FSPNL)37~
zL>rRYCAId>%=ugbFpEk~e%+gr=!rA7`H;+K8vg6Z**5r5vTMQMZ96Le4L+#>;P8jo
zzR{f<+rI7F+5F`KKfzX$1At}Pzo_f6oOAz!Bd^3mo{pOF#nWHmiU0@9eU_7s-q&KY
zE~v*^b~qcM4e74+u9L7ow@U!D$1(+6Ka9dT0*z_MckNQqclMu!Xb1;TP7*7S0to&B
z5U9t}3h~~=RF9F&X!@1B6*`S_ybt?E4#2O-6v{wm7!ue?u^R_?N!hgUiJL|oFv~%D
z0hlpwD~7;n?AtyZ_^C~@U8}X_A$S1>fb$^>{@IO9KWKos2Vrc8xHiuL6X*J0_~Ao_
zB*&W>2)LHV0YEYZGW2o43(!FYXPWiq>FrhLtO3p90HPRsBz+EkHkYADDmGKqtc<vs
z)~7xP8WTV)_9c$>MH)MCHHrhFq>t63Y^AU4sXxE@Z0KSQu9tHFl~A2PfjD3n45tqg
zfl@I5Ag*nyTXT*re#Xp`oEeG9>0UGekeDAdGnAFt;$$OJBC4T(fnr%7Jj52HP%P*n
z<q{~3zkC=vOg<>~@9^U7Av25vsFn1(Nmu-)8>8MGVQk0<|G|PI$HK)d4)D+W;3t;b
zDK?s-r{R}_u}Oyp;wzB|A3<&`SuT8vjKfdH)6bRtz0GpSc>fVU-_JgmtG~E|$^o<F
zq#p}`VqG)#^TDIH4u2XO@@s!*anC9c9S1THUDSep2gWXhV-yaA7o8>az-6JD3mM=N
z7wtG;?p#ITqUf094Jw{&Z?O~$B<?<P06U2L7J5le-^}D2Y!*z8rZrX}=Qq<0b1;qC
z!*VF%=-^+s=slN*z4fq&&nyo)Q^Sn4+;FozB1pyO0M6795iw;U<zEZ5P)wv@m6eRl
zg=H~ECb+2%=pZnE5hIjEgV06=7<voNw60lx$jp}16{uJQ7Xq*%qAhRQc1SU$4f(0?
zj4`u6Z{!jH>IxlAnx}x*;li_kmQS1mCV?@~lc50|IS3-LkpqBZ+0PS1-Ac)6S%CrC
zkSnh&%kg?2h?#Q$QG-ensp*t~g76Fa1++<nHorI^@Y;7y0RXCcXA!rl{v6DMps70A
z8FYQHAp<@v_TS#i;5>2wghGw$0sQ%&D3^gc2>*tpZhx9I?!ROR2ywu!gBU>N0gEBP
zriKk6{#hGKcdzRbfF0_aNGSpEL9A$RnbBo2yVd;C)#{+5A9;=i=RTozAwccy73@Zp
zJ43h4T?2-Z16&sZSba;!Gr^2>!6GFpASR`)%~CVRmWQ9`fLVK`M-B(#zBo;@Rb3t9
z`LrR`q8|@m(s-^@0648w*MOc4aCasQUKl<S!Ew!q4|ci^w=y~KoP6-l1)iA?xva6f
zKK5+LBl@*_MmB8sJ|wtt0NJq26}rpn$wu-GR4Z)AfZcm%?tL4w6F2~<+(7BLhWqpC
zo+JVVH<Qzn;vtWmMrh<B#y0s-TZseau1LdVTw5CG39(AcMgNJvO#jw@LaDqjTOCb$
zQ2RDL+kK8LzXdN8D{%jcURrg#?IkN&5jou)K*{EWBsVxMg9>(dCXp9qgjc$ZpM-f5
z2H(VzJ_&FkFRTdsM}L6xaO2-+qrblh0nqo~dG%=FrWNRUa_&}%kgJ}Q+6^*Gkm43t
zzx_GzvNkngKv3?npPab6sPPwnI?1K=omw3`UK-Dm?E^M)R@5DPvD~funOtOH)r)oW
zFUgEqCd#RJm}0YVNKI=~VPPIMX{q1ZLP;aXz;5*Lip-;zmG5jh7B|JBr8{E5GjXC1
z01*Kl8II>Q|HyCp!gYg7-JzOdjt^c$+5U=hR^yVqvL{)zqd@ISGiXkZN$d3+NJ~AA
zyq~-K;Q_ZG-pv7!YzTKEfS!>41P7GWe1HVbuXipuxNYcfW=pLPVm*=`R;SHJK5Vuc
zJWf{J<f2WF)X<+4-G`G}yt$}3uoo4Xd&Bmf7wCZorgGw58?=UA3-{-whc|7zc5GO`
z7G`Nmd`qO&B>E@iEb%3gt&Sy_F^vghNk^e4v>^-XADr{^?s6^x(3!(45z(tC^aw2n
z)}Kto$S(u|!l0Yk36sDS*Pq_Mm1nbcuk4+D;62#?aKK`u55OqsKd}K1gJ)(TO#Xhn
zHW-SNfII?p&lCYmC|TjU?mf`-G9)G$0CFKzPTjOiWw6<b4U1OCv@7VDKZ=eiy&(fT
zvs6^QY)G-;^edl!^z|jD0L=V{N!h{D*5(OauF2$kACL=95_mas@{;5EaYECLLICS<
z>p6nwm*smi?Xsb@2@d<vw4ySVgxe#uA#JY~ZANbOb_oE5XTHs=-@=YpWsFDzY_ns@
z&}sd+|LNSb>%vsx01#7`pFk2&feY4f4+v^dL;fFL#WY`@-~k{J5`v$w_`PFLbYrR7
zDTytus(s(HN<qkK<N%=Nq$eX#4w25}@<={P{1X<kmaZY+C>y07=b;@4rX0ZYM$D_B
zSH$rWva|zi&o-DJj1ES8nNu0?Af|(!ngCin_5d3~CRM61Vi4pPa{$n?V<ih*umXq#
z_oeaR9<zA9MJFE{lBMmZBi^kBcjGyLoei0cc?S{~G;BzY`m6Vrc-GV<0OV36W9nYy
z%kY|G5ynP1TLJ(iOB8=J@(QjboCcsC((H1%pIH}Q=Tf-~kORa4{E6Uv34%Y74Q?q6
zqP<-V`)>^!;yciN%AJw<T>=2?sMus3N~us+f`$o<jSxouHG1i3^T*l`@x8A@Jstx9
zEOQ(@fSKw3NF@vBW3<EAklC#lZi*aS+9d#6j!{OI9azk(?Z3RKKZc7B1^}qMNPy|c
zT3Rfdm_3Upv;z)#Q8^F7*br8V8tO=Kz>Ya}_tX#jg$=26=<t+m$@N_VutQaMPc$@#
z4XGF({nC{-a3zWZ&uyF_4~-kAZE)dJ!-f=i(Cz%WJua63xNX!Sg}|nmxn(O4oCj4c
z31HO{{Wze*B$L`FycP~1rr9~v|H7es2n}FLw{YXjmm_m^hwK9m0H%5l8(4y9##JY2
z4D1#lWtyQQM(ZFL^LjCa1vPBQ!!hH$yZ$KU5&+Q4C`u~s4RHW*pgdI~=2z?KNXr3H
zu%N;~Huj2XTqzWOX(mG1BYqGoN<yI^)LhG|D2S>IO*)$F3eh20|L9$!Lv~h`=1K8w
z{+Ibd6xfh+MYC1O{1g<G13=MYGE_yC`?>|4+xA%d2`oe$Fe_@96&w>LaS6Q!J=ey;
z@=U6g`tZbmSL?V)pOURc#?|OYU2+Q_>XMWRM>7s%B5l`J|0H2RZ5P>5YQyc)Pu;kw
zFk2vctA(#+<3NNOHl(<-%~xYrKZ2sI24L!d{sM~Gp;gb3ITLNjxP1RabefU~`5(?f
zQ&*i#q;3YR6Pa|H+FmkvG+DM@0)Mq30fvQzA#hX1ileES_%A&BXLyytkX*(A{`nsK
zd@uX;eF$SCZe9xjx*ar8_2R&tb)ud<a{t-XpWzlV2LMyK7ep^%>qS69FiCf!!eK-H
z8u|ICZ(h6YBsH_uxpZ_^78J9J)e*nMYB7M-8DVV5hO-U&j7@_LJO>a9Bc!al7G3&u
zJSl;NcR^7Y8Ei=HE=!74uK-%f0l+eCoRoxj)dZECdLjD3QLxw?06dc+Sq74WgkLBx
zM$5{9sWu9{+XRE9hY*F`DG9QKu9Zg=Y{bE@0D_2VH2}>Y6(WE1^yTkLtlI^NO&kDh
z%W^*o36G}IQJf$fy)yMutA~W6<N9N)6>n&pGgsLv_!ZO!r|%7Xh1P;QLptV-gYN~&
z$#Aa*>t@}q0E2=Jsnt)r{A@QwWI2HS<+Z2K2x5%D5R(=S(xMG1o2}3IhzD?^g#*~p
zV5dZ#*)of|Vufl|?s~!5<bcZQ3>*kHDB5YXXV{SKqiYYE-K3^V0DvMLM0PT2AZ0=8
zgAJMS<+68Q905^P4ggZn$`vR9Yo0%vW(0c&vm|+~G0c0~kl&X^|K~c?z$F0q1!jY2
zcnaOjFHky$>6UtDi503{oT&(uK-gQuh7_%SXr^y-8<zk8#k5G+AC}rJMQFSN+du^D
z4H?+HVdgLVf8%in8)tyU;C1}O2Tewwn>f?jaqXh7<bZZ9f`6b58U6m<C;OK`n1=(w
zy_$|Bjr>5#VTKve_BWPAxke5IQ&a0#$k7t(Gb_fq1E-F-_8Fij1;z+V4sGOawq@+r
zk0r}WJcPnZZ0tl@CL3tVe3TY9+x;U`KR5<S(;NW25LZv6aTlSgQ!murb$09>Bqosp
z`4!!jlz6=?qj3E-M6%3m)ju8!n<EVy(x`lwis^@2xCCH_YVUT$+#9rW)k<&{Ibd3~
z!#_R+W!q`-Jq#c8z&>F^eu=u3W$a)`pyB`ve%NHcN=@Kp2h{olQedWwTvA}er+MEi
zIt#L-IACI3?*q($!%+})hc=|yp85Ui5J*X?G^|3ye5csUU|nz?bj79{n}6LA#>Tk6
z4Yg6(MeZ#yAk5+DgP(*rOE({{qD5f!87vvm;+--MppJ+-Pa2jm(jC|Z_3nV({LI*E
zV2%kSS8xDGiD;A`37utx<TSG*^qlLd-3(RM4C-<jYeoZH*03S2T%IR&cV~4805$me
zuIkL|RpaV61$RJ669Yh0449}_ljh?<7{)}ZosB^@S=hi+K!dyf@+L?9mrN$w)^|{L
z7=a7mQX6$M^qkO9+K{G0&fHpr7Z*7IEURlypc{;YalgI}5R~`pTiyC;=1ZL+WXu7;
zG@CIs1}=O0>!Pa@=Pd{2<N)BA_gi`?V9(S!OO)6M1M2fpWfm}%sf&WehJ3yE(9Hdt
zAuXB%@HzZsCVe0_7)CSwI?q5?Q_)o!=xvb-E^!d(Ou(OLgo-jNbK7J8ow?`~K#=Hk
z`#U?^zHpv9UmRjN90*3UU)UBs`gVb5I)sxs5R5h*nf#E6Le8Fy^oqK2P)48KJZy!}
zSb%I~G`iCE7jC`O3C^@R0Axd$Lm4pet!r@3e+25@Z~%}(oLMMtw|IkZYp?Wev0v{E
zI<uI7!{%ToIOsBvuH#PLD*XHJkg)el+SKh^AJb%cI?Qy6Envee6;GrL@pmkOCD;&<
z^_QVB>A5Iv&4FMvMLU$~!QQ2U{SgNM%{)C?;(!?y6XbxEt(N%1yw_nBJbAEJ)T{s8
zHcKJwa~T?3ymu%pbPAk`ZvG263>?7a&!pJ)J?5VaJo9RnhC1e;7rEGNu4VJGKe)OM
zCc=*MnZM1km{pYs3X@;QY2#u;A}1;@d}kO;e4R)MlVj{fAHp<RDp#FXH~(5C3ho`V
zkn>r@iRMMQaJPctOn(HXw81#a<3>@uj-7%ZN4y{=Ya^3QgPCMccYO(WH!m)%l6dn#
z(1?@{eW;-0*)@&{9*nTlksV#~)b8E*2FS_)=$Hf_uILV?g<<eaWAY@-$%YY8#<0xi
z*<q2xhIIO~-IOasYr!$u+2V8V<b2saERzS>&dXSl8X9&-{X2?~t*HTwv*@h>o&0jM
zZP&IrVKNMQ<-4mzGSLu2P$Z`a(ke=6Y15ETY{-Pyi?%)ZFYNl9yF0ARKD9oLO~^9f
z`Yt4~n~m5JR2OVW<MlIYt{4aBz#QPqh5c1He$Po<crwXWuZbF{K7+#R`x@za^ce-q
zI&aF$m%<azPq7`x=Tv)@W!ki8NVKFPQ#ZbH7@h-S_WW>=4$5-M;?f%K^zmLY)Zp{Q
z(EHy*QhRtzx#nuZK=*;K)Lpv}Y^edDT4sFFgnup2Op>!Xy~Tt37~@$kdVGbm!-Io}
zjS-Ju$^-LDsY!?Zc_w`Y41)DKosDluqp%vj_Q=gmdBn#?xB~*<dhscKvKktbUtrk^
zJXi0GyO}n<>ofe+)b^QII0*+p$Si35KlV<(GO32GY>wdAuiN*|;u)BGXSFDF?CATu
zaPkXpH{;Mr4dpfUL~%XQxg0pNAr@>FuH}0(dFwGZB@apbMgoAD`m%~ohR@6gkxveA
z>Y99%MvZ^)&&2m;>Xj@uol=KPZ+M0wStNX$d9bJp@&J7g6-BmuZ|1=oW*-PsxxXhd
z2A@6-s?*MP_Yh>^KnAq=XX5*eX#0lxV(=i9mNLhF%SD{OCLx}c0NT%CJ1l5s7OWS5
zkp*~^4_*dG`qJ7Tt(<$)?hD`$Z~*Dc{j0tkO~((=z~l~tWhP%kW<jgBb;LrA=`E1O
z70ZirDDo&#tFHU)`)i$q1IQ0}*fJ?5Fb%ZApTm<5Z->DBD=gY3#mTV*x|y*TEUF1V
zfC7=8&i6HHU20kfq7fXhFrfFrIoTH)6KRnL#Q|U(PF{6-n%)&Pxhk8+(y1=CzHN`E
zzrnVI17>cmwd$enY^;`qSvyLfc_hp@^4Q7Jk5rL`;Mjs_CNInRqx4zUofroWgc!!a
z;o<|%m4Ree4m__E`S$`b6i<c@!Nm{GN(=`=@Fc>N9C%)y`1j)c(ae+dACM>d`t1KE
ztoh?R9$vQtc6=OoUdH(M0@2J^?F^=&t-Pdmvef=%ysX1As#jd2^?o=BEE;XWF>};d
za1;kM7>rE(Ap;X*@FgX0jCw3?!0K3PQ9zS6WX_0B$FKH+Ys&!?nR<e@11H>0HsRzY
ztZFgCeov?kr!E{oEPIbwYYIk>HYC^m90xlVtp=4~48Yu}mqn+9|M>h}%GnaAU_%<U
zeEnXX)m<R?YXI0K<>0<B3jAYciM{Y2nlM9>^Q<XXw+E#1a=?TXK+nxU3fw_B1%8Dz
z{eJ)Q-E-k`BnJQ~G67s(n$hBwIEss6@p#Ol3w#e)euz`xn?iW44URGHH;2AqL#8%Q
z{HRz%=o<$@Ns!&=g-QL~611=g5k$r-s|YFjr4LdBC|xi9tw1uf)<_Jlyyo@%ywO++
zHl)cvPqs$se>nw!qifGw7$h@qP7`mqUtxCVx%tyN7lIMOhD=$N&y{o*D&=v2PAFw+
zpfjfXpn-u6gJ$NiiQrJJXZ76t={ryru_59$Wey;JmSYw5Y$ObBC?*rUUgL(NJ&SL2
zXx|AH+`JK#SJh7Wl8;0u&j3f#0FcSxBU1++nMNQfa35r>aOkY>|Gx6(bQj@(4Qg#f
z%?exqrUylX4Y_`O>Yn<m`?~~S?p{+d2DHj>I2Ez)UvZ>_jqvvcVADS>4>DN@9)C>+
zOMu1Zb#H2#o&@!E;fV}&8^Q0J5)N2<tdByi8%?!N=`qhd6Ders9yb>~#*9FAF8#lE
zTP9+?_2&}p$H&K^P?Q1Kb^9@x6uusYK{az)OK=*`%1Sae-HATPQ%#8J1P#1uYF0OC
zx@xp2{^zCoaOZ*p@0fqx8eGGQobXyv411;<+{geFk;|k{1_6`qU+<s!`U-eNfCJb|
zQ^2zx4n}=87?KNSKo@hXi^aOkX!eo(k)Mrk*y}&IUc`Z5H2X+?pIQFbI?RMVb08Sa
zK9Zlo<sIvO37$vmAEWu87&u5t>kaEIZO9kDr~N!*D&$vk0Hvfl9yE2;NZkp8W*(`K
z^piZeUsLE0IrTx7Mje4Z2cC~U|5~7BM1L4Q4h03J>()Un!5c{WN2n#&I`!}7JoyyL
z1sFiEmS|X$T5kgagUK!ryf%M!e(j9+;rcrVg2$~YVDR}PbNKo_-7)*y{1E%(KrouU
za?Q@&u1AL|u&d>Oxx3{p+d$e~<z0{1x1rn0rIjmR+`Y7`$FEQW-T;ETtrtZ8@w6AZ
zE&1o43p_I;b>#dPZ;CJzKpASO{-fM2OQ}Yk+<L6e6i7befQ2pl^A-NNz%#QY_wNab
zX+GmpYB-K$WZ>+kj-9&4!+>!hEJtDR%p6%K2zylsc3V)WRNW1C&$WEQ%t4@_8~_Gb
zAc-DO)B#O~5t0!D{+amROxSv9g%Ji<KSiU*6Y{5c0UuGx2m2lcmOKt#oWa8ttW2Wk
zWI7TC&CG%Ip>@UqeG<t{OM~Fj3dQ765YjG-6FUwdHz6WBVX(~1RJ6<-l^LvtgVjBd
z5xmsPZua)SS0}c_ez<PS0c6B-(~-Jvz1Zl4!8Ng?XGK{$0zNcPOVK>N`roNry|Z3{
z7kIj5%|0XHDUE^u|H};tSqZ^DcU7E?7d-I!{X2#4!_vqyPkuy(_Xn#Y_k$FNh-q$X
z{JahOTn?4Zj?8kOH$c;1mZ50M3@>!+<b^X%0R)>;HMvVt5nbl%JfBXn$W$C-N(K!Y
zH=eMiYXA}yIA9vECzUPw10i9syS^CA%Y=KT##uUQ5GGyHhP-_6yYr{+fc517YLL7k
zxgD7BXJd!(Ft@|tnVFIC5hyR0=uI%TPjI)NKeZbZkB^9gMHa?a$!=_Xqve7&b(**c
z2au~EZ(pwhqSvcJ1KTE<7|AgNs+qB3Rw==Q8TitTd5W)3AC`4t%bYI40p!5sve}O*
z|6Jgi$y<ZxZi74>EHe+cdw*77_GQ@EasYT>T3a2vUW0aBF-!b2@x7UL)h7J9Vd-94
z3ZzuD1_wBXZYFpcta=UV)PBiZ3)zqhZG(27U2c#K!nPc+h@v5?lW|)j44#P{-AN4$
zy%x&uhPIF2)@c9eYfkb;`9@QI{Ey~Mm_#1HH?nxDklZ@eo7C{)sCOZ8Wn!rx3jcYB
zW(CU272{BYbJ8?gBMTh#Sk6IF?sH7V^~?TDq6wDf$58ZFuy@UoTQ$#29GD)N@!coS
zGUFA9aAPyG(F?T)tcQ8V0h2Ib^70pPkyB%<0-Dhr>x#DRs7@1hvk$NLk;WhPTQhev
zm}CxEMn?7F=#4;oJTo(L>!fUJQBRwvB_w!tFVyVC=dMjmNr~>R*s@2{O>j4a1Hnvb
z_%@H;gb6eZo|!2b3dX0I@Pe%(rO<pyb^LAR@`^)R{p2JZ2<A(-_mlbO0?*7>%}^s3
zlBWPJ#X7z3_v5Vfk7MgYjd2cGc(UIZS`I0LjZ<CJ+2TyZFCmN#Ih(WdOMmZv(ItTJ
zI@{s5!7IL74td`k2&STHmmElzstgwmI1r3xzmGgI^}(}Rec_e>2SUji$Nzc8KF}BC
z{5@Dn(k*Mtha(<C4K)rtr<^Sr7{Ohsjk2x7<SgAzUb;-JVP;x8?1zUHY<L2X+0cp)
zPr`2ZrMxW%mcdM_@|Nzz&ElD!yqXJ+ra2Hw-uUd?^T?a3G}G&jok$yhWyn?KfJNT+
zf)lw=90=};z2G|cU9k1<rcfJ)1Hovj1f<|HIDC>bJ6(tB5>f=+AROGbV^19euVyPK
zRp5nk?gK7d%s7A&$m{k&o(a6L4Z)8AblZY8NBj=@`=+fE#}eqF21nUNqJ@4Q)++q?
zczBBgtKb0^0|?EUzKi)7vR@oWAe$MJ>lj3N;*9MroYQuKd!lea4l<PPUXff7`N4+F
zDE9t0i96cEbr=Icj&gEug$gPaC)zVQ(Uh_Xuhzc4q*JxFF2Vu8%P^6;=ldu2etNiw
zi*NvtM6UNZv>BFS7c~dx`LO6iC?moFKrvMwIEZLZnH`V{#w}S0lU7A69X>d*%RpMP
z8s&(Ce|{cy2CO&-ER*YJ<mMM>z%w2TOwoqi$TNG!_#1HDngh@Yr5q)@dAEy+SYn;;
z8#}2bp6hV{urf-EW+A~%ybjQ&psX-i1P881uxS-SMdWRrPjVMcICiR_i*Ufw>0#LE
zcW9@TJHqTKo4ZcJfuK$wMyw;jqB=cl*xp0a^128I%vvrxKp>UUDBuHK=wRr))NxtC
z<L%ntZu+snOD@8J=hboky+AbcA`6RCUX0?^cFfQMN36=x#Y}ZC?(7Ihn;bx9GMED&
ze>0}x(cN%Gf&+l^9CJY2D&l~d{i<RPQ1*=~;BZQ5+XFeZ*p?Zb3=U9z;K%M55wf3>
z{Bwb4X2&MMiak>u165t1GE1sg<j)230vmJo<Miz>mf^MvwaYlk5A(g52WxE^<EiWz
zh>W@Ei_*A3lX*3k*Qlv#Szg}OBbj}Y#yn(sg8s<2MrVbxSF*Xb!n!#hewg2OklnO=
zZtkXxga$oeX$TyPh^Xs@5?FkkY0b*1zbuBQF%5tYK0J$)6c0x_IQaA;Nv`0<i+?Wg
z%pA$A9D9!F)7mDMmSe}UA=5sqy5jSWSDgZ2EGaLU+Iu`ULtxtT>h>PblPXQOeo+W^
zejET#9u5cLoiy8#<BBOXlz(nNa+c4{a<U$N(V|MUauGtPol?p88=vB_PpX~Ikwaxc
zG;>kY8p%obdIsp;gcvv%We@q#=XBUVnnNp=oK#?n32-qAa0xV~FoETJGcQ(&xIM9P
zG1yQIK;rV`a_0Nq^yNz)LM*@lka!-XI}w{PjCh#u&BUu%1)&g!Fn&^;m%d<$T;xXz
z*pSkPCRb>_8dgRQ2rg*EH6P<5%=f^BDFlz<4?PMdgK7BfBlloM31L%p19G&HQIlF@
zK|^Zl&3e5Yk}Ho>Tn){$fr2DQZs<|l%y>9wjnsT;tSop)PppXY2B1o-siSv?($}FL
z#pQnnw7kD&kCDa29_OLO0=XwC=~!@rq!_3GlJMt=OVf3@^Nlr?@Pxx8QPwlCejLCq
zW}FkxzZPhevK$Dl2!v()j(Bfu8Zn8qwzGSuf*(OQJC2y1z0>YI^iD>oYg4kP7PMe`
z#gSfw@g}s~mlldo*f;GV+~2#OR`kDPxeA6Q7X~d@uozFrM~VA;;|8!4ig=S)M|@w|
z+p6eXs0(cXRIC{uG4Zbj8q!r2j^0!C!}cFmZ+u<^iXf><lx=AxZ<iKuk!||6w#OFt
zzd)5JW9eGZkgT~>6m@{8^WmVCA!tKRk9)s$%TiG3B2VRnQJXi=nj$8C1AUmFAipCm
z#dx~TWD9w<9n!4rz%p%j-NG<M@NH67?9}jl<RG<4pId#yIk*6`V$7(9Hwr&R)S&w|
zlW=-YMk}I*Y1u15o8e)}8HHljt`AU}!8IM!o8ML77g)WhpN_v<Yx0JAE>dIJiZAoO
zl1Lv7<>e;=EupjQUXVk}Tpn<+A(a+iD|0!J;39wdOP3s3VHDNDT%ZeB;0)?cgNqS(
z4Ka-#O08$J46b<c2RERHoR~gC5Q|VMNF48ff5VGkc87#Z&z3e-uO#7JB7s7Kcg9`d
zlCZ*S*pNFDAKv-BtkXrlAJVnU%2M4-DD=3`K*5S2Y}^+fIJ0a*+2Sse{aJ<5y^qzQ
zC@CI7OQ_96p&NaX2gm%OIpcNq6DV|L!x&hrNI-_;kNq)b%P<1_1pkW{C*S;@KFMrR
zkI{(w0vc~Mrp_xJ877Jb<K=cf&`F^uR|=7_w6NOF!f{{GT0}uQg)u;*d)iFA!-Wlb
z>`N~3$tEcFapLpkO;?qC3ndcFXyAk`O@1NW$ky72lF4oeGoU*C9z@56d^LXW?4ixT
zif($`GuIF2&mfADf=c7m#-MEkb~S9s*Hv0xNdLTsi~Q1J)+g!jv_uy3_NUQzD6k6J
zNS$4!djYy$KS5kp@*EO1=4_A2a^>GYkYGO8AbFr#od*9k)c8}SgL0zshmA<ewr7tY
z?fDv!bH#&im*fLHn#-D7>P(<0{>Z;b_2-VO_nxc*RTgWFN-k3~iN-J^2W#GR8pTmE
zn*&(ANdFIUSh76a^`7@jqdw8=|3+dGr<|mt?0L%h>bQT5hu07j-zfU|q&D={WVA2N
zn*=3!lW_-t2eVwIrLwed->&N?T>*{Xl><_$u?{p-#DRyO?9Ka~LkkRAQv%Y|qR;L<
z{z(&R^3WVW{4W(M03$t`H*7Hn;)s`LNueA~c7$e#aYk(hfZqr*5EY7D6;|b>{cF?S
z!ey_(#fQxY^VVMU2Guhm%s>?dM|SV={w$5U9fgFkK_wdv?;3R-<2AwrY3R}!CX%W$
z(`Oc;h5NvD8vL|8``3SkPGLv&4}pVp<WXG-N(dU$0$IHC<P)prfkt(1d^@^lxq8$V
z3#33vL@JI*>Uv>8LQ3}GR~F+`cP#vNCRw?*!0Wl(&s}iYf`>#^?V^@guLzoH>LE+s
z*ul$}@28?v@dC8e#cjk>J88i~dZEImYBAc+){d<gQ?!$d>=@9mMVUgeOr($x$sUmJ
z2LtAhVzu{;=ewx`j1B4baMi*>hoD5|;zPq{U;nZ&wVL5pVp*f`uT#Y{PrmxPi*y~o
z{MP6<Jai?F<Ye{8tT2)}pn<fLR;V-40F(W{R9L*RCX^)EfAUJxX@@(Qd8L)fc<MfW
z9|8#_!@c<chDZGc;*z1#q?Uvs9ek!7-h728m6iPKE!_r;DZjgqi*SIs*?2z7%r4#U
zSkkun*8&Ym2QMqSth1&1f~?5#c79uMpH&fh!VviLz#CokaX6!Vhe;_czk&3vYX-eS
zP0f|cK-&`0spKe>f-JwaX=LWdw63j;_6BO;s90>A1qmqz8M(iNHCD-u`{w*l@9JPy
zw+>y?B5A@uw7)q;{WA2jurdae`Jm3Ish<{Hq^g#sRboKuRo<A>NfE0GK+06Bugh0{
z(lzLba-9|tP*cDy-y@x%R1^(Mkh3b2>ONmjzusl3?>{Fgoc*hLj~Y~`s;l0K!HXUG
zHfW${(i+!z@YC|utstMX>E3^KHNRR8XPBA>y92RyGA!wMj(^nR<jlN~9k{O7(ayOO
zFd-_`{TrpWMb~_9beQu6WG>}7`RwI`v$NAF8I=EkK?$hPhQUXC9m2s9A}}k0yw~TQ
znmxuBa|r<FND#W3K0#r7OcblI>TL78A=prA7jHFxd=jdMlQF;b*_|`ZycFnJasFGD
z0t*sSvQHgU7Xe-!o5XgWxVhetAE|C;yvw$rAvMz_OL{TE{~}~#C3w;jQ$--msF)8v
z9f(+ZEai`!kM7bE<_HH+#O5CyhYE2I#skzS3?gzOy=i7SsmJM{1%_Cap>2~QPcEwu
zbulNOxY%k?`PNj#3f3brkt4!kv0f|h0_b;vKgOimyW4~I75+ir;3T6)Is4QbN-tQ-
zTKoE~;7(b-M?&gSNlOvxm4Y=VHR|%j_zkdsJh1OpmI{u&7R#z<L*=n7u@*d}CpKp^
z9j-E^rIan4A9LlE7u-Eu<kJb;8oiLWFBPG{d4K{m9R0I}!O_QtRP@a}TIx&(7g^-0
zb$4pTt~lpSr49?A_{P&ouayH<X+!!|?Krm3VOSjJF8=r3tbrF1O;A#|j+ektXxNaY
z*NW;(YC<9UgU#BzdylSSLQ%Jlc_7(J!-fp4mOI~w;W1D%c}9WRRsXDO-a(H+?KAXf
z7=&~*Y{<Nkhu<q(4=z0=ws$x3)oNoBLSVYUiJ+f{z@dX{U+~eP6nt#@YRaPO*ItF=
z<0s!%m_Mlt(o&SDB@U44H?7joM`!*Qrd0j(2iyBhen?HF@-E+Z$em@G6A_m!52ovX
zHKcDO<m?YmN$QDknvYw60;oa;9&W*Ox)1w&-QUAIJqS3--_yqbk+<PJq!#QC1RmIu
z6x+;WFW0!V`O$ZDV?-<4Be??#P87n}5ME!9+^E^I=)h-35GQy$Y>T)is`1kWP2lFD
z`?nVU^NmZQV&sX}XvSAkD!hP>G_NVBa_!-<4)OY#pvj9->eWylhHNCWZ(eMBa`|}J
ztnk1PAo9ol0!t(<?GsRc+K}q&`t80w3U=*roooJk^Vc@WrgdAZ|D({8jPhL=;RSwZ
zAH8t@5K5t8K{V{+6iHV({NfnojQ`Zs1+Q*Gx#q+ze=K-}bogobiFGkhk^Tng19`Pw
zmrhf9!mW}rM{+;?>Eq1EZ)7UwuK_K3`-F={s!aDev+}e!c^^`t<~MCy?96|3-0e2e
z%7&O#vWB(s{bOyv`gZ;$6Hed*rBCwUkQJN)Ux<ZH&Ld99O|+CEFB2kO{{^%taN}X=
zqLG1b&{i2^EwO~`c_9HLrqo9YbXItjDl%%@@`Uz<p_2Y*Z?~K}vSu!npK9;}qZBmR
zwHL=`8Fs1<L_hv~aopdp<he@4!NsoEP-dzm#VTUKW${xlCA7KLWe?)yh)eUOCJ%(M
z3jClDlHC$-Pw}J&Kni-$wud5*^7tdzknEX`<vUmQ9+b9u`u<Q?{TG5e#@=k&4WF8f
zm$=2xB8}_mUfptAQ<k@N(3;g6R<9;;$9{hErBiU7@gHA>=_7km|4A{FWvHRl7C`5;
zKB&8unqB&^=YY;o+jdyRR%zq<B8$N#2Lm;MLw{D-l0dQv<^a=%)IE|kbNjtkF7m<F
z4b8W+1uYm=--E&!4LE?>4pFfo6{<BpUglp&J6z#hyfC6?cRQ-gT{b4$CH$GX$ne#}
z2mQ@vHFuG|*O$~Rk&-}Hs$gdwZ;9$7v9Av0lIZAVt)A`Q)ED-|nFFpL>VHHRtRU3D
z5fF_(5}z9Kq$cYyE_7MOhFI{K3#4Wwj6*)DpQgG%?DD`jPEtK3ZeRATesoQgL9w_%
zmhTxM)z>-#46zBQ60)3BpeLEJM{7Z|&<lVEV?)n!X8L^eENB*b`c+}v)&5!1`JRuS
z1<gwDimg0FjFbb<M~{C^IDquj1D~!)jk<ac7FER1qR2iL08mrZWB_~v`Y5Xx*rhF-
z3@3ZdEC)t}-N{LbLt!?cU1G+Gr6sK7CA(Kre>u#?E(|7iPc_)IVhU6#$DB$|7^YRI
z0?;T_6Z(5%FjSw8SwkfU2g%AJ05mj2&4nWni^N)>xp2R=WOCnJ6(LP^@)-A^)5aqJ
zL4{FGM_H25NlT9An|u~rm&?T#?f-8m4Rl+~uyP`$=R>8%hMXzT%YA!i1*oUp;kM`9
zW&M~xjYS5~{UFHRI2=xg^2TxhIX#NS-Gp~bZuZ+;;P{!^)I5cX3dpJ)7Bm!#vYo@d
zJ$vcIp=AM@v>_i%i+V8dS`HV<JnZiJLOV)RVwTQPMhiiQK<_5vpkPCC&sq`l?;yZk
zq)qA2FP*-)W<jO<4C6r>x&DgdAAZ7!%m$fYO<o39LoEf@_3cvsttb~675LDd{BKS>
z>mA}P5DO|&4GQi*!?9!Pqqu}D@CC*1*!7DCbds3DSNaQ}W_lrLOl!CW5lNbqydsFw
z@9?H1$MrYOOL6Oj12{dNYhH2$!T}4-8057r@~Xz@#041+Jm-YupA!z)4JH;e(8r+)
zsU&L#KBzOdI-C;U9Jr?3xCK8^xd!QhUJtpgA1ql5DpIxh9kmg+4(+Li7LzvQ$JcUn
z?(scLv7W8YocgePI@KZ5sN6+0xW_bJT0C(~dU^80A!SO?jZ@H$OF7i0htlk1I>+fd
zw?AA|!bPgDIJhGDcp5r7L9XMQIIqy32K}MN1RHXH__Ec%{s9MO7h*r^(s3Xyo*ulV
zq^1T6=%Qbc7?+j^ac=mH9XQ{yAxjd*4>>;(9OS?By`Mx!)}%&A?JX_P<By{6Inc+o
zOk*U@xjBGpkx^bS|JFF)olbpM^Ms)W$uiSKu($Us$MRQO#;l*ptZu(5Sn#OQs}Thm
zS8-@DppCR4BNi{{vhLe5@D^~&{CqKA)MTol;yu8DF~T@u@Q|MMwK6?7Q+evAVI%6N
z8}A%$rz#)TY=*%_qCqwR%TPcL3dV4K$!U5V9Cgs>1Pf90src{wZ1q5&CiR<BZdR{a
zw7WsSK(((K(?l7o-hOlW?+?C(nh_7m4eoZd5RE1UA*%6TIcb>J1$(U#sn-vXp}DQ<
zhesWHJ~~Min=AHc^(TGfp4E%J2x`&<b&|^E+JZ+l0goDDlaq1#t}Q`&xPdY0Ipgzl
zC(%3CC_8EYSvoMPxArd1s1eYZEW8EHqImSsp4OaFPbXe4H=)C`Z{gbMAAM4K?%g(#
zj)X-IRJX!|^sylpT%;+Yfiv(sBTOe>FX=n%-L>svAyzr)#a5H1L=2|%LZuN!Xz#&r
z(1zSucemHXK2WH)?x3f{(dc!wUExld)PkVmTEz5Gmw$Z!0IPUxJ`|VdMG-7=d=~~r
zrZlj5{Qx)UAy?`MT3Clw*Wo42$<c(=ZT{is5RvC=u!7Ol<fu%FNOS1{kG5agLrXvh
z9ctm_9UkY9)A98@{n}0X5)Q@}U2OeTomiT8VKL655!I6aBD`+)OezgPC=cT4sUQS{
zpoSMUXhTY@9DikB&ay6Y^5zWRzD6zRGJ<u&Sn?M7luCw(RwM@?VncTBn)7RcMA)OB
zJ2p?x?DEo$cCh#RH?DbxbfS=JY(z;-lF)u<F>;K)6%rzwWiRRsHY9WR@7A0H*Ok;c
zlyCg$4?810F$(nX-=HJII8A#v(t8hs2PVc(nRWY(n>6V9+|fSq)QuXNF(t9+PnF)u
z(g=(y9D{DFm2F?^Uub|><WQK(^HJl54M}S|ed)&c;MDGEgVN<XzLTGhf;mNm5-_?b
zEukpmz1I`@_16=Q+9>r*Iqp>aYz)NZMD^;jnWCDMLbVke!Zn)gd-iFIs+!1Vk;!eQ
zq!f9iB%bkP7ZeZJu-X+>#OR}3CO&Q7{m_;oQ1N|q$%}ui>U|Rtr9d-*a&Vj-h>s27
z)%HpHfVnyM-49S_LD{;v@k_&?$(NO4TNGWfIt8xToW1{wGoogDYS8TVfe~~I$o7Ht
zHjcac_LOH%GB*D5*1nl(C@zd$k*f;3;xNl})m5Fa)X`+p&;p=pv>^+}FL0Om2(r4y
z)SOkf!ZMoG#iQQpR8@BKH=D(^aTkFLXm{7lPM`2Siz4&Pi9k0L1tSxfig0h7ZWF#b
z`S8iuY+&0fmCpHrvm{+&P2QG<>koT68;^D|%~<N?Z1;na6TjK(B=3xOJjz<qH~@tj
zBpM_pqft>;zA$K}RY;ym!F#soZqanc9Y5agcX$Il8JX?=kdv*NxapvYl}kO83WH;!
zBXJzsYj}`_4QV-T`?%zn!Qg#5t?Ss1KWNXr+WpyO-PI2R@Y+@-=f|gew(o<JTTw;z
zP_z*aGd3jGwx+wQ&w*pJWyhC#PS>VqdiFLlFbM~(9}e2)_(l1?3c&WcNS&><zpGM<
z4w}UQkOlD7`tO}bRIQM09UK9?xp`8@A_vPcG2)}PI9&AT<_{nQj!G2L!-iOJP>gxt
zY}#}rvJ5`;N5&3y)7^l{K@w{g2Q2%;0Z8l%&@_{W#6LG4g<HvT&a4Tk>c)_zlpllX
z)^hK)LEG7b4knEbvEjBLVlVA8F&s)JMxP4<9<09dmy;Aot>atw+BhoEAoteZFScM(
zg7R%!U0Mc*Vi}e^*^}DnKGa^lHSFolBZ=K9LCfeX?q4`uB&p~d9e=~&yo*DE4VnE?
z_V>KUVA<jT4qrHm6fFd95Jg#5RSjh3sMr02E3M&Gj(#OS&hu=`@Ag|ArH_gkwBRDe
zkY1U|nl<lq`1OvE_<8SIr|HFW-k?;UW8WYa*|D9EPQ6g<7hJh4-rR4t>vNHtb=^6~
ztO0G^(KqUFJwIJ7&3>5@7f|*%qI|%fgPRxJUwx2H4JGkfe<-{bhvMXp@E<HVax6q7
z|7p|*jz4Z@ELfSeZNWvs2KQ5o#^oZrFIi7@CnTAyfF=A2YNSM`YX;AL%lC93&BCE6
z(FLKakd}wp8MGmj7Y&JdzX{|YasU-JbkrmqrVY)vaU>0=;sG3)Y1oiQmwH63?hTP4
z4w!q#5)72rL2e{RWS`Ik(xNzEr!+DJP>o~rXqgC`*`dB9#$QFX+_yx*m_@4Sn-YgQ
zIIv&4vroVVa3HKil{gfCct*THW5+Cwdv}2G1M?q?;>AW}3J3rPLoE3+y5i6xTfi`2
zL$=&)oIA@<*sO8@hhE^62NFCYBlA#N)NOpA`OQi$!T~@rCDuq%5lTwQd&m1s8lM&R
z;T%vX1s<dIWU(LRrg>r+{gqDbVBg091%>S~847(<lRd0C@6S>F=1hm$%^WZZp@Qg;
zLrId^^Q-Us`xhaxX6~%OJ9Q^^du|_QQ{R0j8#V>6^YuH`_l&sG%(VMbcNo%_tFA4t
zQtd^!WUXAS$k@GI5E;Go(38q85<e}rP(NQ2>MY5}=+&DJ3qch$Y)GH@xK$;N!IX(B
zTkP7G?ifUpslmNa6wJX@9@_e%ZUfgp#XxVr^3{C%<bv!JCxbKzmb(CnV4pkJEIa%7
zC-Y9k{;ol-IhP~fnh!V9Sd!!^#4#-$G;(gRCpQQ21sATXa2l=x@yhMNX!2A+P5<OZ
zpF~F0U3&MEU+J<DdRr%5IZnoOXTyxB?#|>ev%3_ZIYp`?%3jD(-JMBdogbc_I=$pl
zr}3=H*TK6pI_vXO<E_WztjC6wd~0XBz3bu5>DSGok5~BMZ@NS&jx>$_ZiVRuwjvCc
zX_~Y`W5`T4ebkA)?6kZ@p<Cl;A8?Y_md$VZ;p(i+lY%#J=*1Ube=P-lV!BPRR7T7>
zb9m#l@^G%ho=c?R^`I4|40fq3G$x;xjlc}JmHlV*^8U_8%%_d@_-I~H0c6xz&%Om%
z!-m|RlD@Z9_d;OQPG4<4rXD+M6T3lq7#N{-MI3C%?|Z*JGw(K3@_6IxIm?fCrD=bb
zs*iZr#-ANh+p(qsuqp2o|GBT>xkIbAI!VHU0WFut?L`f<psS*hr^-+J)QbK61Z*)1
zKJ7K>&cch9sX%AYZZ?8aTf~zx{8}$+m`G%sg2McO33CtHR&0m}!aVFAIs4FpOH`Oa
zr$E}DFx~vw-H=S1Nbgn3PEKmn;^e*2kW0@2>L<{u>-5wahu_|JXC-c+FcJrV*-$5~
za<<z%`4k+4r@^A;te<lBi6|8ZP`eesJsHN4-EeTwCkEI%1Ha@O^7*vR4i{-KBxy&(
zU-D+SQwWEP6lIJAk3{@A;Qbdj+!Ra0lL9%AZ2TrTjXJCo?0rnCJC@^J3oepX-CFvb
zu`!cn(1}O4#3F<P8SI+sqfu{+fNB_ABx%9L4XQr^UVp(0!LqO7CdJNYJvPRbW2Yh}
zyPp@AC3-}m`e8iUNZ!p|s>I$M<#AbhF7qKW<f1Q?n3g4HVY>GZ^5F1ZE2|LT(D0a_
zHpG2!*~uw)z+G9^aPR!=!%9(Y2*Ok!vXkX~N@v?eUXKRM`HK&J@cwLicxmdR{c#FU
zf+Q8wJ9dq1w40ic;Lx%Cwn$VfVHXrP(s>=kYiH~wG6}9frb5t$tbOA`rydt_L%jN*
zOogVr`2y4V;3sft)UhfIDI}GJ!9`6lA9T<(J-YZfw9`3(C^lqz;L|ee?t+i@(LZMr
z9q-25Pc$VLA{;JNzhH)`$s5f&D^H_c{^ahJw-t2}->TR{&94#r&eAXfJ;{zxPO>ey
zNLMi_)SlD%=}=tquf92$@0|p=L6Ya|gPV5zcq!w#E!}wwE>aY(d5ZL86^HrycWnp%
ze&7<^#A&&5!mtv5P<la|dG#Df&P<VS%ySuFhKYj&)s>YfB7K+bJlCVb$`$Aa+E~M*
zmnNMrR%*7e^^8k7TTzZw`4d;9K$G9czg&pE25Jr|2ki5VMLHUfJOHCXLczma?hVUz
zgs)cOk!Ku&;Pn!pxnPezsHcuw`ega&!YVjH^7kLJ^2rGn7nRbXM>8c+K~*#N-r^p4
z$DRKb-l59#<Jf0S^HT3ytm$+@ln%xbF@1JybT>oKLk{4IZz`>*_yXhs7Y(#q*>D6U
z_gq%B@M8Ve^1n(!Ew9Vj*WEoskWZ6^Q(YE0`22{2<m>jqTe&(FV}aOU6E|8cI}Sy&
z@1-8SHUGpdcsXcE#W!w2&bRH7MdPCH!qfn<%6_`m9-Mjd;zl@o$`o)E{cLkamNfuR
z%w*E>V3y=x^OF1Xyl~TC&92p5U%A1mEBI1}CVFYu7CfFnIxckuprCmQJ|Cj=26&LF
zv~_KnKNhrsniPw66sTQk#xYyhs|2bNEx+v0-Y5a)5*spp)n#8P($hs&UG4qZsJiTG
zX^<AGxjW%dZLOs=?+*F~J$s0L)7DaHEfV2Y%bBiKhSYmGnMyp=K3|dctbviImL!7>
zdgaVCJxiR!q8#>lCBo6?K(J1!tEP;yiHb%WSJl2Wy5nUW+n|+CiO?u_xq9cDKB?DV
zQ2p+Ym!dZ{US8S8rJ$=<Rl4jcp+sR#IDiyQDxs@e8R<Fo-a31@*O|*jQc5}|jcqxQ
zs=u;RlSdv7dfLH`JU&SIx1M7;WCfgg`byd6adGyGr4ri>hl|6nMjKMWnlQ8H2+TsI
zpNdNVcd5K3Tx+VjNH6anhYz3YVL#VYS47V7#YgJ6i>`x>P?hub7NtQb8l)30_8s^b
z$xcJE-M{U8{r40gyZG_ytL`s)Q29t7dXVC@&qpL|$d18Hrz{x-*R|HnT-ht>yw9qo
zGAkrPuL^W%L(=jG>J6C$=MaBg>e%jwhHv2TTlkb`LaLP(>t3C{6Hk=#MB1V%1EQRY
z{&oLMfp3pQyNI{YFL@s}8DQs*%EeE0)CNZkt8ils#HiX#7_em7Np?@u!mvVBanvlh
zR1M_qEL~P?bST9wyH%Kd^Rr#Bgw-zED&M;eno-dPX}Xe37Y-8%1|9Mo#37`UOFbS+
z8Jef%@%DF|<oeW-x9>b-$3t@2RJXPADBOZXtz6Ir`oI<-2-lw7NnYI62L6HnOK&!k
zq@CG*8MX=bee2?0YgM#gEBhIyx})`Q+RR3swcrMewi4Aipk<2fa~nr^HXU8ff;eV-
zX?nb*s-FcHNrt*Lr>3OcYdnA5bl-7EEL*s)z+c@SQRh%Sv7;`VVeg*cY{Q0F(5Q5k
zb&l5RsBGI$@kRu@7RBDU3#YY;oweX1U8xG!6#bFQtVj}zc)Gd7{0;~09d2csC`+^j
z*G%w$LNE$pY~(Z6A9kI8BfgdKKzO*341<dVgBGvvZK?7y;N+{NN2^vIUeaD=)ox0v
z7F;@>p>HLsr^VtZh1ak_y)}7$>MAW)1q&Y1402(#EAYKPUt72dM4zogfL;kwlhXfP
zN-Dkb9yk{q00xvpu}L5;Q(TUJCcdYg4OU*6kfnB3Y{*$f*K--`lI*Yr7wJmnm761#
zAm2w3R(N0=o1pR*pk7@}GSwhh&};|vuw3eO>eygIe*dY&jMo}ucaef|3mdffty;#4
z6b2XRiaq0Fv7=JEC~l{&PjxnVZTfGti_ep8U_nG;LFJQvw4E#blvx}#pw5OSDJO~r
zk;*lAYRh%Op`nYSt;BU<PMu=SK1zc7)0Hd#u;#Z4%y|xzG#{a%&qy0GtbFIxgCD~K
zu1UWh{JLjb=9+|#aHy#3$HfL-n^@gNHlMk*{LBG+RO#+Vu$&2uc#uIO%iO8C5K3Ub
zS$*!^a>?y%y_%0v0cSx2fgrgEzUx`OrpO^+c+K<?O?x(PNxd4?&7@fiEDWSm)yIYu
zEAn01)lOO9K=9oYE4N*XwAVc;Up2k#{$+CN)kwg7_;S881;^U^U~0@%PE8&JFph&)
z)18<+7u$zQWaM<n>NjUbl)n7aoy;!s^@T!D=iPpt@@m=)scz;IoNL&S$XDmCi+mZ9
zxn~#3l6t2WEj$u-{gcyc!`fo=x_5;K7V^DW=%Tw^JGNc0JM?pCi}73?8!{>?|H5H^
zwsw)vTTh%==7au}Q4uw&fRoY)%6PD&*oc?7NmuVOEoWhN&zV24ORN7Fp%JYQY*1-K
z9OZXKUOe2`MJ8?9RlCe0dXH5cu}Bv-LaT*y0vnS4$;94o1>oHH<kMOY14&fF1WFau
ztg65bm~RZi(uOS9cD?DMR&XkFcuM!pZ~t8fl~SN!au-LD$0>g&RNAxsD@f}jU5@SD
zRo-&BS+_q~<R=A&R(yl|7TedO>ESjuWK+8=4W13W0FTkr4Ctp+kpy>A25P3x#Y;nb
zee^><7y0eW$DelF%}OtYRS4NL3obQ*G#i1}1kf-ijC<A6lKtMPZfsIssD`!wLA{G@
zC!M5LH(!dbK{-??1C**I5qisfHL8R$2y()R$1wOIS6KTg@mM+<ygtGn{{ERwG!f3K
zsIV%L-s;h@Q$z_!YyI@?myfob!_u|H!Wn1+Nd8=j$)0#Ozi0po69ye+WO7jO?8gtc
zIukK9Q|=+2o#=Hay)`(;%{Lv|b@q()WFpWOgyWCKca>Sno(~9z!AHXCNz6{{?k;E`
z{w~i7mUf6=R3jQf(${x&TN*jGJe{u3wa2nxN^PLQ2t16F=MyT;4ZHh)_uF4Eb?3Zv
zA^S^nJ29G}vsxs#7EGimO{YvLa40DSWt;TKv~3BP&M!u8SX?c+3MD6zWQno}W@>1O
zvSHcg+@2o=NMowaJimShjm}sOnbZh`RCZRa52Afj#;=KcBl#><J9Q*53B+F@HVvvP
zXh}wiAo^4oj7)bJAli_`FU$2m+wl?Po)`eS4Pizm3?@p+!aO=Feg}G@sEAU7nKuV1
z4je$b7Hs=WCypX;Ddpf3dRj3u4Ht2hE{pra>Hc3o?>}BP{WP@^mYJh(L_BrIS@4ji
z@B(R^n_3i=mMFNuDlwjVZZFV+Xe(No%cY(@ic*5C>I}OA88o1`a8L@k2YPklRYSQr
z*X0n2>jnJQ4UCXUQudo5arnt{Aa+p24BGBd2kSPNDAU+j#??j_C*o@Oe(>m6Fl{xW
z2ipCf&;V6=r-4WC$jG$X{)HO~(1~m6Cp|~EXasvn3l9759Gjke_eGk}AS}3UAHw;l
zV)wkwc3gInX8jxPzPLRfb0KMJ0j&(E(G&E-Dfpf_%+<uSfk}{r!E2`i+tj>bLtag2
zo4b_`4<&V*T7P7Xw;YshHO#RKd%GKZ8xal-C6y}y-Ux+vc3^=-dnzN>sx~tjLrND1
z!f!C79`Wx5BAq(?(z^7B)JyAmwoUG`K!Xde<8DMBU($``s)cnRq&H>3MS9^*-_+>Q
z(l-W``QhmAP7+hX{q2D%*{N79$bpYgxP}WMV@MWcq#X9rkt$%}NG!bBD_8p>EXERg
z2PXw=K}51S<C2q7J&=n}3;q5JbB(+Eat+Bhe9-7IADncOhU2Q%duOq6EFNq~)qI{X
zxb{-shx662j2;vkHsp<VkGB5$={YAU_SvU#yQ5fPc#D*E8kjbu90nOFoA=0?EHSJ;
zcQSe7UDvx0;3V+J+%L~>SAyO3e;x^oU=llhWR<Cdx5#Q7syucT8}i};M}yP1Pr=*d
z-%UJ`@+qs6DBNf1+^g>M)*F?t-rNeWzF%Lx@zoZU3sWTwtNqe_w&0?4<n?NL0=yX*
zv$4EN4Gf&y5-A-Fj$R7QwYomAd95IsC<R_Y5l|#`c@kk=4uqy8b&Y>(<U`J&ONu4$
zjK08as2aU6hYh(@`ODHpYQcn#+B&1-w1GJ?mSq@RQxBD@ZR#`@Wk35C3ADO7f=w#3
zl1)U>7<w(Iu>}#SSuWJbvwxMSP*7d~1I21u#OQT(3r!0i(hQnQRdMtUxyqfuti~VK
z(LaYO0L!mjTsySh9qQbK)zL7xNHtVRG>3AWwey;%U8y1v7tQzDs-KU&n9Z{2sj+>!
zY-2+<w0Y#N7!9}7Uuv1TSjB@8xW6`!$O~wujA|QEI6Byf$9|0T_8-{Rj@JTHO0cOb
z2&?)DS3qZ<?s#^_J6Xc=DAx`P8r3zCODpT2s|Kyv=IRx0^n|R~#F3pYj;L3L(vk_d
z)r9d?=WVw5oxK{bfSTQne_em)=*o=i&q!nT?v}sjH#!e_0{i!-W@)?gMRu?!JrwXB
zv|6Apeh7=DCB;KUb?WxZk^kwvxa{XXfI!hnXZ3GeU&>_>4m}946t=aXp>PUN8Z=22
zD$9FxdRL7;t!*f)97yhpiVPQ=9%ePyF`&sOWf)BJu+R(;gPgp3yrKEN*)RSA5@sfV
zRXCT!BF9o47Ll67b_?`nfUxsP4vXvJ(cGsUkblK0_}ycADs)GxfvP*=m6g;$_tHK8
zue2wR>nVF%)MSc8GD;>{Cm|X`MoRW%i5OXCDy8fGBwX1lLiUC!YqlBNnBN#nmIi~2
zqP%uytRuTIWDps<d7tN;@4e^Tdv5W5-ha;L{&Ao4ob#M>p7We%ZBO@U$)|$xDb3G>
zrZ0K(F55R}d!m_Wclb-xRsAx38|XdF3H!B>lp$4Xz)8cVN6guBj0#73w<v}8iZ2Bc
zSFnU!g*;2uO#I6pd;HgRAIYv(3fEu=1wce7s-cuk+J@uNYUSxO7mPaaML5kj`##Ge
z03up0xuVRHEAsf%TFaJ#e$@Q)KKKMc#AjF$=26F^)MB55l{4u#TIQ0g!vJZ%mI5Tf
zsdvo|NB(0wJaW7x=QQ(7(W2wj599*6sgkf}<x5x?ouot2g732W0dOT{@?flk%14}v
z0|(3JtyEZm1TP{f(W3%4@5zJA1tc*yt?N@NCtx@QSh5M&15-io8_4Yw6*)RSoVrGU
zItZ(<lSYcK)2h#{V({EhKafQHtCCM$UkaEoRhBoC-wCmb+pyG2kijsp$I82*Z|QYV
z>Qvb=6JSmD0ujkc>KR@MTKM_SiQTV2V$~)yUr#&o%rrQc`EBs(PXUt5Q&rL8+nK4|
z`FXnB>UrvoEimYjPuIuz<o@$+VTsLCfF(<6sYs6~e?@ua05m$0zR8jmFX~4_K=8;i
zyH`(r5>G_~O)WhQfwme&dI3n7-*#kLJMe(;I+V;!@ss*JhKJRQ8Tqxo529I?%#|Tb
z@ge{bWL#cXg=ERLTm_#aVr-;cQl+Y6Mu7Wh>wj;KxiaS8cN4P|SOF(qmX~Z%{|$9J
zVUp}t*9@iV2b>MgC_e@c5pa!C{x=fy?haf8p%9(sMWBA*8Pv)0MC!=J73T#A^>-}*
zRG3>h;%keG&d-ZptvPyr!xqncr%+@+>N4Ik7!<=n!APtK>gfmvtrkWT)g_aLMvIb>
zTnf^BJS6HYs&yix5k$#^<<RYGw~^Tcw*Lp-(@C`###EZOiAs<qB$r^PNB}b~1}8o6
zyrS3MH1C>SA?Ez(k%M;{uc0rFQaKb8b_H0(X}IU6!Ti+66&tOl+@BKqEZMR6)VsHM
zDX@rDqpGq6$)5?0j;i#oI^{2Q8a&lCd%D3Mr7$BFzu^QRllc+Fgdol3CECaDa)CIx
zrE5<|UO!6nAC^j0Ha`KDVAXr3qJmr5Z`?Xx{L$z}bS5}$u0K-wdY7S8tzuA(6T>ta
zFF#WO(gY{QAYF2xNuMp|7QM+swJS>M2cByKdd|_1)5NO)8l-+neQ~z#$bR@cNAu08
z_4K?~qg|9uvVBkvH=a=PLIBcZB3=r_H=oBe@7K74X98jK9PYI&X+^W@hO5RLlK@0W
z3QqykTtYlLTILaKn4X@QW!9S|WMB$xeh~#Y6{BfoEM6khs$5l1zCC@(%-7^N>Nv7F
zMl~6iB;AYr;bIm^Ui6;3TwC)0agw9^_AfL%>C7d^kh|yY+noffGPS|bC4Y}`YUQB*
z@8dlAcTi|h1<1zN;*)g~>MVOi#~C%U`KK*WHra?<bCZ$V%#YsV+V895{+1N?7b!i%
zxsu1E%tJcD@hd36k=?24W4PSx{Ngok?^bxD1z7yfJAaz<N6IyE@yzX5+TzjRI+APd
zJr|GaE7!6FNMxt!SrpM!SsZW}bGy1|`t#|HK&#dwetSSj+$wUE3_QXE??oYkSb#*F
zy0vE-K>jqTff~~0nchwvyHHmR#wO5H{!&FOU1jcxAb^u4QN_%=+hGYW*%NTe8Feg5
z(CZ>cWVp>4hX8~aS+ae_+w?}&A|zGwq##t8A7KHG%un0j<g#B+B`PAVVk3Q9IeWn1
zI-tM5|G>|!<{Wapagt&JvTAE8-J1WeN0Nj@tPlzX)gp)YCPl<_R8$|O+Updi#$lUd
zJVnC)dTeMaQnB^JRNGipi0x1T`u~Tm6Jo0p6c+`Bw;?-NWNe2aQ6r#Cnhqy@uc!J;
z>c=~9s=sOf>t=ZOL!_rodq5MVL!-IOsUPn^qy8qTA38K7yht~-j&b7DwD@-Q;~hBF
z-z4<|aYBh;IZlob4@Z{!8BkPdLANAZHnkX})XJ{*Uk~OTF=4sLR?_L#ECtSpPmV&k
zqX@?rMWE~mH1*WfXUUqxjZ;Qcs=k%5CTt`DPQb_Dczl1CedE_90aW~SqSWhON0%hT
zHxb9l7he$I1bie^+Zo|(lxo-qHWoB@{H0Yc2W`i`Ho?ctCf23F3HXQx!H42wx+}FN
zkLK<J`$WI)UO2W!2*=m*65s@Utu;Z=Mrn?HU?cT8R8S}lgt)P8ed6=#y|p-saqFk}
z;y!DI`^;J)rZ;S)hKC1lNRBK6iSbFvZ+A4c=$3&WCJ9N$Mw*lp);OeZdB`{@*P6Z7
zwKg#<@Nn`KZkR+lgN+npQxKJU27+2<6y?qPET9XyFL^j66NhP$bKL-hrgf#oyuk7u
z(agc)$w(5sZgAA+V-2|o&EbubbN{RieisA0zHj)^DCz~wW0d>A>7j(N;Rs{p+~(q<
z8;~h-T<W39OFb>=hk1eqA@RFHqa&yQCoEvLEx-xshaJDkTD3lTtG`sU{kTc<Zc}GS
zojgzzDMR3R8B2gee41x1QRvb{3tTp$W?jequqr`;Y(x#4`HXQ+z*XRGAWIo7W><B6
zuqDE2GMN8wEN_;xB!)yYYAA|vSk!r!tE;`B^SlZB|Ao5R56)UW99m%{?yL887@)zE
zkP4PdIe^b_?xn#;i!<g&9V-@tU8Q}4Ay%)Kqosq3WF$V+mXWrEQPVnjql0UX>+b_e
zj0UX8vfezT8IIKO=;xK&b#YH(BdKmyk}6Z{u@U8s1sls+dS~&+OH(#Ljq<piR?pAR
z4M1#~TN+s{;W0~ZjupD>LcHT3%Mr&XLSB2eXK4Q^pe0iM$^a1$h0kBr=bEvt3pe-F
z+?WGSL-gADh1iOWaVb-f1eOdOOg%WFu+urWV6dZd?%EvjSs1A`7Ye%VK=bdW-T>ma
z`DaPFfei`qc^Cb793`cQ+zGwBv5}&G`ufnmrQj-h?f2&~U4MU99%S_8l(CVX`*;Lr
zr$N-}0ISfpyNg;P^_l#72j^uWKU?OZ^;=#3_#uQy+pUZ^lJf0AQ<AVy9sX=;2{7o!
zTu(raAx$g-##$Z((<O~G{j2iUZ@fPakX#>~>pjw`KG`Rt4;Js0zRGLhXD;7C%<0A8
z!QMljxgm&n<o4llwM>#(+;2bIIq_jENWh<e7jLzF7)gXA!ZPO|Yc2u8ven}zU2O!s
zS<TsqTUs3|bC}^v)-19AF{)~B2%As*`kOV5FP;*@82y--e~2|PgOEnbaQ?8^^T=y(
zZ!e1JJo|b%oTc6}Eb})x)9!`TN*<qd4E*9JdX4k{#pw>>G`I2oiu(W?Nh_PSdh)E#
zuGF}ohhfHKzTCpPt6Ofyy#Vb>*GIWa+I1%|oLR4gXeqNpUV`n3SIN=}Ye)U1ZXHvz
z_H836rFEAEvv2S@`6TxQ|8_mV;7zM&kka8gY)q5SSEGoP%iY@uIs+*@_;O(#$a)1N
z)M4WpCBA~lJuJz+hu<1s5xgkXjGVY+dLuGZtMaqc5?xfcyWr62KFK{}0A%_~{@|Hi
z1cn>LJhg^r)dKs>EJzyX-k|5HffM$V1vgPx@S~);vcV{(27}@B^vVNXOBsoD!A8>5
zIE!{q^*xiDPjoQ`sYb>^WVHH;jocQKFN9$7g?Vjnj4A5}mD61Erb>4%E~0W&31urd
z6~5gAyW;F7Fjn;g#%jQ*OhOKk3=PONMaX}#u^1^Xs-?@xmf;PJ=8hm=rYvscx#pq2
zG_aLlxl!3Ecv?%yuqE%nD;XQfI;MyBjh@Z{($J`on4jB_%8xv*93){bG!XBV;0jRK
zNRuDm?T`+afz)MV?89A?XAqgR0#?0>QE0(OxdKk-8Upf9<c%4=gX&oq=v||9fXZ3K
zxDlX%Ca@ru5>^5r%3dF$pWzS;T#-W%-A#&)9fwPs(zcDyh1|w}T2*(jxlK(J42t49
zhfvm>94kN}E`4?2K|nj@OK4zr>`ITS8+g(23A}tZ{~T5^CYEO6dv`H70gTA8s&NP(
zu1o>L6Eo0y;;?!_5TH=it=Ox`f$FDpOoHjPcv=c@0zRhp<MG|yK7P-dov_1-!-m$)
zs1ry}g84Xkd;%QeQwzt_s?_&!y?NtO^`3_h%0piHO9jURTBWAh5nP7L2i>WZ3m|O3
z>aoj5fYf2jK$xWzTO{r-Y$VNaa$xcqhnd+Yhzfu^2E_SX$)%`D0V9Ous}qJI3LCml
zKEOSLjr1TW=zK;u$evUGX8WMTMYYM~ICKi<N<bh=07G<w-jzt3dvQ-g_6Wd68p+vq
z$FgG+>jp@keg~S=dqU07A}kKK8V=W5M&3jkDZ696u2b6p?AkE@rtbMfauh)MP)kN3
z>O=`~XAg5m1^!z$kMLa~mW74!@Y-q3M(Fu#`oq>eYKq&9ZBu@`ZFrnlb%X<W6wJ(X
z3S2RhiY@v}!aP*sb-Tvj-);xu#GjXKPY$2sM7WwT*jZLUquJ2t7@JlKM=iRGN(jT%
z#7uAea0N(QRYOq79K@Mw#5um)(^tL|>cKV&?|$IG=0ti%^fTqJL&i-7NV1cRQX%th
z=a;2ij_<Ls?I0C~_q-CA(fw0#S%|DF1clUlInrZvDsZdpy%p;f_VLF1i9HCu#u-}D
zRdVBWcmHYecVN%5nzbjv*`*>`5$1f2FQQ9TBgc-Aqr;=ejEt3|pdc5C+R?3zmU2w}
zz_nq$n7eSR|5}nVF1A>2hRU(g$dMTk&mpVGjR$|V9ArfGg{H^E*Rp1l6oAME&@Ur1
ze)8xpD93ueeFVi2TKz10cl*2N`)>dN(gY_vBs@;7>PY(ub;~q9PJOuFYoiO0h?DIA
zV)ZFP7R#ff6(J#(j~2|JL1_#KZ7@nXpruY&5P%SqNh~kFt@9qtcJ>Xq?JxaR?UyQ3
z?$Njl-DS!yVgC5et}yv|-dj-EwEiH@qcG&%E}v}SRds=M)T!K5`*v1zcdG^>l8K4V
zjVH*_#Q4?4nc(8%F{bsaBPlfehY`fwFeCu!NH2ekhmR-%c}zPJZ_nsa2npIhog&>!
zzqXO=E{16flAidW@Z=DH5R;CKta1g9OiM^Q`*Bk1ykYs|24=|2rzHR(GX5TAKJUC6
z`pG3DBFnXX=`Y!zc$PZXnq~(!Bqw6-alCBt<Z^+RU*lp>-OmkM>9emoc@gV<ECZ32
zLOxoRA6Uu=ydm7gfRaJlP>&mY;z`|WpC1sq6_~uu*b#O6ETzwnk~}QQqtG18KpNQ<
z$9WAJ$b@tVul-iAF{SJCeHQJj-yNz+g}>^XV?TwgIZx3X{52OEIB*D20vKX5Fa>rK
z@$3FW_|p5A?ZE4Orti5!!<$bg2nFGStOl_N^LtHzHOx_AgSFuXJO9A88i_}{1xV{>
zz0BYHIi+ZcYr#)bfHWdxa+{6Z3vvjOMr!lZvH^<@#|20^R$&D-y(S4ny{fH+b!lKG
zMD;*OV({jPsyaqUF@?YXed^p=!^t&2Oac(1)16%ATgM|)d|s}Y^b(?oTG;<kc}+$O
z12S_CEdU`hcHEgXz+>uSH-GSGR|pB8>pUSV<@$63Ci7_tKxA6Hae+*09ytlzgHyYe
zX`sSc6RRK|1;G(RfJ1z6_ZaI1S?(TuJWBL&3r-)>sRB8-Bh3LI9D+)~4iradba$Pa
ztyK#l^)##+FC^RHkg<_yNCkLOt0-}p6)`XpDkjIugHgt5hJUw#25w~b$o;x=hyH=5
z5BN*e3*TZr2_Fi%FJoy$Wg)`dM>yWxCcq)a55r?eKq*yx!CT>0K4@G9%HlyLr@3Eg
zVH*aee1K4IC@yxh3Q&Mc0d+RyA;JG;{GZ=hK9wEfA65W8LG8;SBYo-+lPvlF?kfC0
zz}Ua=zt%s|qOUa0BHr%itmv(v>*8E2=y=v)|AfXoXA}O{`rm;6W0nrx_%-h)ZcRx4
zN=M|;!uW;%wf->=qf*P*|MTXVwbGt~T)VVa<d4&?k>oeD|M@tc1vp=R{KEfQ{}*sP
z4UGMFsC~wv#W-*!ZFS0jM`VE`p6t^47yj4!?+B}`xETAtb)xRj6ZIg&e&VvOfj2(t
zMf!Jwzm%%jJU5PC_#gX+lUGLGjfXJK*uQ6XS=ayE1rz(t@6&s4x>AJ9g8Z*|VE?u8
zf1W<V|62cnNdL~p{%O8}Tz@GoJLtDnLy3NZ_D^zljyCo${IB(&jr4DfOoZS6AB~y*
zbV?;q*hlPaGwIN8#8zC|_=W$q{vRX#$$0qwJ(8+DIClk#PhU^4^ZUIL(dJNkR)P|8
zioJ3C!vENRZ}>|&g3VF<-$r4!?(WIuZLPXPGN|9bUDC*Hyd_w|_?~4+4y?H(2W`Bn
zPx4*(4;1QHSO3~4X`~9E5J1bG!qy5i*6vwf<i5cEzQ1&<_<F{lCuwO4hw!no5<ey~
zc1YY<<f7N{gpe8X6j9@BEPgo4$&Nt|rPRlUoDhD;2>$~`blw9pn#YwUWM$>=;F~nk
z&pq6|0@{PK!Z@dlPwFmoBX=fmlUEWDUm{YJ*MVj&k`G1?1i5TfTZiH$nIt2W4(tSi
zog`pfHk*N27p}}&3F(^T;A#yk`_lx^IymOO$dhBP>zgFEZg7A)r)SORooGCu7Pm0Q
z;D!GMa*V)(M2v5|Z%Y3=SwqT>h0OeG;<BqP9!~w7b>rimFwmWa`m_je0=}kruy74v
zV=|wQM_c<;^<4+#@3H52*qoJ}MDn9`Ty?@I1x~=X4i6gf+2QF}K47v}!xxSL(ulQI
zdu^)F*P(8HjyNYm7k+yQa00$gcu*VB`7ydg>@Bll^;s|<r2Uio{B2ubaen4bCU0GX
zQ<m=s^=|oES+f_ss;O57O~bvl6}K`!Mm3?Qbm`B$;%W70g;o9Ii&&caz{&$4iyxkn
zI{DP{4`9(ZKZq#!W3{C!J0}9l4Uj15baHHyML&D-x^OteQ_zQcp(p|-A)Li=suVbZ
zm`!o<ESr<T{jsduf<C9gte@i8x&J+vzJ!=eC}!aaJXHiB0hvASu-1ezD8wLujYI<s
zLF941(eL;}dm6*3+bR6yN`XUs<u$Vp(LM_^qjunYK$btH-_ez=$jnN5#4>^iV2F#e
zr^u<cFtu&Sgm?+nuH6@opDu=Xg7y9Mk<0ti&~F~BI^@Yy{xa^b8bu+Y-THyaHMU`D
zPLnwf#DE6!sU*<^G;RoWk3!ku4#h@#F@NB3m$Q$-NZ#&BvU?0s8WYh)u8xbmz__Vs
zP8~4e?+8BAa^W(Pdy9%X)v-?^y722O{0}ssS0@qeYSYOxn$2|@eY(=9C;pQ4mrb7r
z{Sb_#rdN3d?7t%Z&-X9<uk|0MUClg)iGTL3+;%@)42$a?@jG~uWPzdmE7-pviU|K>
z|9H{K1wcwA7{|l+Pot+mRG_gL581^C!zrV{g6qdG{I8AQ3j2?u{j>Gjv8Sl)rT}<Q
zZ25K9%EVjbK|#lV8xM1LWB=FtzI^SM1rH@^R=5IYYWlke4u_DRC#RMfic0z?iK3?@
z11CT4C(F+@xxW*h(M$8^N&#{7h-l|Z@y5xJbH!s5fMD_odTil1s|e#RRLjIjYS=j{
zs`Y^8c31&Wz$o`Yj2(>_N3Cn-o&WqTIE>Bko@+m$C1C;YgHZrPjHWhRzFI_DNS^JW
z|AL23@B0b=ejh>8+Hz2sk5Z*4vlk0cdR%f9oEljL9#^gAA)y-%7x_yUE~X{NIC`5*
zt%F7rUdR#v2{F;2s@9g^O7HTUWl+ETo>}XG!|g2}x-j@=1By`xXr4$#07Q)T=8t!t
zr7oE9&HUxousdJ)e9>m!7gWIJSgNuWPXpn^{F`3@Lv-eRpPyb);priX{$Oz2)ZEji
z;Hw=0iDa0(VU@`KuZ^25v~pPYj4j|fv8y;udFp$U+}N7?B%k|~F-!plaS2wx%D7)h
z!A;(1Kr`q7Gw+mQTP5W(U3md^7}7?lNg}`!yd`H&vbl?D4mllIndH9BZ&k>cu>sQC
zH_u!n&#ocs&m@JKxZ6;vujBMi&z_!iUJ35GdnasYA2-8`$Xsf<a|NCDln<%sbP3_H
zk=Et6ejRWW3hA{TpBnDnvmL^el=Sv)0nT$cP*(aZ;M<6?(?SBI3TMh!^zJbo!QNA!
z<rES0TTc&A1;i)q@QunK)>~cyy$_KHSx{QfIrsMKOYn%x>Ad1t!XT2y#;kCJHK`dv
z3rDO7sd1}nTw6$59DH`r{&AymkR_!C<6nKVl0M05lko!Fm1CVMu5DQr;Yx6{;S$;2
zXzaK8Kjm5kNcH9v-E7=w1VXVDlW<lfdXQ)DyYqt<pV|%~PbcDc+r&*Hg;We$brvhd
z1G?0B=I3kkH~1c9ru>mTd=(iYm+Bw~(d9w|8{{-DHa3#u#j_uuZT{R}`pE5Yant%u
z5vl|QFpsQi$olosAAmz+SmxaE+m?GGn6TKK24CI>m$*!dC)}yywm<x@VF6N;YD1N8
z#x0;0cjFl#kM9^5AqWcOA}6E$IeoHydOvWde-+_U<ClxnU?<?^m8Jw18)=sN!H)_b
zfh}5vH5)QRYpp~g!LX4I+a|mno&+z|t3!si46`e;*oD=oKEhWzAZ2-mwlLY|&OA?`
cY=aqBfBNJB)o(HVQ+Z%6x}z%m-?Zuf0$hNI+W-In

literal 0
HcmV?d00001

diff --git a/a4d-python/profiling/extraction_2024.prof b/a4d-python/profiling/extraction_2024.prof
new file mode 100644
index 0000000000000000000000000000000000000000..d3770fb9f1fbf6e6322cfef0454a7ec4d76bc143
GIT binary patch
literal 84453
zcmbR}1$<P;(?|{iB)IG0?rwKbyoI8LLZQbcxojT9cu5FWibH`Sg|;}fSdkVlP~6>%
z9j@hy6nFV%cHh3;ckk}V|LgD9&5*o#GdnxGJ3BKw@6D35?vMtNYTN)<tkoG7Zu2Ci
zN|nl;&EZgD6B3=V;jZu~S9ouSqpZcV7XG4IpdsZaI=eO5^VmkROdpsdU6%azfo0RW
zQxEpQ-%`CU*&r-QiB7Dj#9CuqiBWM8R{C#vUnM1hztvVYh`!3t`>HHStEPdMdHO?x
z+$1E0g-1IR5(GEF_~#1Hkk-Q=ZTq|3MH^|GJg48$+*y$uH68p#O%KiMvL=2U(9ufR
z7(0nPg&-O>ByYxZnVa9+CEl9iml}A5mwHOT`#jn3rHuxU+_0+KNgL_7>6@=Q+_2c8
zqwefn{_$}MO22q#VwBAj0Z+Rv3GvZNB1pa%{7cP^FQ_@>+~>V5Y3-!*>9%Fgm&lBL
z9gszJMLQFfxY&d!CB9O8f6v#59ZFn@4){xg178V!Lk?&|F8p%F=3M^VMry2id$U09
zG<IJv>4h)Jj4z3B#k*o7T(OA>hPM>jvUbbAn;+Onv!;ti4Jh=|hNG4PuskafHGPDl
z#yVqMWi1lr#v9UPeD?H_jci>$+q0nAJDV^5)qKclerOEzOt?UAKzdhfQVjH2Sr7W+
z4t6-gozc-$T~p&rtk96EwlCV{`~imY;JycGN?P_(q8!oF1XRVH-r;b@MgU$AMe&1Y
zAc%M>jtq1V$uOKEXBI57dJfvih!W#gZ~XBxrIiV%lalCg;NW};i~*zJaWU~qw97!y
zgp343_@gRzb24J5cO)n=@qjE-?sPM2pM-MLZN$Fp@YFL`R#VCbWKT(C6B`3n6CzM`
z=j2LBT(K@y31@0K8*tqj98@n|{ZKW7@Rb#zA(qL(wR@HW-9F>|y?DsE(@3AHgPInx
zf_0=I`n(?`?6E;y>k&CE%qbvN1c_BcV%B%R-HtnS-A4Xx+_-GFjd|!i$Oud-pr$D0
zFA*&#@TfY&6LALM9~=?RL?`qeU*YFHW{HnPiDz`g^mc?Pi80Q2gV3|?+LZsdg@<iq
z#^}Tym!}{1A@oPcNj67Ze4-Mg3~)KZqnv7jE733nrq>`FTtk(rsG%7hI2HRkqmy9R
zJt$JOJ~ZU3k(&yAHE@-UH0*3i{%XJm$^l1Ji{f)sNrUL)esF*sTW=L)7A8ZiE16EB
zT!?Q+I;}G9>(u1xeH-Z)|I>{MB}#a$vgJ&xtiI|y90*1@=mPF=;4+JE^z&L^#hs5U
zAE<tGv@4vhZMb0DJkiKtW)LFoN^E~gfDu6rWE!<{N}nB_9eZtr1E7ZPO#Fp$2{t7X
zbk?0!>?u)kak#<BGhY`f2SAlS0TN0HPzJR*K!(RB++R2E#okFa!U6vHOrMXhE@<z1
z>fdoT!U6vH7@v=aG&z~A-qbZV!T}tu9N1y11(lE+Spq+999HM#uCq20o^AiWg7s6;
zxe@H@7w(G2nSuQPeFRNXU^=)QPBlDA>1$kw=9hXsXlk~7HnMz4v1u*3yt0)|J0PPY
zI*t$*u0o!1u(P^@@E0HlR70j$qg!Wsnx*f48*$xScWK|ii*!eza;pVB!_`?ybg8IV
zk_NElXQPd90JnsUuyZ*h7_sHZaMpO7HI4`+#ub}@TOI7HS&?u%Xh@g3=O#Ru2qNMD
zz9Jz}Rboj3@|zJ~kquwzV83-FI>Wpc-&S8|@3X!|UmM|o7aQN;J1mq9=(JF{h@5kl
zmpli9&jB2sX7DgoG^Q-_I$fwrbw{r!%WOm`^hKMjN!#c;2{W9TD{2;i49aDCo)5pL
z9C8#)*M$TZtV^EW_?E8Fkeb6tiH5ykZ+1l$-lSNbi^Vu6K7-R5h@eTq?23*hW<_uQ
z<!>9AJUPvafj2I}fHM^<h>sLvj|&50>DKKtV(#p;k*OIghJ|)I%pdnGf+yX<Va@~>
z-TGza*qq_W)Y7GYwUGxo3ihryWvPzS5^;ih#VN5crZtfs+An16l{y7~?GI*Mp%H@z
zUhZ~ND3h3kvRw6T>`~N>G3#C~_?TQx&!b$avWi)2@uWe1oXC&<JkzoHzTc0J`gtDS
zZ`|7cfM?z55?nX~%UYEFFh^)ZY7b2Q>2`8%I~ke%pKdu5>ayJp44p8SO7%GkF*7R(
zxS_cmk#TB_6E>7UZ$RQ1VIPD^L}&0ad;@H>uoJ<YjG=SV3cq7kjH6eUK9xhq+Xx5P
zoD}FEa6YGF?=xsCN6;~KsdfbvJ{!c6p-YtmXf>E-LxAV?_lw0-)(Wl+WaNt`XQpP|
z>U-2g&rQ$k?_V$RPgfpnNW_a*Z|}yyO34AA{0Dg6dth3_Tj@$k4Mtcgoj5Ak2o02E
zWf;_hupy|O;87To0BG1Hx_@-TSAT`iTclNd?UhdLc73|rMiMvHag;530!1dT{_3ZQ
z_8B81M#hAOJu}#!$_fynJA^J+N<ug+5)p=t>&VH2QyUNb$woMUgpF^&L2&1wZ-Aqb
zOLay&;#F6q($COilM<TVb4I*Jv&VeBr+)oW8#;Q1*a!#AU1|smggaPCVB3nJJ564!
zDBk4IN*ftB?ZL1?&OfOf4c+nlgV^cCQNYKbF_U5*?!dBLtm2`P+wuaf`=GNETBlxU
zBi}VC?MnT287`UwGNai`tuGg@9!hmM#JfY->cM^wdq*C8-(YCSl-h~5YUg3$9lh<l
zA15xqMfuJE>xM$n)p&TwoioAJC&>l=0Y_q-BfdZTD+~g@!Ov@u6?q9-jPHRyfnCd&
zAWtZw4~K?4pI|$G{sUOnU9Yq{vtZ;&AJUr)gQ%8<hYc&x^JUk^<mfd@HpYxfq?SP<
z+A&D%<ILt+ZzFXx7Q6Fc!e1zHiCq=X!z%8uKn*<v%uR5+UG=cotlMqm#+%+vpDf)&
z1#TE*r4bIY1x(opJg|we>OHdO*cFFw+DPgLvv*f0o{g^Z22^zb(izBT20#SKiZ%0f
zjRu<Er8HR2NinerrLA$1*3!B?-mZUB(1+$KoXz1cVZFe<POt%IRwRZE+1xF8YuI|Q
zp*esPF*p)2P=A`hGJ{%6Uv7{+e_ls4a#mgEEXt*jsKo!7u@WaPW$Ms$t&MQN$XG#S
zEFF8dfiM2Jj%VbnlFk=eEheryQq?!eN}M2{44S{>>YZyg!U4Ky;f&+*@`Qk%!lD%g
z9)@T*|1r6N-Hpa`fEO8g%x5}a;Ta8<9UM9_>$=zN`^W2h!FIv{WJgS1r5*BO1t!3~
zrzXMCn9W>AvXU6(hy>qBm@~XL`gsDp(#TkTpNz#OMMooNVx|nLJMPC*2f%5_0V8L0
zSy8_Q^#kGouz<KcEj=p$!=26<k1i^pC+2g-p4(>>{AIq4WSzKf-lA_;Y1^1?!x$!X
z05orcACRC03@$X<q;t%|fjeeoN#0>2@iAW<-&}K-H$BfT6uq{hphFY-DR$4hC2x-D
zGJ1-QaKQiS<H-&jsB@qp$L_c4*eYbJjjXv-=gNuQ+v(~fEm}$t(o730tbx@+WfOON
z-{FLfB#nPGENIqMZ&nSW5odK1nwMyl?MThyNQzbZ06izNi4D=0R_=+zp_kY+&<lX(
zMbFa#UhYmu)VQR0Z~}N>TT7+l34~0(aDSNl<YF7)doZ1pp!L+}h6b=<X%(Z-&T#YK
z9HhM=0HanUhmC%Y*9Xs=QQR`sKF}C6bZ6_sQ%6n%4dsBhScW3nFhrA`6U-t2tAqmq
zcoYh@<=2K?Cmxw&BOLJNaX!#N*H5%7mb!k>d9E&phJ0D&>4z)1U}yAcL%%L;S^)H|
z2Hu749wA?T_S1M@8EBIgymR^JM@QrxHlX<ac(^CXcorDk`2G$hCMJm;?dAPUHwid^
zg4XeEh#!RL1~Kzz2?x9cMtwo<phQ=6G>j?=ib;zf>&bcd*$J~-?lw)XS@<Y=QVk10
z?7kag(lvsujT!eF14%~6lkv8QkLn-Z3xMY~64NwK%&c_3mUeY$vdQQXmnWo(Xr_~d
z2@ORO3VTT+I9j8XFdU6BfC(;Q2e?}`SC1ISnq%u+8S)J*kv%^+$3F2~qoT>AZH)9-
zitE2S$Q1)&4|#PoA({!RO{AU*k~6ziytOeW*k`wXxioIcJT@9emX*q>fhd>_(eW<T
zK-PqeWHW%<3xW*T*Bi(!Oc~fp=>b{@xKE?ZPk&ws&hQ7-^1n}-^_cclV5)fXg1x{I
znShRUK$Z_|CS)(N_Ypa#cI;<o@Cf_?@flg`b;l9+8=}@rJZwXOZHESkTM@>Fn6S*E
zrUFy9z|%lah&nd!gw>6YgZHoOrJ8e-Hk>hyuKE{J*@SrV;F|DgcN6=^gZB=ktTf30
z-3@}{B5q>BEGf6E+V#YepiCUV?q$`3RpIQk;<*Ln!1!VgWAK!~VI{&Do2Y~X4*_0g
z6uD9qRm2jZqN7xnaqe|l9~~TZz(zj*dDYbqjXd7t>|4erEH7&1kXn!$7l%EzqR_Cx
zb&me011TC%6P6dT>a=U%5LIv;v%=$y+JaZB=f#Z&e<%l1M2$bJV;QMY#aDL#5uoKn
zTG)`x^&Si>pC5LZ3AtPSnK$!O6r*&aG4C)mR9cD69^7F9yvoRck}EaHHiJWTCc~70
zxTxG^UH6$S$4o{sV?3w@>LFy_=ZxW4NHHWa3f;|`3QxfkcjoXURmCV2`x8(WbEi~t
z+m6BYAVkSM?<j1^<L<}jVnQ>MZjRB8AT1Cp2$m_dW5(9X;Em-#$_VnObu=@<&PdRr
zV7%DSMedQ%T@xvzXhJhl^x!GkZRyZDF1)v4ICZmu14vPJqIjynxUk((9#H<cZkHiR
z8Be*7NBZpAqJmbX>Po<<1Q?-oZ@z{~?J2r%YM#}XY&u{fpB2xm*{C-w!o^<`hkH;c
zynr^OV2=UyC-wtx3<tdWpkBsD=?-u11Dq#VXQnX2ps!O^;*zKfxh)DU)B#=~8sT*&
z0$q!A9Ic#o@_*B}K?LDcsuy#Y{HS>+4CmUVIF+(FT#&N>vGWK8PLud|U|*bSO|LP@
zvJrTDVX=eB0`$d-thTRMZ0vzIHd1GQ_D0M4HS>yMjil_;h)#?%R*7`M?jZO7XsQWn
z%=>dTvaCnue9rutF~vc|z&0XwMv9#n<$@dq8Fhoh*0pN)-)$s#MGtrUm#@(h6R5u<
zDr8(hC@Efz1B(G7%XnV4!tdF_$zxDt!-4tzPj*OcB)talGg18Tq=dw{7z6J1FIE<x
znjL+HUwr>-xi*xxcY24P^oSork9KNa{viZ{_jNBdxKINm8=8>VKiZWL<#N%W_&%ha
z70$}h{lRA8e=#tS_kMLp$gri58q#a)r?$T7@hzE><J8_^5G6&Mr#$vkvka{WV?(SX
zUk|$V<)1dPs%Fn>!=q?oi*d@l#w9Qq*P&>I?&JcQubYGeI8k(os~Eg9D>#2vM=~i^
zd6-@5T0jQ9s*dl#h77-5;<sO4K%|QUrdb(>c-n*#^YEV*ZBIFVf)$zrC>S}fqdC=M
z&<F@)N%NOU27GB8F!A|}N~S@yGbSv;2|g1~J!JMhGTYGdRU7NSK$HW(th6r{^?&k8
zh*J|?5x6zti~PLJ#7YwML45}Z5RMuSvzs>Lo87Ckc6j>SrUNFC)kl&2i+DkS@J#fI
z>!P+uA{(*s(xGouaEx-mo1Xd_`}Bs=3xsE)*Bt1%E#c8|324TN!Oec{!l65%cOWh4
z_@SnE$5Q*lIJyzAtEuQsF$}H=&qT2xYDIc<amPl+8E6(+-=}D<{I}s$y{lpODgUw~
zf~-+~dTGKl(X1AXQ_T?>&pV3Sk%|qOk@I;GNB9kJS1-1f`L@Y@%|;jLNeYU{+)-uw
zrY-l=gO`&7UfQp0O)t=_NDdn^_Lq~{#$8x#BhQW=_`6v0Il2qUeN=>8<?(1ZujI4u
zDu1w%Oj&b&eQE|xbCdMGg6^+{b7ntGtYSV}hZ0xG(W>ny5LuGEwLzZz$PjvA$<nV!
z<;}hT7Rk6povp7<q@s%?%{6eu#YR(i0_IbIfr!~Q36QS?<J}I?u_31x58PDlvByTr
zXD!=odGbr#8bXce4G=xl0m&ASc^B5-p~fY{E1dWWY{*=9?gynyLAnD!_Tcb^$or~-
z`>J{e9tM4}A|f_KsWLsf265X+70bwn?OWtv;Q|@a(+LpatRrv8G-1fNKbc-+QlQjm
z!ew$K#lzddVXcP4au5o7K^s!q_IcXFvrF2^+H<W+{PM#mlo5GQJyj4t9hFN}SP=rC
zB54s=K>xiu9y)92I6uDXDVew&2&BBYW-UV`c@s7v87W~1L;cP#rJ}Z#H?}om*<4aq
z8QVr`_@%|skXA;?*18H9;G<Sm@P|RyR>41MLu^fUbg4ZClB(u;7Bz3_rfC{p%FqkP
zG(!V4()z`NvtKr@LjL&nWzu@EF#o>4ddSH6w^1Dps-$K|RmuU40Wa=cn)NTg1ia{5
zGeR<D`-e_T^U--fvYo*ZgP|HnnDO9yzhJ7@Ekp6dMsuH-s7$X=@fGR;Xbgj6LPmj^
zkUgi6epcz|4jB;Oq?4`0VWn2izZ(ng9S)#wh;WA?s32@h{;-balfJ~fOtM+Ygw%1L
z!xDPtaJP&t-~30H(BPy*B^vE&y3@L|fmzM{42~EG{6$0m1%1;ieA4$EMd1~~!IO`Q
z?WR?{p3V-wI}SjXrM1y~R@S|-&e;B_KjIL`-=Mz=`N*uthT^D8t`?3${`k0P$Q^Nj
zSB6G>rDuRS5w1xWv7=l4g|JUt`XglRw>x~sj?F<H6P7PN79t<H!N=>H2O(YSk{$=&
zgu_BvqG|WvPYhsQ#*gZR2@84fwaUnA^6*q;T=U0*wajA12aSFU70(I=#Wy{VL^6ud
zyk|0YG6UvM(QX=K`zqDaMH7xeY=Q%*>t3U!qU%U4&nCPW7LK8#(#~<6^;AKsp`f#9
zo<}4md8ZcZNilc#)wy_N@n)*>ek5vzcd-r2gk>aJ9Us)RTOcuqHspYCPeaPJ8v~B=
z7GQc6(l;)TPk;w^9_B)I;N^lCrz5VfOI5*rVRWYQSc@KXLE#%-=2?v|%M8)4cnG0t
zZ!<7tdIueSmN`Pt<TzmNObO0NmzJgo`>qGPpR^${3yVJeW>_;ju~aEv^95;7_uUK-
zPL88VVQNFbR@*=WM291c4e2v^L!ncR&f3WA@2%q=p1MZ&2*~{;v5-lLr$Tl>V0g-Y
zq=pS~#N6l<`mm{;e5Sgdt$EiDEu{>xaLjf^;4!cayxW}~az7GP7urY_ksvmtb+d8n
zwyXx%ca}3B>K^|2EE3FuQDz{TfLWJ_J`W$)copVVr7GtRZEbqRMp{Q~t#@E3+m{SN
zR#0Iyt?^j#B~9TMWcTUm71ERdH!KGXTBFus^8p|A^SnVdnM6t=lDzP@A6%|vy5*;B
z<b$Q(goRPh0?h)k8kw*Rq&yg1rQ1b9pJ-<^Y9KQiWx~3_wqeb8Neg!cTvP>N6P8K+
z6$c7Ln}R|()v{$y{4eB`jkNr<L%Z=^&U-CtWxR!HdfrS3jTkeb8YhPJTl6ESX6^C=
zzOGRFk&#fKxMGa6AI^2bv*}evDWj%w`ocHWyl(YkGi=9ggaZbxd0oW+=^AXYM58Ij
zU!lLt$Ut)(=InT;h*Z>sL`Q5~EdGx+mEfo3f}bi^+y<7#t#cz@-kAL)kb(uk0?Lv-
zP)a{5MJlloT5e1KL`XVSo&BX#lEsq=g@i{4lJP;tr&}w*8HEFMu``6vYvaRppn+jP
z96yLgUdrpdz_pCn1h}-slWlx4M0XLkmGGFg9=tX&<iTqiD%vW*kQJH3Mt@!hj0}~~
z8AAVSgv3pPK{S#0!fq&<5;+quClm&Yodd{;;qbEn-8oqu9bC@n7Ouo57#w9cr{3dB
zupyP&3>x_I4{%O$!0R1;PX28FxXNwrt7x`MBVAnY49kXLV~yT6xi89hFm$vb4JLoS
z@6zE<?K)tVD(0@Kqkw0SsuTIgM$3>N#Z%=+;Sw)LkAKD|r!g$CG5j;|i#E>9kb%Gf
z+!(0Ep*bUQWB5}-wIYm-9)i~aMD^ZN4#Sg}IUD6npb=H&3LNEWLn<tpv-8L(*g81?
z_~|idjr-q!hzHpKbf6#wJr!zF1P=C&R?k-qdIKp-96+)#i(LI&5e^hAqIUswt+Sp&
z2)huq=l;J6ZM+8=@*MDi>dB0cGf$)PEl8R+<oL!W=Ud!PW7h#dl`b==?GdX3G%zN}
zCgauJuSwZPt|vCa0l+diZmHSNh)ENKU3M@IrT3sv0(gBQ25cio1ek|PI80rmSHTqc
z1Nx!p1!04WW4j%AhVvvC4RrA_B&>U$pP%{k5V-p}0O%Q*gB*oi1p4XD0QXd5xWQqC
zmoeqw_ci2;8@l({^EVP@{(5v{Q(ri8F078~H~0R0a5M}R2Y|F84byW5-vI|vmOcar
zQhtMr4h1&4xvB&35_wAaPWt$0qOzQ;>dAs#jz{gP7j<N6zgW2R#Q_t`X)r<sZYYgq
z>U|7iszdpG`{3G`J{KTEiUZznP~{a~oFx8QYe`<d1MoQD)lWG~)`rT74e3@oYo8M{
z;he+)z>*hD^(%a|J2WsdVx4T0x9Rz56~UC`fESvlG+=<Es#$DA2UmDg7JG7{l(5l5
zUpj!iiaUY^Zw}hCRM^@P39JHkXgco8epN$(u-Y3MP~xlbgEnN;kc$HwpGjxe0e=fL
zT!V(dk?#ds8YGrM1UW$*zy&%zPAZ&Ep99P8Y-m%klv2ptN`#ynkf2aYj;O!EA4jkj
zLIR~9j;tsgY_!wQB)$brq9%%AvZ%2rnm8&NX`NwvmxO3!#H#OI&>zMH#uMd@OLZX^
z*pRm0&HnE8SlEO);Jpbe=yq4rGbTb24;ylJZjMUD`@;Ex10YWC19U}XzY@a~#&p}Q
z>#S{yL$V160Ml!E($pbPpXunatTpBYTn${ocnOaTOa5BIv%r>k?W{^|U<{`<-i3F#
z;0{H+F?Pvw)#Qy*T85Ma#82-FlMN7f7dQaS8jfCme2JaM4%<-H3RyoKFb-^KePH3H
zQG_efnH243e5HA`Cwa{5N);iAnFBb!-uu0uIml6TTq8e1(c<Ic{V19f6$Tr9k<$Th
zMe}nFgD;Lco{@>7x=?z%`lF=@>G>vgw;~tV=*yQ5AQ#55iHGOhAv6R}?_)$nf?6T6
zpEnr!DW>y-7cu-Xghy3&X_x2H8ItOZ4E=)--+{)!hcERM)5t?T7=65vm_iQWnmGjL
zgu$}G8;|Y~m=WOApe`)q{;p>&asZ{rcSch#uo!&Pp~EC~*}HB9CYZ2I_J~o~!c1qe
z8Q;V2fdwp;`aMinqGyJ30EhqMxj`)6yod*$7opgUV}weh;<@RgV`RjWyDh{ucuN^q
zvwTp0fCI*Eo39C=HHZ3-*963C^b80Nu-@uv`!va1{S{aTt^=SMsf!thdA`0yE-l0C
z#umtq18m;28yr++{zBPpVqA#jn?J7O8M!E;&ogI)w%5X{2;7A6OE{j=_}-~7CR(%$
z+%T*X$tk+k`ZUeeD0to=4Sum)&rFB0H|Bz<xX(cfQ!L&cg`<qip<OS9_Xt}^ckOV%
z*dMW&#;9>jsOX%RI}~UULZO<XKGf7#t*l2@lm<5X(x(GPPHLNcHChb=Tw9SRO~zJd
zqP0rDs#R)5R;^N{W*tyHT2X^G<Y>d})2ojzW!C{<kd{SYu2mcG0n!o6;P#mD4{B#G
zXeS&%DI1SG7%Nm6qB02jL>qE3bXt?jZ?oEUz}OkFLa46zXlJ<QmH<bwELjE5M6@9V
zzDS%faPC{14$wIx9Ls)=j87se?_BlQ3%I(Z0l>dM`&js!=5EhXwe%FwOAZ*B7c-3(
z{9sz)&H58O>|#TH*xPo<+QymfIzU+$SDl&FhyEACak2K7&npxi_8we^8i1@zSib>+
zI|oEGpy-AR!f%OAU$>+`@6;~U9~Is~_O1rNTcmW))Hp>lY0&|iEGqA*`c(!F808@5
z2HtG<ErxVBg4k$REuZl_mzr-`&oozep&sp~Qjlhp9^v2s@NaNysNwK(&{^RocwB$h
z@<|C#ZG;1eqMazzWO!Qb$50j_MQpS+1PT_gRfXOumE2CEqr$=HHQv&Z?#m{1iUbA2
zk&Xj6-ttk<gDk_slmJ<MiC8Zs5~}3T^i}y}$g%a;7=<sCFgh;Th0_KsEN`Z)*h6ge
zn2ru0Q@RU5ZHW)If(9gs&-+30$Aao#F01fu*pQ~hPG+u^3`Y|V01NDrc20c8RIp)a
z#~0sbeF~>k4)Di)7i`ckP;dYqFNZIt>3kIcg1(7U{)ADbT#gt>f#d*xdpE@Siajp2
zz4d#KOg*p;&JG+fib9x|;QCe-&FuCb4m{eZ*pM-G_x*i$IHV_V;3Km5Og%aIdTm&d
zIKa8}EsFsYJR`GDgZu3qFmfw&CjhfzIZWj!<9d1mLQfn(-TC+`%AeNJ{4tRPHyiyZ
zu-K>nuq~Z`;ng7<;Q%thr?p3g@p9+YoCMT;>7br8>|ZQiLJjaDBU>Vv0L9_pz6stM
z^*Onexp`n|!-hOO@}bGH#kK7^fV_!(i558QEujHE#Cf~J#8w?&?uLtv8~_~C0q_$<
z#n29*UPHyih9pf{X}#6}WWfPM^{S9&NTJP&sMwGLd8b$C`6CqX;sBt^m1yz<L3ajf
zin6>eWg+Ad(T3!*oUgSmb#}WBa3$=HukQg3aEZ5XX+z!>To^g~Ye-VyfUge9UZ$ow
zfD$&O?dZ&FbC#-R*8yLsw1iq?AO}>%yw>v%IA9!J5e@-gkpIDzy0NwWl**kNLN_>|
zPgURD=8x&m8yOHQ1*>V|Q@5mYa+YJUjg$9Zun`WRZkYxfv@n&LmyJL+gt5_4bil}p
zP<6(N14@7SW=E`py&i`4x%=N`SXnw`Z-3-#md+*LZ}W2l%7o{S6}T`)YrXJ<NAERM
zuwuILj*<z1lsxd<C$fBjb|3{e-a*q|37QfB-@uaE2yo%pCT!u0pP#H+;u{D*H0e_4
z=OzWp(By>7&7vW>J~puv<Orb0as%cCX27}~bPfT*0532Sq#=Cynq`ijtxmNq3LECI
zM?Z%QKXZ>BkHoT417})IrvFx8mhIVk4I(wizB~!#SDVko6Y<$e*gJWzZ~W^W%YN5h
z8%fikalTu-X-<Q`HC`A_n_@Oy8npzjS(m*2wr<lNmyGc`l?Kw~%&x0Zwt~*Z@cf*R
z2|slC=ML>sN)Jf<!m?H+Y?rxf^08frB)d{E?CY7ZTt<DncKhrfZcy(E=6#~&jDuDj
zgy9aM8%C>+ZR^yk0x6wTnoOjoqo!fpUKckV%=C0Ltkj74Ab1E14u;hY8&a@i{$>4B
z6}IaDRouv=SXKoNgF$UzSlt=uElg$@20}No6CgV-Jc^c5c#jHz4LP7R={&RKG1v_>
z06CFORdo?6*<z+-0q~401W4MCQ2Ii$AYK88MJ|rPo5|0~QDpr;4{bVtT=1=3w%9RI
zD3y8~arER@4j|*wn5t+~x--%-rFG#T>PfxpClUMbqMye9)BQi24jB0_=6^)NcaN(J
z4(KH40c}YAS!+{oF5lIz1K0uM4P5E&uDk~E6filaCT6&A!y#f(+fyqqK`@U4bj&2j
z4GI-*i^JWWL@0cMaa_DMCX;0aXW$hafLEAo4=21v4TA=br6SHexNh?u>ggtS!T~@H
zK^=u_zTr5VXo{3OqyDQ1pe(lM?Jt6oGgb%hKL>nJ_Mm4K!`$?~yRmGcFHfmR5c4<@
z)51zf$|+*S+&gCU+zRG92Y_sP%t6HI??EKE<BV}8pr%Yfiw7GrDgBt3!ND2qI)I(^
zn_0F1j7$X^(sjzDtW{^&?K%K>BC||wgp$=P7ZE`$o>0xPKLSo996-^a7_p)s-ef{v
zKSf?)hJsTK^$_{>&@;dlc&Ane1Y$U>Ajl3}=}hBFlL6AfwSqnrdl0-)y@uGIjX(YQ
zjf0T0!2!U|7#62OkwQw_flq42D8^`6pq3A$JfdDMA~bs4!BSAXZAOq3Hl%d&h-T+L
z6tU}oFOGd%!S62Hx{unv9qdaD094^=XHGU2zm(Q;U;4w#Bp3o#PV6i;dM<|!_+nAE
zW6!}w5d|Ca)B9?tK3`SEt^>YMWjnSdQpJYY%5I%e>ltK@aUjJ@6eNf6C2D1M-~=0z
zuSdCMPwv&U>i{lMURAR^ST#%i2B^c7#WACeo<XhyfGO4}dZwibb^*6cq-Hdg)Sak8
zSTP2u2_q?ImbpuEPKE;t2LRI$3i$=mf*6_=nZ!mfOQHjSCe1inp9sqsXjA+xPH}9=
zDdp4oH}ZwrbpU(ED~bB?i}(tg1Vf3@Xv`a>M+dhB3VwN2-!z#K*fZ&Ro%#xU(+3(5
zh=}N}JDj!Z+%M1D2nPVoG^b_ts}DIh3N~cpygC)WZC}-{1HMpY^~1a#mfW*_QMWe7
zegzK#2aM_$AaM|LlW=>?0m`I|3kEiF=KE}aoE2ul@kPgmg#P>$HJnXdkhhy`ID@9+
z@MJtT?rKcSigps+?dYc;YJWv<GZ`Jwn4-t`sR7Ud1sn1@Z^t3u?*h*+2MirhfiJM`
zl{R%UrlJiAz53_S_xI-5$)c|gjt)&fmomwV4Ac6=YCSeI!un+ww`cNFbTeVO^{!eg
zrw#L(hI*Al{&*Mc!I$jqT@l8Hl%KtHeuc(x^5X!Eo*}5GU}ZkFKf|ktc-UySFd@I3
zg~xuvO~7lWtN-9Yn`XM_c){Kmi$YQ)2LMwFt*b+k#xO>2IKtTIm)&*13ybEvX=?36
zENpZ?qz)jKxKO0t!Y6M-1Cs%FC$>e+?veK3&Q)M4Uf7;tcl5was17n#0erF`G=Q}V
z-+&ESxoF+h0qx<`!2!VXPKxk-tAJOW)=N(#J?2!RS7GSxZKw2<XE2j!LyoTQJ?CKE
zS`cN?0KhWD7p1gh`LYwQiz64vk=H(TDf9+zS;0AhRx@^D53$j!H|hXT)a{#$z@O@&
zOiD@YrVA5*A`??80){)IpNz87+j2dq(QcECZ~(BqjTN;g5}pS9!Dv{KS8VhgHXZOL
zjAvSRCQLy~^pVR}KGUl~ztjgM<$%;xT2>b<N62)9D-KvMwog$Q6l_S{u3I<9{0vSy
z4j@@x;t@@&yvQLFlQIyaH`owo#gb7)VuI{CfF1S9%T(pHOPI>Pc|Nn&?FRP?I3RKA
zSs+o{mJO(3Lw0?+>2-7xEO#6L6v@1$lTKr?9<qoH`F(=w*^>w?asZILHd{|2SdFzi
z`L4b!TUR;l%#eyUWZ0xzWBUfrvg-hL5>i=|STH`(1jT)A19GfD114t+gkQlpX%hpI
zW7t&LkE;zc{~-UFQ2TlXJjeGnCn92_*OJx&K;$Y*!^3<meyk21#fB`1+S#^sf5>s=
z0H8?glkykr7?47#^m9Z;I|-&p2y(s*Kf~@@0y!%Q4QR~_;Fvb#RO$tj%iT%^=79zP
zNdwwzM0-Qgq)oenZEo2uHNcADfH&G@MC-%Q1e5xGB6jia3JO!dpyeUJ700n6J~sL+
z(gDCREH><hpeYHWb?Z+%&gclojkXV+>px%m4rv+jWN!+tqiiv)dwA2OvkxIG!vVna
zb5V-Mb+9307o~CknCH5UtSy^#^w9@e^g$qbC?!oAg3{8mu|t<+f*?uLt$&<KSNREY
zXqtMm<%3nc6>LbZXU`XoYTFQ8)f(Un71nG07$z*AnisAIZw>`V7zYf7L*Q?}@b994
z{iEK;(ZWWn6Lf}`8DdqVK62<_>N<&M1Wm%e3xOFfebSu^8**sI;!>%G!1Wyt7+7a_
z^(@LMj9Z+=xW%{iYi8*46qdv}q4h_ct5pYWo<I?~f{R`I?h_CV2l(Uk1PXG;g+3cf
z6&q1hk5|`&J{Sxbbp$?Jn&DXy#zr^cHPe6=1~%e#LD`yaLiozhmX-&VF1ZVV0&ppe
zI9`oXCktH4Sh(l%%h$^h#zqSigXzbtdNloHEcO+JwTza)no?!myf5nfY9k!LQPo4>
zv~ZJpiXl0X6gC=#ah%jRN=mYneA_%rAMec>m-(oTZ~#c@KDE^-zctW+B+4KmY{;yU
zZI3VC4iPC107?q?bYEHC(!Ny}X=wXaLm;bQLt1PrcRI8pWCU;k=>@oZKu;#@c)~6a
zfCGyIK3Mh4LaN%T;zSr5-QLszMD^P1Je%=x(~bL&?IE7GfCjm%B3Zju4Un)EUxtmg
z5=8QqAQFdC-c3B0VF%+?M%-{)Nx_D=Ju}XQ1(&w#fHzvFAfU^t5mbZi3opmghOGZ9
zN72=DAZEb<z%(xMax_2)$&}y+c*Ya1`Y#ai(Ye07bA7$0gi42FHi!YRL=?u?LMMyF
zkbWu-IUyUaj2TxM%J*{sJ7&muq<YQvb17RqY}=U$OVvd-!T}RrALy5=vd#&5(-YRt
zTeD<}jc~w(R~tvU4(ncfgs~y|j?MwVlUJ8s_+)Q}CDtUKlb{``HhJrbnj4wSLzz@A
z;9(gXk}<t=n@t608V7)wL6*MnAe<jm;d&0`2;|^vfH#_N8>e1sTi2^OVTIv<HyUPQ
ztBFjKR_rG>`n1ylFEk|+*tG5tsB(zc)tcewjX+^U?4eY*W%G|7gKPv20KT7{QKT?%
z7oqGc^cUR{gRY;)SW(|oUeT@3uxl2jE=)e!kfcWwwq_}l$4;6Is(8koRDk*r3<HoJ
z`lbd$W0<8=LPj^s^5iva3mV`h62owdQX_?nAAWUWd=@+50H7Hsw`{?Q5vVflM)23O
zz_-(I&QC=)9DHKzR=`WC3KYAwDAl3kv>|m;?d)<sH>Blp0Nsiy=<%Dzw}1R2;~N{{
z0H8_J!m|oA#T^U|`D7)6e%Vb#5YFA$RA~9ml{UfwqmlDD9TawD4gD&l<@>V_zDf(F
zmd1}<8vbS68ya%-3eM1@%|>|Iur%p4ofmE_y|7fS3pfjf<Fg$QQrjan`3N6$eRa>7
ze}S#HFf?Juj6p2c$ji6kDe5_3xPvfX3h=~?KRw~;hble(gvoTto#|i(H`4NAvMORi
zRD_iSGH}Y0@z>i3D>HE-<s%B-eKc0Z{Z?K|JViCd1E3j3<+as+L=8$?$5I|nqCl}B
zN8j{V8n)A8(*deg-qAhv1Uw632!Ll~B0yMA3#XuR|A@;eHpDYL@#kE>fZsB0`)dVj
zWo6%}F&#k8BHQN}D`JlM+CcTwE%k_L4jEy7Jv=oj?ok2#>dptI0`m1j^#;<qNogrP
zkWXyL`xPTTY@JluP8v^2p1be!TC|RVxL7y_ku)>tdxWvkzI+0qqDfDjy)vY}j?|<?
zAhjdR23`bD#Hg;Ms(xihTli!J2MiKcKj0LSQ{8!;Tyi#7^_>@nvoh=^o08^kY8l=_
zggk+V@M?v?p<!u}cQb*O@6x1dMG2(JF*L7~gxBH&4f-`KbQj@GS+J=SD$(1_{SrGn
z4VlQ2!J?NB<Nzw?$L}ierwIoPlJjvBKcRm@B@9W@Z!F*(6*iOU3RTKjFrgV)C}^6a
z$by1Ju5s0ug1ALWw>|z<|7|wH0i-X^G3q?jGK|x}>=X+(e^|#dlCP-W95AGW>$4t{
zH6S}FjNc=W<l!e1NJj<d9-6uC49;Yy3fBN=y)q$A6S|SHTqe1|3s4|p^&WWqWaOG+
zkkP>b6bP6wBF986iaUQXy7Nn%_bXCl*-vw!R3irf4?F`Z^_$Tts7+ia@ULP+MqIYO
z-FOaC@;PAS*8C9-xF8z_jy$6ZMYi6NpPYi}&w-S3%%9g0jpW65MzHfNn@kr22mA~p
z|LU0bi97oFu@p(sgy@eaO^5I<8Xp=C_~D70?YbeKQaPCrjXa5E2zi23(-?kLFNKWh
zHTXG@QpWi6`p5Z<j8*-}H1sJip`HAufc_l=WQ%LGS`sILNuy0TMvm(19EC?iO%JA1
z{bHgkxv(%#B{{0B!SYxtL#lw68yoPcUkvU%Z5cY(8GyXWd*0_b$=X5#*7^C0fQAjZ
zIrz+-oGw7)0Afiop!SH>fnrIw5Xhsu9d1to3zq|4w50u2!Tc)Pkj7QE&K~*?c;q->
z6h&QK6#C|sazWG>2~@BlZ8I$C^2?eqNUzlZ6oeElzYhFpcYQs%v3E6K+(-pwLD}*J
zAm4%mMkGux=15;4ToaLk&ux0Q<NQ^qG^_zeF?hDXlWsVP;g>HltP7Gq0A4}bknT6H
z9^5_$_~d|58ufH(i0cO_76;A4XUX`}uB91JX2CTZ;Q)#wI1-Ek8snq(rItuSvmLO}
zpVa{)Z#DyOXkGlTdfTJ|hyfc?qsgho6X&+K>wvf3*1~C38yb*a05l_q4Rj9WS}G}*
zA60v7$bv$-AB_C@FL3;50P<(DlVxvv09=1eM!H<ueL~+Xe%YpVJJceB*`|bmKaDn|
z`u;INqrSdq*8ybGJ4$A;(8C#!0!cmxfzpOd+5FGo&eZ^y13plzB5GRT0&E_fE^N+N
zkB>aQGf$+QaKPBThWZ%LI<|pS#ApAcES<sb!#Tel4!4dt;G=&^7GyFv+^vs;>4p`}
zRaat?8Vi~J@Er!(QOQfH>vs{&Jyt)#UN)gxC-r!Bt|6PAw}MzZ2aG-bMDH=?;;>NU
z|K4qpF7zRH*uj09VD56jSGQk*hlX!E0Z@&cR?#_)U`5>+n~vxNNUV&k)D9ZBwq;N^
z>foXcdD^!7kxk*i7Y7C!-)=q-V?8|hT3IDlTo0`^7p|h%XxY*)dD`?#>ccRcg@SM}
zENn2Wh=+|{5=sYP7!7Fh5lXn&7B`9{C+gp_5e|5x`F04tDNxq+Q%@){%>i#T-wwf|
zgK|GOa~T5q9571Cd@O+vlSNfh5}@D<NJ+snF>Of4nxlTZ{1jrf96()=cWOCXBLG?o
z>Bl;$GfccF(`B;nR1T<W#DSF2=TGZsAEQ42ze5Bii>p_|{wLrPhYh(hVDs{DTYb9@
zAbokb6|8!!<^qAi@+SO<oqo92ynE+*cESNKG(U-H-#s2we{XNdP~?C&ns4PQGR-zC
z!)GuvIAH8<3Daqdc31j%L|8AJ9HFS>*pRxjPGuf2^&SMIHNd;u>UDhf1~jn71;8^h
zQccW%{lgV(37`x$m4B%pN+qe*316|IY=J~O;ed%P*@-VkgFmk08QBuY<jClx1np{C
z0FG2l45kg~c)VS^mi0hT90<fwAUq>S<_ibx(=}kC#w*mbCyv^tU@Nka5f;>N___!t
z;rxq3<z_<_0L{ojIg`#X4(R7^9Q2Yl?r`8aMa{7y32b!7k`5p@e*72#u#C)<3djr=
zBfxvs$OyHVu_0Tpts4@08LVUuAS0$rUetoh56^=d2f#J3qn^O$Ei4ra^RY-V<>b-T
z_u#81lS-b?Tz6;cj|KhhZ~Jb|77w3)=0M<}KTjQ$atH(EM6%0|f51(IbKA;ITly5-
zknHhpz_<AtE^}c`=f#7j>yLNG$9quOcm^WuguRgbarE%hsWTw$gah77l$?fRMKo;m
zOaT4RZxHEgaYTj!JJGI4&9sNxr_pfV0=|)xP$>dG9Sp05SQtdI)rVS9!7p5M?Sun3
z*j|>X`T}R|OSV!6Ks7REE<l2x3&8Jn81?>5&wK^`I{yJSY7IaR<c-457kBvMI-Zey
zxd!|WleL=?50Sg(U?5eZ#wIUHQL}cnsx@3yycY1UV}in;!zk6&024bFl!lh`EiK^Q
zcm{UVOej5YTOuy~GQy#Ap;hw~1_%2XXTNlt*9Dova~}Lqj~0HHOl#(!fE%FKEbn#?
zOZ58M%{b5)cL@F3jph_ESkf%MJr4rT?Z>RE*^lMN8NR2WW<d_KBDZqFn(ox%*Vhca
zdtFA~o{+R=o5E;+0(C|cTD6sR&vOSgI~FIz)4c0?4vmCzj~p<GTHdq~#Sfm58DT3+
z=NQzzPm&@dU8)Oe*E!)9iOiI=4F6E-i>!^dgU6l&-b^X@xeql1lMv2OHck2CI-Zd!
z;bKd0xq9O@JV{Fa`4al22QN6_&6gj;h(E4>CD6!MWq%{*mnUTube%RNXPtM4UD+Gk
zb-=`v?~{PZ_wPO9Q=<~%?hB^ja3qHfnOALmnakH3*>%7hO;#5%GR*l25oQi}qxn7w
zFh@L~aloJ8a6nTsn96AE2{xq0r3Ux5EYAr}6b(qB;7s+7yu0FCa6i7ik+;OT9CpG1
zZ#3V6^K~E4urSMlbK*?EM!%V(1O5bupK?u+;6|X}up!H)rp|e-QVF{bm;~or0{ezf
zn)hcez~g|o1mvy=)iEimzpf;!aLZcsr4zW=TD9$>qBG05&<Hbfd(*xD^w|d4P#nOn
zWQA|w#K1NVKVo}RhhIE&+ijumhZQ*hx<A$=%N!TMl(41;J2~K=H5K#H4UBOd!T}>=
zW&_=k01+mwa4PP_s6<SY*o1|8oE$(tjEPkP@L{yE4BHidUPm<YAhs*|S#dUQz(hN^
zss`~z__r{X;^3OEf(<!)P#sk116(%c0Of{T8FaAPz+kBdp@DTvT(Lg=S)It}7qCon
z0D2+v5!KYVv6=D_@46QBjo+QgPB;Ka-kE{4tcE)ilwE@FA-dGQ=qdD+MTrc@{gq$U
z(E)gc;ac)uWOpBBSK0yjGO4eZM&Xs!cZ>uGfP`y@K0neEg{N|mQ-iy|g-9U>P<n>d
zBpex!phKzj2c~F4>i;xJUGNCjE)D>icjYN{E)%)HN?jx>`NGuHcESO``dG>!FMvll
zVC=UjPyvb60aa!iGLH?J|0ZNapYplvI$-K_73_3X+G(jWeTNN;`?hKh$*3Ig>NIu6
zMS6>>V1d1@x2}N{EDreV0R4iy-i0>KL^_H>=W~IDqhLecq+Rz7saDCZ11Z({-(5NP
zCO(0?BOHJp_*7qY7+XMwqad)+Bl0?6?1rdt%05KzzaNrLn~rL9Ab9u?Q=xp%1rwf;
zmvZ`CpuA``MIoXK)4?QGi5>g0!&A>(Sq;Zn4M-t7{Ba%6$d0-AgZAy)O5px*&`-qT
z0xLEVUKw7$O-zT^^eJ8S3{%hmh(<<)Ux;Uju~FjeU=0BHjjnMLOQuq;R5a2z%W0Vg
z^)#LFf$)qRiBtgJ9MP}Y$}CBCXN|u7wtn$FTxsF}V@Z6(PxWnd@W*vLBTHtlJ1qf1
z>uexo9IAVjo92u80HF*H(4k5}RtJAxNBkHU4rf?+C2VL1kqZ%~I9fc*#cJr)<^XUJ
zsAMC5On=@$T!nkVcq)cK5X1{`?w@{<J=@Fzu<$jld85I)9=WJL2o{J`YFcc-V~iVp
zfai_x&w|fu$wJgUyQf*USMPg6rQ>%oZ6}?3z&><H-=7iR5Bcr*etPP{Tp?n59^Nmz
z2vr*GJjck0=`rey|ArNQxWGm@fP?k%v@HI#j)v6aYmoHLrTQQ0zU(?||NPv9NrmAi
z2d_a(6;%3)tojUl*NOGciZC|BgopHe+{>^?_cF?+eRAykuvg$CYZ8;~?<4PN^hd`j
z4Xn9ygvUW9rxFXvBlz(F_I)e)Zind|-cl_C+_|&x?{{k+S?IEmu<2})G6|c|C}p_x
zLWm3N%qn?d*MkqwyTX!)LBu?NkGwumyF!U+g{iy7U(z-Tmr2-!=1s34(hJf)R_a7N
zY{<`!r{9j*2$!3Fe4frRtu>toeyiLCK=Tr;2W>2@XCCE(Pi9f~2z~`xh}Cq!q+%5=
zarG;hEM}Lu2@UDWipy>j4Fl>1skTU-USZWmNT1L7uy=_JJK2|(J}y-g8j>@XLZRDv
zA4*TbE4;KJn`f^+o2?OKw4^W6COTnW40F0k6UBqBTM!V0gOlR5N++-&SmC#9Kv`-u
z49wv_NQ?6Ek1<o#JB8FkQ~fD%*@t#1L!Q{<2jFsQ!EKp;x%U;l<7li+qAI|t+6x*3
z%|cbGJ9<5V>&@TZz57X@S$8Q-?_0m2h{_T}l&aWaY)H3`$-R#6fy>{Gn%6yKD;Z-)
zN%7QQPgCp`J$YD^aYX?K8?v=di!&__ML-plZ=+{Tj`)TODHL=73;2LT86zW~A*R+t
zAsoG^1Uo`3Kt?$+^%?NPk2zbj0WoZdeO2zelNNTglgd9dS^e+*-k2_IvJ;n~(lKhD
z&PaI${6f<i*el{P@3&uXloe5RYWM`FRu#4l1sk%y!I*b5=hd;3-PXSQE{D;Ntm!B;
zqM@C`gvyj067~1({%~&j<yrbPdAn7oRN|fVGBLXutcgM7mNFMDq@eJd8o-!*WQmf5
zw;W+?$lbmZR{xL()MMD1s%fI@&}4mY%~CI+5HCXm3gSdmZ1h60WXKR(_nQ4_r5$m=
z^t8hVH7==KsQ8K;t&?ZhOW4YDo&0C=lDB!VV@7rKU<gA)RKhUB8ynK-@5iAB?!h@&
zng3?Ph#TGMka?E|IxSG8<%Rj5;kpF7&9ILu2p8s12}PuaGtV=8lAD!ap?49a>@ez3
z*9L7n$c2_GC);aZPQ80zaR|OwulwKS)Af<XtWnhM3+4Afk!elwRYI-QIY=BEvTfLl
z4;y}lE5)<U&$wqT^AGZv4NeM9DCDHTPi+SLCUGl9La$@6HI>Jb@Aq|x92x<}Tx<dj
z#lY0b3|w+$rYg4%m3jK@YM)fU3PHCXwncp{W$BlWgZnD3Wa?LtQWZUgk?^00Gi-3a
z-f8DS2x0IK^`nbbe}TjV4&Cy#Q5VU<CqK#7XLp|s@F}cwu|bP-(66mzN(hIFzbZI~
z;2eaBa$H%&zQ7I&5E;ujyXV2-b9Ng^Jr!M&QmlVkIcLePR#53~cbk?!jsNKu;>de~
zr;#K=s-xHtCb`o#@?Vzft0N~qq#}gX2Rvzs3avZEN>*uIv*JszA^NpXmM=6P5v3AL
z^34N*q@RGe%LoU|xYp6TbQ(1=(z@-$KQOH!N^H^_=Nh6|9rTakO5bY~qlS(fE`G5#
ztomf%&jpU{u#qhlt6Xnb?F?S2(bqa9BZ{9b<8&!u>&e^hRl;tc202a~*STV^C2!GC
z6J?~;JV3~>%S7ayv%KUvxa7??^FL91K67Qo+*~&>GJV8;NEl~ddU!+G67`Di;?UfK
z#<1uA^7pCs9pLf>Y2UY0|3cq4q}z**<SC4uVXl8^+chDf0DL=3nMYDKYBF59yXSB&
zn9=D5^{P>CI!{=Viq!puoNhu+Wf!Xn4~fbeOskTpkAP!C4_VbqxDVXUb2if_$BwZC
zDcQ=%g`FJ6=vk3AHpGO7^g{eN808v{?j!MKE!SJv$+oR6-&7jcjfoU8!ssWGJw4&&
z?u@JkvG)1U8pr@P#P-|s6-PdSAl&p!O@<z<7erU{K*ohAC^jwcqfHOm0@<)dw#8q1
zx>DmJn3Gkvqblz}HM2<h8&RLmDqHh4gnOs;JW%)S=j<MnK%&l2Ex%PHi<pq8{_`^G
zc<4}PQ$kY4>A?B!<6+@3-~t@{uHSpj){_&g>Cw%UsA@t(Ql@=a6qAw9VZ4ALDRO4P
zBCCgfp4gx;o-V+uI}3b`f_?gzS(t`tXnF_IH}73%vCnjEks081l*xq*xndS($;K2x
zF9voE6oD@;R)n$9i!bX)NYS_ks(;{En#i$SE6B!}aX2D5O%67(Li8d%Xeh=21-J}O
z?P)_lO}I$aP`ei^M>0Q;h29clSH&g`xv~GdgRtiGnv!^J|1f%qOIp_Gjmw}w&m$eL
z1P28R<+AE;va{p6-sgTgQ86v}Fz*k3HFkV;Dot5~q!fMW`*x@1J<3uz4_re%P&GFB
z;F}6KqvXWD_9%HRMIQ%%jRMO(feXx|b483k-R~7HzcQ_k_@s7%uZS=<q+_-(+e}+=
z-bO~w9A9qNhD>w{h8iRK4dFq!s);T@6)qcDJopy%7>p>%6kauW)oHMkIDp4JFLXH}
z0FnG)qFD7+T<wJq_J+o=Fh2aToXh<UY)KQkJ}<GdE-^0s>Lx@oE&V1Wq$Fi&Nk>w7
z(T~kLVRhr<U`{VCTK)Q-=;L$|{<sUqgoe}%m!~`hP@V<gN;v(vmhOSm>N<mM34Iop
z6Z?esMH}G&irDZ%CM+~w4Z9D2UPnYugjFwvjV!c+1uJ9mHY~KD>V!aNpZ>kxHJ?MP
zsK{6=QO3+B353OZ?OnZErA*4b<7TcND>51xTf94EdL9WGwp2WMsgDs)Uf5Wr)b0Ep
z<q^}Cs&2)O4TGUEtTHA%q^F<wzQ&30gwm2~bM<~2S9knIIFkM~cJ6OvZda<MI?nG%
zM>}wY=Yj(VHY88p(8QK|;M1-lEgwAVQL#PFdAXjKdJ54BQE@1j0HzIDzx|=RVL2#b
z-@D<lYaIsVLo}TdJ*sJx-h=y7!G;_^{p*0FlW@E5^Ry*9_t;j#fFd7Zv3{n44f!j1
zXuI2W%Gt@Ekk=fZp{mgdfHKppN2N8S9MOhMY*?e~zMFOJWL4=$MPKx6Y!HHHl8zIk
zG({Y2$gvMshur%Ea3+3n{qDDo8zXDNvh{sPIDKVK+35RFn~Hsh;}|s|4U(gH%(|5-
zq17&$H2S-&kY2p8@UqoUn|zA=N!x(Qx=q|z$5FN@SkUa`$tsGA57>Cn_%m;fGbdDc
zY^n#ImoY_l=ehfko&`gq;PXamG{ooexO7e6d8oaA83va;yZ^RprRMkHl=b45?^a*O
zL_(7d;dv@h=@!8D0anfvPFm8})5N+;GYi@Dm2h~ZT{}CmQ>URWrAoId4bh2&u^~#v
zi}ed`fx47UAFpi_{6%3Lu`Ce^O_PdEgfGZr7gzb@v-_a46I!QUXw!;Cuf{GKORcG|
zLEX7b1x@|t?ZJHy(v-C9rRNO1lZ58NFM^hm3a1G+<mu&+bN-kOr9=15ojRt^%G$`L
z`ADv=foC~AE4~OD{nKE2UM=mTv7DTT9{)|^VP`_HHQKav&e+?Q*8B=VcSRVaxzXXL
zUN;R73p~(L4<zrmw?_Uv8Z3a{n*CJyVluU<gA+073;L+gWE%|!wMC^Wv*!8GGMgHK
zU;VeypBDbT0n6+2<p7Xw`u6Srd-&BQu%Gt);2itJa}7nQPdLx_$d5)xH~^aOZ_@c*
zG}syUW0n>lF`L$r@aq6T0WvA-VL2Wg2T~cq)Q9bkrb=&=##&(Uc!VtbOi}>~PkV_+
zp(01y*O~R(1gN!kRXs7g0L0IMn7m1NhDd0lYiC<5jm*>x&UwFA9GB#|N~;LyVpnha
z)Q+!4ZYuQEz*T%*SdSu<oCdO&M|6vqdDm~P8jw7@CGJG0*k|Ryk;T2&1|&ZfqAT{?
zKBM3-^C1^o@+YwZ+)*wU{T}vviJCAB_tq+~b?Ur_U{3DM(RkMA9Nr@I6A|K$TYbQA
zzck&RbK+prV(b=L7+1j(x#a4%-=4EKin5c(wGU3Lwj<GNNxlb2kQUPqcQU-KMY6R$
zSgq>kZR{lf$aFodIl9ut$E)I&r!w@;ofZyEfQqF}X+uUAE&S%*#O8K#t#@+ylD~KK
zg(`n2T=@b~u_0q3FKp}mt|jEc9bHy&Xxh#`Q6u3=ZR#kP?n@iuC{r&nsbo_-S$Z<f
zlWa>P=sxOwl)zhiYGddh+=h7$KiH+c`G=bAdi$uiog~kEkleA?MY^4Op?XfhDa0L&
zpX+cY#=&=m1K~3RO-^8-Cb!8zW8c_@n|Q-cMvP8QPrq>??UN=0&GbAYBwK>il||PT
z*%D+yie)y!0km^JZg2Cabu=@*!McLW^z{9Q11Y1&pC%kI(<|eX9xtt@*Vs!LJrkOl
z9^T+($|m<ucT931W%T&ddPWD*lOt-ykQy~aEuK=?Q~FuJQ+I}K7(n18&jFw&sYx9`
z0=pU?_47QEk(X$CsBvdNzqunWHo8Ap^I~zT@9<c9J%zkJ4q)E`96JMGn&=h<9-&Y$
z=3{cgR_rD=dX+C7K*9#Li9Q%|)Q`n2hVTNILzttJU&{70Lju~2z-p~3He|t~Ya`A^
z<ps05{{07M>UN}a-sDM=Vq20$$1(vR`8ebCc0(3}GXeNCEyGgCPr5+<vi!kGop(Up
zuSzfPw(EDG1GDxu155o6Sq;bGv`F;<Y8B0YH21b*b~54DS-+-Prg=I(T2{b>hNB@J
zQPK0jzR@7xd^o&pZ>Pu8;Hynz&lH)ttL_temNRvZGI|vm4N~b502?x^ck3L>D}uk{
z&&fkFP3}U2113~@3Tn(yoyY<<`VOkco{(9uC0G%cb7e<R_MbPk`RmJUu(O>{-=g}Y
z9KKd>KVJ|qp(0guu1Rr%^*F6G^%2(0>sgz6RBrPK0$(o|?A);^KP75#uBitQ@gOvY
zGw+=8JMx782^I9_r)t=G5MhUp03KawVut)T>e-$OcOl7W{f{fIkIzMQ$1p!IO~!3;
z#m9w58KyLgxva5iceK~gK~2$=Hes5k^eyb>2kfTo5-@%DAcb?;gy%~S@NT-=+?!;n
z<hC7y>wyW!tg$_`lU^#M-bHTjA*#HBm{5_bslMnP#Pv|J3MPKjhO7@7Qn6I;qEIU2
z@A3OP<?l~5!7wUI5N|1?DHhB8D_eDbdkx|cL-VGoT<|zO-5Ddia>9X>HE^#-%=zon
z!N>4NSa6*>vy#z9^6@!i^+!6#JXLXyrA6mNmXTj%ot*v#+``THsMxdVkLa@H6&hC0
z1D2b88ZA0JDH^hbKvM1T9oUc$r@I|VZVrd89Jy9>YF4I_Ne8Ll%AJu`W5;(V7}Ub_
z$#YbTkEQ;akZ^R2bB(TL+9b6iv)GU}d7GY}RuM#ebzA>F*Oyf^4~_2)#e_$dUMc`D
zIgBjIm!OTbA-nz~FRDEPRp>XNZB+Lal^8u4Pq<5h0^!jPQt8QGN>b0@h|1NqYHqc4
z9X5Zn2>hZr1FpCt(rLm)qF!sl22fgeChD9{h)Yt#T|iwNipN$TQ78Acn>KR#!KwZE
z+Et<5^?C!{1u>`&S|p;#tupTG)Z{80Au~6A^+%hNWvB`p{o=A?TTGfCHx8?Fau--a
zs`}U1pKE6^s~^U2)V*|)N;|e*w@X?7-Q3vCCC!>3Pg0>lCOoPMQm|0@1?kcIhVt^K
zCz%u~(e%}@+}G(^BpZ6wQAuk+V_1hwXePy@SrIe>Cl?j_{O46yKQw}mPZjLi<!sgF
zLuvO+dLUaQVka}<B2C@R`3$?K`S--P2MTnl)49;WPLOk(H}{=kxxEjQCjXxP^%ItH
zw*^-oe;Hvx%3M5zVnap^?L4SZesC?__&UDM##A&TC{VOb{)7ro86YDzUOM!R`Zv<_
z8#j}cvsRBsX}Z4zN5%4PC);O^q<$s8HbD?eO~-^ba&gJUyNM%j!`5zz$vJv{T6%c(
zDi^Iv7NwE~uxO)wG624T?n-Cdw>M)YL`~0AZ>HiH(8W#eAFB%vS?b)PF!v8PDUK*6
ze$|N|`nN3xu@~pyW0SkRyW?{kxP+*tR3>&O9~>V1)*aB4KKn(#MW_)}P;+QQPTziZ
z<J4w|W3^bcv((8{&FE}5IzXjlALU{&AYwxb-~7y($puIHPpf|YGJH%p6{z=ywHkL<
zO*&4TRoLit;S5Pvu~0qDML)bGCniNBqu7vJbsqP=c|X6MtbgD6R;T?mF-ac<nlGWz
z5wj=v^E?mozlCC~yEpw5mwNIk6lRK@pRDrdPd1I)HB?0n`AF(osdr-K-5GhT{iyO_
zXrJlQX3BGiS8kD%kHjtv<627Qlt?pRR4%yD*0}%J>wRx#p`&0lbtwU@i-K6L>s^lg
zmkI7P=WhM@O3(fDgA88tLDtarI0o2|c~cH|N|PBb>pt)P!zb>3AIlY@+KLTnI%S9Z
zMoY-1FZ<oU!&0|@;A86I&csJug!7ubSW&#mp_QWMs5U1gbDo9)v_4Wt5;o+uyJ%GN
zyAbF&UVUiZ1zY|_in_0s-q+&9#L(+|!@!Z27ikNhqsLC^e1+wE`O+!Az_PyahCPce
zLV@-TxlXp;GSN<#YEeP#mDDeBSk03y?5_^{;Iz?xNuI)Ge@O3R?8Gs}P%F4ftB#Am
z*#>@}Cdq>*+&Y8(k|!)RX_+*XJ-{z*NUC6K>b&RSz*%5Q>jwj_)<JS235153H3`yP
znyS~-vgMz(?C})RDu*{qS0@vTbqB~5wJ;wi=E0Hs*W0e|Ng&X+;m_z1E3Yz{1l+!8
z`kZfE+`bIPp@N1m`_L|i*wG*r21Vocwu|FWgQ_vF@u`3tbpSNOrYT~B7Mj`0(p$rZ
zF6<jV0|IcPir#D+?(~XW%E3XA5^KUS&=EKmB@(SrY{=Ny89zTM{fV8l8<zS_p?xl@
zVJX>dm+U;2|7J4e-?raV`QL-bXzHk>&vI~j3hD|rB(6!zzqTzc33pDW*Sc0c-)E>R
zzB53n--S6}N{`EuSiKzhzekq(c1@o`Ij9+D8gQCLa}J2Wh&gdp!G_Fte_J483ls&q
zHGji@+Y6Sa-TTNVQcO4~MsMZx{0gsk2Z!}{(8CK5wIWe$$g-;T2KNgC!#~UzGQUyt
zRFtUUkoO(%sg6Zv<%6XOkB*;tW0z_1>JMbn)>fzHMLnP@Y0zjtt_2e!5|gu3L`IB7
zGRBK1?AbZJ++XnJ(vs0?#%Uhfw-lN2CQM3Dd<Ik%%Zo)?Ui#EcyFclr)lPmGTea_v
zuB|9R)96dqY9L%BDe2oP95QAfD`{agXhR|^7wTP6fud*}@Oe&>DF(pxq9`h0TBO=`
z)7NgAowf+9E0sOpSDRkpJRQV9eGG()6unGWVcN;7nO=sz=C0VH-(R^)sT$PO_c4ck
zA8oo#3z;3mZ6csA6lWrvj`~N$4b|ukrN|YW8oj)yhVBc0S!1Pj(z8Q!`}CcNFMsL$
z)-RXFEtv<t*XAc<pH?mM@Z*AAj=W++Ot>gm?|v$ofKzw+gg7<P5gBV(1x#NJ0yUES
z@U*14Jo`=0(}6TvzSI)Eh{CZbk74tt4S7(0QU_&6kX;8*Vf{OK0%7`~>B0fg4s}P+
z+Qx>&jvv)&_NOo{IbiG^JJd<F<b$vMJ$PO|u$DRCOKEx{sc9g5!?MUfHz|L2(t8}#
zG?FP~#WBQ2|8$uSpkRz5mGn(=o6THyHuJLuV4!dyphT(1jJeIe8B{dt*?h>9=YX$%
zqT5Ujf-@`hlhzKzhV&Yk>h<(aa5~@s4u*cV7S14x@@oSa25d-Zx@(^|I{^t!9KfO1
zaoi{rI&?u&KG2fl-A}jq3mi`z02DuIIzdvJPM7A1w>xhRu@eqp&jK7+C6ldHp-hS7
zBpf0+ATjBAg`>roWS%n2uhPTuIv}C=`HJ7f5j9*V=eC2KB@Hmh?}9E1i<IYdMGcy`
zy%v-x{4gP+`ql2A)7>Q{=1;FR!3VR9g-h|LZ{{Dexe-l}(ocW#2}hWL%&!4qRd)4z
zXUfd$@q23bJUkB^xb1J{%%81G)c__FodejAn%B1NY%v{Hgh!WqrMhvJUI_ASlmCfg
z!G`27Jgst{i;&D;duXS2YT9SUQ;mE~6sMZa%ZlEa-2#%TB)5V%2~oRSv;76m!M;t;
zdlDgi>%X0S8h=PbPZ@??hsFprG@Qk3D(jVF`2|JPTFJMj%4ZtkJRIKs<b=!lk3lr_
z&EB(fy3#}vuk&aloQ)biC(^@4%Y}lAxI9Ay=y@T^r$aH!>|Ux~5P%M|kcoUL#7F0N
z(gv!oWKGir!wr1G4l^8C#D;8LVY_&#AV{)BssGaSZOvjB5|)VB$)Bt@VHu{0_=Jdj
zQ}{`)oUtt@LY!}Dhr<hAk59{tFx3Sff4mD7rNm=)89iZ`>IfDXyCcuqcaSxEDrVZ~
z*^N@s<ESz3<q38PbLb4~{@^WTT+Q-<ow26WT+f{_H{J8~we13qnzj{AfTdKyhFr*A
z>A~=}u+6m3)c=QTN^#0)dUM1yNJ)h_*pP-FzL_%hYpCquSd{PQd>x7)gQgmZsQ>Qt
za0MC*Ljaq?<H1Z5__`f;H~T`DMMD$+u+ai+5Mv1)TBl(9YWH!<8FZS?piWFMLN(X#
zJu>ycx=A)YF#ym+ULiWC)ELwiC>V_}HsnFX-l<8&;ey%mMISa6fBFv<rdPa6xr<pV
z@HO)YSG2<cswRpB=$U>TpeBaV2~RCzllT6y<HM^(gW;AM2Y}g+r_h_C^nm4c%JA*;
zHx&Y<GfDXJvZAVKE^&H44jWSU#NCD0E5M1Z;g$mnc4^m&0vg}}aFL?$(co_8&H&#A
zaloa+B#enTkp*nD)CCww*4;_I%~Ps7rWiO!(Q%QiY!QEgW6$h1DTkeZ+=}p&O&my*
zH6=TAg~QB*izH3B-vM2B5PTT~ucM2;w%xkU+O{|>R@)}z>(XpUWjZqr%Dx9A#ey-i
zS*&~JW24UYYh0#eikFXWrL*=qF>@(6*jta-oPK3a>NfB){;1Q;hV#p!3<ADsLk3>B
za;Me5P_JpmoAh-$Jz@m{yfAN|bZ<ffxn2Dc6C0ANf8EU^+W=<y-~P=Vm6L{P4Sn=|
zqT*W`nc1!4t&KUi{|_fB{gx^}&Ec4M@p>P54MScn^c(i<L-tL}tk}OJO=dgk*)6(h
z)5kg4n(mdfr^@Mb1F)ai5ECv^HJVK{m$3~KZEGkFqF_Tl+xTSJnOtAkNv+?us+rzJ
zGNRrY4N}4gMe~D8)z6z@nz~ER5Ed!!-gnTSbtiNvU?+FJnN)n?W5su8Ma(`Z5H8Y{
zya?2Op!3rrS@ZAH{JLb;A&7l%$g%rHs$iO}7dYA~P68%eq^R$FrC`(I6B}0-YBg)i
z0GMy}C-+=BecesEmU#IA#MLkP$~jv}=JC>O?5e-n>m;M-wKurtmX&v)g~*g<(OW?S
zm;tAU^|*}#IOg!26x)$5a_a(d@0$|Wzw>#VAYOfwef+{0tDCXdod*-({yv{sC`s>a
z4?nTMJ~$vdWtL=Dr<W(-tNdcsfRXOL-Zz}YjaYfLsy1j-xAIjWRvlh%!qMyB=f%}Z
zY|T`!AL5*laiZ0Ny~nwsaz^K0pU?gBb6ST&;5<SBKK91pAvKcRdwR&eCmy<D1hU7n
z;cKuVBYx^0wqX#Q;|2}r|7=)w8a?!K7WlTu3dUtqsuh4FxcEPc6&pT?2G|UXn{2IE
zksdarTDHuI|AjzcXF>TF9bY#t%G|f!fjP0`$Tv*qj(anG>+AoZg72Zs_d5SVYfAgx
zan$NCD?qGHq>BwX?>;+WcFVOk62JAss~3A{I=E@Gk^-!fPmNv0gYN`Z>3=J!*c6(w
zXB3eq8A!NuK;`dv{M?1q8{k2x-^dqD&P>e;wqfs)J;$y%{I^f5s}QQ+OITK6c|H;W
zUkAd5ROp$!+f@e~t?877Q&WxIO;;>0&6N|B0-^d`D8<Tdp^Cw@V{<~jyk)YNfWoX7
zLjH7IW(%}G?|>xjEYGTKI~xf#;2YGa`XTq<G+<~@4&TW$rkq-sF9tMu!xX+bmKgwf
zan`ZrnmwFK>k)WudI|`X`w@i+6Xa<S^4pJ4t@UQqgynCmv0M`4VMI>Cx1u&-qb;wn
zNb=PZS0E#zJZl8SO=&xCxwSeJP8U_~pZj_@%QTk`X(CW!p)nE`D7iejW{zJzgTP<G
z6?0sRT7TtxpOk&jBFJLG#o?FZcx_NL^uTLThhh)0A^)suyFY&~s1G>&_WP?Jdb5aA
zzzKtbVbbZdu0U_kXW$3e^ZT&8cii-HRY3EZR$<3RUxi4SYe%wv+JN6YH-99_A|=LN
zKUTZJ^zrX)Wbc-5ny;VsH5HFROGWAnoPBXW!iE&SGNxwbaJVGZ(Ng-*<?-yEg17Y{
zB1!Tp&1*xDnQNNN>F{G_dP?+0l?FsTj#9>kM1|BUQn>pW8~LjD57XCouj0!R75koS
zqy1LkUEJeVjp1tCjfpdQOr@zaW+OtPD%p1?T)GN)JM1>#7%I?!vHl7<#)h<sEqv(m
zt7kTnE8mB@<ubft2NQ4Hyl9BzW9u$m`>`RJiw&6h_Aaah{nPHuI5ma_@(oiO4+uQ?
zCF%m?NgDZVXcllW)Gj~Z>k756nLPY1<TR3UDp}keA3gu#`5JI$X6jaQ)!(_AQcduh
zm=%#A#&r$0x(O5I<8{W|i<sI>5k95X5nJmW7z$c6vVZ0^wP&&znAox919$)=IvidK
z<iX*9JNAxP7d?OrbXEWs{K~JkwA|ZZ6RR<AnqrdSEXC|hxO71fHzrlQ#mc*BMKNQe
zeItA(Y}{S%7dv#^j|D3!A4T(nizNMBx0KTaZ@lT<^vP1V2Uq&}=5BFqUQ^AJ!;;jv
zq(dS*VN7ULy3)2xYwuj~*-!l>&A(tskHlUhqx$Zr2^Z-KRak|>)bs~s%7mjM@ynk7
zAA%g$NRaxLOayhO2selS2ZAPCB<Qu*iW{l&iJxWSE`sVy>-Q#J9LkQ-CY6=t>O>J?
zLrl1IJpEs1l|$mprWnUlyVp?_GOR$dQ6YxKgoiY}EH33Hy2!G%f{R`Bt8fU=8(y-r
z?Ag%+e-}%>V<Q{@aZ8cEM$kd95`}Y(Kc+uVJL|2yB6Usfte#iIKAe1!t<)(~UK1|T
z70N4)aWX+Y607FemnWh8YBoW|^-=YPKFQ?m(}d=8K$}YIt=K>LH=fDk7M-oXjnz&8
zf%+H#7wPJOnxQZh{^sXO8%Z8}c=E}emuVMMl2gGZwuFepj5Wj9<xp*g3Vr9bxJZr@
zb>_Z%%t~DNCm8^d%GFyoVqdT*tzmqW?$D6&+tW|m5n+du;IswDW;lB@Bh%ZVB0EJ&
z!T2cHka|zQNT_xK;$M6I{ns;iNjGW^d7}znOc2FlsQa$G+44ze_^f!f=3lS-GaoBD
z=go0Tv@KdO+d}Muy-v9AUa|gbBc*a?ep@zuT53tjrY+5{U|uKbay9qN6Luau>U)w1
zA<0L$wK={zxH}$_;@D*dS}x7Bh{-Nmv7q#IEM0UZH>d*-A>r7FFr285Bp-RpSMGjr
zJ=Pn@{z<`?A$98oG;KXOP=UV!F_Gb;{w>*J&2<RT)Yvz9<i9jdXyQ{|Y{eYu(Edit
zYo%b%J(hpz;motGRH~ALi)I~Ae~v|Y3$$oM4*YmLcf$)%k8)<os`H1`>Vk|)tDKhB
zEe=8hqns@cu7PR@%cs@pUNYzix-4{`)<e)K?lKa`yoonYWb?F!^o@=q&OFF-`!=Eo
z&$^WTsGLKk#)h<MKC0G=Q&pf=RKy<@H#|4ig~T*tPDYHA9$J)cX6rGdtMF2`L<C8<
z>{?y_-TwX}oFgxg#e*i?sEO)t*kW!;Xo8Zy3Q9f+pM}|Iv>zMN%6{eUvVPZ~GGO{v
zHxiD1pms6ae^qBJtzD_Cz;2n=6us6c_rTz;pDkX6FRx<}r$i-|(EI*NP=_eCykP59
z0@$KPebW9HB+*4)RDhhV5!vFO4tprSVpG9OXPi}m#LTxnkPmvk_o!VDYEq@wkvt8c
zf9}xeIA?@|M|=$)G!r^bG{bOY1+wlSaFAg_r&v$cj~`jH^EGhST`6~~e(Ue5vdPA2
zU=@p2h?oh#1I!Zr5`b_3d?YLfVSdBz(oY&#q(jS~O&|JfIRy7QgCE}LyzC*1Ql{w8
zV!}j%Ue=fhO~^DqoE+tu9u8Gj_KZyzb+Ju5+Ep)1$!8*QYr-@xV<N-XLK6vCHbG=7
zYne)KVHwMDw|@8cBXhG6^-)kRNGd3Ibla$;Lf_rBkrk~*)Ht#(C*4%M?I77@=S1;h
zqu*5|w%h{-W>0&`bbQ484|k5RB&c(t#A*ee9N}>h5Rp?_f_~A4EWbCr-}K&a@Z|u`
znE)db028HTa-X2f!)?JX8LztOwkHRWt_j<BeiTR1uCtG$UH2KlR?FjtDqC|En-siz
zy%wahv+Et_=+0=GIchlDh^;7YY={XDd#jsO;`W0~i{%Y2fkgdFHRmR6IFn+t%7o}s
zv?2pcK7_2C(q~6!2NZc`dH4G%QLh1Q0zCp>Zj4JMF4>ifa~*rjy3Ef`S`n|!xEUEF
z<@;2jr-R5wfY-dE#?COHWEdN^@DAZF$05F0ZvX?MHuN4H6DAdycX%KVb}cWXnhjxW
z$oq>o`;91yMI;xGE}M0CKGTxOJ`ris2wo?VOxso|%}sVuNMFHK-#(GV5!U_N$G{@7
z=vd<=9T((g<{Zr`U?tph;KH9r`-*#9bW%(#<X`X#ydW%^frAbC=eJrd8kDoxNxqF?
zXWd0ZDBH5%pd<EBOQi^ahLQ@6gpX;$_k&=A#IzRSxt6t=N3pbWX$w-U%_c-Tb$E)3
zFgN5&{mEayTl@7s$hPeJVQ|}3A#G{z0$O(wAUSHU5ECxa3lw;>NP)K*IiDACghPhP
z&g6~X|2Eh{37e2TKcH|m6Jid+*boykRYPwtVp_D6mcjErlpj(f_-9*iK{QM^-_a(f
z`Vt<}40y-N=b+9Qow(!j^p73Gtk_j-bR{4h5y^&xgBRPW#Ih3A>#(0%=82eYnMbd9
z^1~vytW#jNrS`f1*aZdC;w`5S1;F(wUy3^nh=Y8ECw$F-e=R)@!f_$@*_%;WDn6#_
zYml$(rVW6HG))SjVrd|5=6#Q<hz*JAakXXFdvG~yLqu%R2GiIiH6v38yrxY7kdd<S
zaIJ`f-13FjAzK$jw$5|GMm%9hCzH~ds1m2dmd!eG-MmHLu7aBYt#{-nr)W{GfU{0S
z{x)|@-Ws+ZeE!F?6h8F*>U4Bz6L;4!TJ25;3!5u8(V+LHEO69&f!7XY`7bnvt;vLh
zqS28&jZsZ0lDsoA7aQCs<bZ!lPJ972`m;JfRnB{7$&Js`0hB*RoGNm4*3`d)+x+&{
zKP#>|&Z=Mp6en8kbh{xYTtg4lYZ5^#!r16vMkTGAUf$IpoYnd;j=LxYAaC{h-58EY
zd+EJ!UBd~j^-@Sk|M1J}o&6@Xc)?1d7$z3Y+0fKmFsu7n`LPYgJ)m#|s-7VKa^lE4
zS?fHe2B5#<b{1Al3tcn%cX3Ir*{dEV*34kqG-YQyO>@D9T#d37bS{P?X}?RoHt%uM
z3x-Cq9zfA()l7VdhM(8yAo?h#CkF&No_h4j&}@*`GU#o(xX{LI2a-2-nMaY8X+op4
zd=%l67m7g{V*g&a7#8DH*~!!K&5BTYh}_-l`hd&I!iqaWWM)#_tMMe6mirGlaAJ|@
zTkeM}$%7$OR`Aa<+18ZK_kWdLd0bY-*B5;d+%Pr8awA+yb4ATE0!d2LOiZ)P^$~Em
z3G#Tw1xv*gElI>B7u-ejlUv&BZkecoTdujLnVGmHF1h6Xo-^~@JLlecKz{!W_mAhx
znK^T2J1gHLD)dbl46jY}GX>vTr=Em&ka93xs;rq;QsV=cuyso$`bO#;VE~x%VPy|L
zTiv29J-4%+z8f}-g9K#y=^D#lZzx1tvZuC3_L$e5$BizhWJUhMJyq=5KB||J>@jk#
zvq9_o4i6Z6L#PtWIh4~u=TOiCol(W$<jm_&MDShy(kWMwq5Ls3;6G~t%8r_f^obuw
zjc<BIcq-eR#bvlO?XBTA&n67K@^*t!q6Cu-NgdneWGG0S!F;km(kqVn9uZLphYNjg
zRe(rPRVV4a$k8vkEAC~cliAKflU0CLN#%+%x1`Dmsdj5$m(Cx8q(;X?9P1N%hf^!$
zqExU*kmSeIHo+cftVKCMv*5fi#Oy2d02Lt8vx&eoLQ;x=Y1f^-+UNMwKgD{qA*t}l
z&YHe>!id9T6bi{6p%;XtDh>AgB~G4wlP^k}+5AoD?kS&m=P;3_oTP9s_1^jg5q_W&
zH$HI3vaC)XfUQ>$Pg;3)2qgy?qm2*1*{D*7a0xWeRpSGI`Q=uTDDxR%eBh+ebf+ZD
zpI)lO&$k&_hL1m6@a!}RmJ6PI4eRJC1lg9NoP!d33+p}Tt`2*F?g|?=JN4d-*l~~+
z#P~qo(v$Kv+@M=P1AY(%z?7lNbgOhDF%tf<o|P}Zb8V!kYgV8TN%>Q-T;}r&C!iYJ
zyx`$!sn2_X>eTW1_r7l53!5NFuMMiJRgip~MAxfJojo0ASW0-;w1@jbSiOtiG)iq;
zh`mIPQ^E2n^_Yy0k{nWN-G^6ifpKkb*yMQjR5;;DWeQIZ+MmxOzvznFt^!iV7mYh}
z46ZEd@%Pu}=r)<n!CJjOGN9}Ic0uCO6Eh6LB=P1!H8=bgf(=tZoES+5toMSS8M`Fk
zzOXUt2QmLwV}^GA#D^0rP-qIkDm3v%aLNaj_0G6B7^K`PjkG>yejivH#8~AnHBrFt
z6=s6dW)Zb~qj*b=Gagmr`1-fp{ynQL6r3_Po*?8ooOC*_Ro9*-Ezn>$_Wd-zR)@19
zb=0#Y#k{T<CK}i$BnI!(pbh0F4`X%ohL<WvJ;@W+xHqyTn_ga0r{eG8Ze~c0h87#$
zDMU>!hqt<V5A8l2;y@2w|9oTk)hpt?;esGCcm|`eHASX2gU0f_Rba|w$WxB)6*<ka
zPEGLw9Y?hR(L>kl^?kOmNz0CcMVgXH5!g|*4Ot%VU#BdK`Zxg;4O>Ga((kUZnXz<f
z`=aj$1%#Arr#OFmxo<fENE#b9>d>VWR|(K<??3m+HD{yS&pvDlz#>(WEnAk@q8pQV
zo5EX1xJq6BUnnYAK2EC(ZEGBx%Pux%p~gPbhkV+wMP)vZHXXiauU!S{fhNXDo$`ws
zJSZ_C-fb7M+GY&5Ff$aHzp|_yZ-DYHTnx#UtRQVn#)I{gBN2)aSj5Pzer9|iK{7Wr
zkQmn_QaLhyY!**LVp3wSA#3xXv5+#WQ2&^;to49#5BY>jkmoWk3dl-HMmbQ?5%mlq
z$3^$gOD5keEwn$+qNITM{8?(c=`!$xk~92h*zO8i^oQL%B)5=ieab}zXHfK*6^dT{
z%-eX<umhtn_zIs{%hvCiV!ZbH>CgN8WN5lYC`UmLWVwhhAFSH{^h=u{{JM17l#ec6
zvOSQw)>hdy%$-~B)F5!e?m}}$!SPu)v^OLtKb?k-3(F0xxM`_TGDp0MEKKoiHB)d%
zj4T1q7DmHXz(h#RCN9kc<$2*KC_d%Z_05$`Zson?|D2SL2Ul!^@Q!1v&sMnFWv-`<
z>0exTw{hK3F;kF8)4~_2C8Ye^U*YiN$v1X@chH9o>U>>8Sn<tOba^_^IaLNKTIAy>
zp}_eZ8mG2?6Z^_zjVMi_{Dze)E>R*-(4?79sV4<wn?UXup~$9b$`%Vh>wh_46s(P6
zE^M~Oh17`y#m4RAyc|+9FTT0`M7*&0SSG^rsx>3v3<GmvwrJDQNGPe+^7UG(H>p1F
zz)pHYW7(w_Hu|GfW-4T4HtJ2_fndQ6!XqIO8jF-EI4)&`o)(3;rHJ#^`4Nf@OI+(a
zqxuEVgN_NBU*br6;e<`;X_FDhr_WIkPN64pl-{b{bLvm%1=$8GKdCmm;nCuJ9Z`BZ
zFSOD_j8FDc!722fgS&)&9>xUYD}$4c4XcpeWYNkIKyS-~;9#FY!kOMe?>_$4J-z~P
z3cWXx9<O`mt&M^1@`eT8sXRHOMDtKKzj@Toc8MRT<MY9J_r-a4Xs;p;8`eE_=JDL(
z;LEn;`o+Yq(>ic3GctYp1MKEQXkgm;-5DEJW2sl}{*vIF);BMy<D<w1T&+xpr~N^?
z=?C8$HmuLl*pJV6K`D-_Z~4?6-~0=;n;LeL56_{GMB3P}VfUTGN8SN(SvT_eTJviJ
zVK;4l)0RlJd+=X0Y}mA4zKL$4zZ1&t%*t&vVex3Sr(M9`S}?|2%R<Ir!?Ie&emvd_
z9>|f!23`0yUF74ZBh)Lw&vbuifT0E8lnLAl<xkWMy*3@4@Uph-5|@x3&+JRLc?E~`
zOs7Zwv~~McegiY7VZ-_@eP{NiZ(N~lUd7a{#p8$KERd(FKNk|=gn{-kmRj3&?omAm
zRt!3K<A<y(JW;nvf|fW-eF;cl!@e8*$?MyT#)Pueg&C|qi^mBotQmICvUZ)XW<VC{
zO40ptCf()!u=rY$6~#$~Ny-b;N@XY?fhdWC<KD2G84gm-Zs6?p^C#|vd>&(}Cl&7%
zUK4w2dmG8O9}Nf@F?`CDnxSAe5^?c7B8^bvuW2_ml5X?j?<4*x@(RRUX6DpCR9^Vd
z+Rc8%|BM%n<qg}{_;k&RI=J*595XVq*At#Z#Po;a6Ybtj0&v-2V|q5wG#=D<FcyF5
zMoFL8S>F9}LcRxANu$adaD<{{+6P+ycG=c#8S$4ODUFe_2T+Q8nT)}8=q{9JY}l9<
z2M(PX59wn?-g{omoN!XcFFHv4;tM{Jn^p!uQqXgmRS%s_s*CeR{j@vazZYZE&Vnk1
zH>|-cN&TXJ3khZKwtV^Wx54l7*|w(Zl5uhl?KbWs*sv$A+Jn!ff=hY$KQ#ll|M?mM
z<qc&GVI*>1u-}wNBPpFHmdKzBD$3%iH7A7C-gW=;)_az6o0dH|MaD8X^m;g4Y}lO6
znQyFo1Kg|rb4=~s_Xy9A`wU;>#f?^0soSzrD65e^Ze+jK0XR5ywGzgV&EdhdnDL*U
zxe&tsE}g1h*uj(Is#xi*;UK<05%-tY>68N*42%Tq$e{d9{SKX{*usXf&EdJrr$UT*
zzuFTn>le5qr)NW9C!7y#*yWdUruqK>F};Sa4(HG`_DPE*Eiho#CC^Qq{{7f0JZ-nc
z+?GN{G*?2K1PN&jT|Lkt=AC@vR}3c!8vmP*J%Fmo+UtiW|J4HS>qZ_bAZ9r?q|TY9
zf-C;-p|pudAZu08;IJ1i>^#nW4LxgD9r{olCN}KKyd~Ky`rHS9I{zb`R^R4@=PcCd
zUdiPX8#eb+y?4S+Lu&p9EHgWMEl)#a+hnBzimn60q(Y4{<hdnvNOUWju<&rX)Zbw%
z5>-*TAEoU8kxzQc%i}4}4GcUFuU%2tN+j0u@cyKBZnFd<sf12?D4&rOWQ5jPGHqMm
zgZvIE_Ag@Hsu<s{>pU0axEcCJVC;;bJ^X%ey9sGn8cY-w@z#zxA>98wG;CJYpdsJh
zT^h=Ye!jcM{Aw5Y-OC2mTfy2A1<7baui!E7bxwYI0z&WIA1KhoY{aAUI>HiztI*{J
zKoA>t>YOX)cuycWD*MkLr)K=kcW95635Qk`H(G4iqoTfF=l%srW4aymDRXC0YmOqc
zI^%K{UY6R`CV;|*_1rrsYHx`TpbYEz9^Y;JauUDhmBxZn{d91J2F<U=V@%Sqll191
zwp(V~z=oi~wN$01K;4BDQ$UO@FCPVn7q1eiRf)lv2aWqtO%>$iMK<Zy@%;l|gdJ~1
zi%yp!T*6UIq6Do`h@#hD1%<S%Wr4Ahl^zHUj7~<xgnfA-BIoc8P>1h2(j+!RxGFrm
z&YA+_msmqpk7{)JWTni!)U4FnHy4AUCwTt8qBH!2?!dA=NSy;+<qA%rCv`ZK-hCe}
zyua&e2z%T$V8gnQx5ab9b3Z9P1&8!}@EU+)<GbB3oNsTPyHsMsT9xwg52^*{+^$xu
zTMhq1D7DBU(9n}uPlQ(vOkDvmJ~Ud2kGl#V66DZks&i9oL;wA0V=IF{?nlnIf|8br
z01iS<C#F`8$Onex6zdni!F3R_$@dv-*sY3ZKO43i9$8JR3~+d-<P!u*W7v3dD{R=H
z^M6ECJOF;yxkGBFbWMKh(Fcddut~4WT`!H;GN3FNm>iGRRh!dcAK%iHo1?rFQ;q1g
zqK|_khGXbb;*~utNdy2}1WpPL6#(Is0NxvYYS-9OY8tP(YE$=n_Ir=L71X!d?t_Lw
zM5O#uIvb7C7%QeU09Y%ogJ!B0BS)zREq`nLH8)St?kY%}Rhx&uhBQC5(+t>h``*0b
zbwXM79wUpjj2gjLh;5|wq>;T<kX(}Nmow=$Obxy@|CzY?NSzl#S#Z>yUppP`q^?VR
zSE?}|W6N&*X-5d;#g5C0TeEX-BkLub+KD3(j}3eKQjNWV{uLmP$@EDHKWu2vcYf0|
zl|L{}J?|Wnpn=2NU{{<L1tp|-2!`btP^_akH}b!Dc8XO%$RbZ5x@Z0T#l5E+XMhCJ
zco+#fhXZpT`vLfk4O2i|0IU}VX&|EH{JKBt|9%YQT-h?Je)#xpVk!zH01DCrO}R)Y
z%>k9ueh51VM%c6KViL-?7m-;unw|w+L2{0o+GDOGUx-^QCAU;RQ_AZxq+t?i{QtCB
znAXAX_4Np%OG*JDB@cm;bho+p+u(W4)_@-5*kf1w;IYD!-m=@sW0BGl^}FDX5gnSk
zBw}kIinX#Qm%;U`nB11#%6>k<4+=16-=98XzrP4aCf7@8Z=f96?7e!y#ZKT*a<cW^
z`92WD%%$06<4u$+CE=F>vhrTCky5%|<V5>Q3nA%e=~E4Iilq0kQSxlvQ$Q9<T6N@v
z&~S3;7fV2td9DVfc*6&0C0`Pjefa|KgR{)t0VwAc5K^+t*jGqw0yGwp@>>~KYkA~t
zC{8nF*q+f{3ull}KuC-p*<5`2+NSQuX(Klu^%_wulwDZ6=+*NH?oiGAJe8=w(XC_s
zx;)tU6kI{7#@GG5GS>*%9F?fYS_7PRY~1nD5S031Q|E>iRooH3R+19wO%%WTXJ*YR
z7XlTqBK!Xu8@6g8pYQyf-I^jnY?uPGu||6lr(px12CW7B;SF0BRBX@rpSy*!9?A9U
zZ%a=X)be=@6aYhNw*5yQdQ_Z0I~iGFSPJO$ZY{qP*tE@PPOy+mRl(ZEsCPzo@Ry4>
z8KZC7^z4&cV2oQzIxqY57aYxh77Ie!3Cb&?x7NBoFclj%(tFs=12sp6vQI93o0$B|
zM1`sA&AD(C1oObue{qD|5=ogF_*1p3b-G*(VR_j()4jsP2<6K4yhkV?BxhN<(#?qy
zi+FN8uX{1jG~}@dS4M5KnJ;y@i_vXD0U<HjLwWI_lw1jaFG<UQhidVt9WQNJV$ad!
zc~}Za%o&eA)Zy`Q8L!tOJ<~7@+mR26Wo!GC{MZFAN8<zc^pfZ{1#eD#wqzjlXF~($
zoD;vXF(Y=(4=YM@;AAflD48!N<LsF)@9qKZknv$f={$$G`<5bUiJW;WA^56yNVg_E
zR`Q!Xc#|f?yR<kFZi!1=AA;oQ!D=dOgg4E4eu7(o`alHg&{#&N0Fj+m-~a?BAdo(c
zO|LfNfJJUvfv-R>_1c0n@<pux6^hz1q&U<*MpNZuSZq{^p2w&FRf-q!@&B2f;__cc
zz25FC*yWQa96EFTQ7yjEEhem5WQb1u#)c_4n~Z8ZaDa0OIb;vhy4{1|Aka1R3K^8r
z2Z|`!1yn~0LUY3j32G&M{nq@Pl_y~~QTr58{gD`5v8IZZ`iPU&pl!zcz(eS$MbONA
zDMqM4;rgh+>>SyH)Wp_KhPHCR6#b2^aGLD(-_*7x=-1ULAC9BrGe;M#0z`TqYD&4+
z5NE&0?*scoLhx3<|2yCg^R#>U9LK5SHLNH%MbZ#RoMQNG!W>xkTKbAc84*(_)Z6fs
zF-T%J%V0=q%&^2btuO9MO^{$YMK8t6oPiqi+pquJ<&}PlFZfcuV<FS2*eLYPNM(zd
zb{rp9YB5nBjo^@CiQaJuQBG9dXkJKdAv7@S0f@qeUG0&2XYyEh?N4i2u}S~c;(;Jh
z`fvElz0g=hOhExHy#oG}r$Fn8zxNhS$i3j3#UCHH?&c?unfp<X#(i^-y1muy4`vw>
z?;tr*ABN?Av#R975H`QF-nQu_u8&X*A@Z&5AoiC(<6b`6Y&k%?^~)PRYljE}rK?<P
zhfLucnYT6*zInrroqE&t;}Wp>G@t!p>4?+9DVyT-#yHj{I828ggx}b(rLFq0LvMl}
zEU4M`{oVYY!^eyT7KJ~J<}i}tBddJJ)^9(7XL_fq?V3cb5gr3RF%V>c^OlSn>k!1y
zc{80^j1OEtCWc!YYH&Jau8p6%({)T$&mdiH?C$l$@5E6D@BBC?6%qm0n%|EFju9Rk
z))S#OGIE@t=!8FF73?pPrpG@4<+uTaPFiu2AYJ5-4y-EHuQUX{FHfHIMV;sFsy*cj
zadGI;)AGt!hYzhU0l;?UXO<oR?+p*9rRSb1KwLf6uC~Boy^ceqr)AB7nP1&~3Tif5
z<jM-9W0dPv0U|}RP3vXw<nkli1D}he#vv!a+z5s`npY@)dI8vJY-C9lBe#$;7Xxt)
zm3xF)VOu2eK8Wf|&)uZkrde*Md&-t--9KByXOO`7U0ojm6fI(HnuW#wxq#0ff$5%)
zJOyUsrN%w9M%t+fBI$<n=XZsqroimfo+2apxlB)?u#c)tuk0)m%0gH9_NY6pjB*K>
zgLB324sMH`6X#8VAvL<IXbE`2y5G)a@PA;#qF?sk`a(J+43Dm#?Opb|cso;^#eb;)
zoI<ZL?nwTenOYg3%^S9UMvEs&A3-s!YvI**wMj}=uT;fRpoRZZK{$opVsKH=x%(O2
z0i%Pj{808HlxA8wF*!ZCcVm^_AIJ;$O*{a<v0(~Mq4#ca`0YdZEr_P%OT#d~>2<yb
zr-~~bALYDy!fjBY{$QT{vmW+5)0x$V0yh_Dzwb=TZDv*6dX6R<IC*2WBdv}@If4F}
zNux{gr1Z9TFSpW`0`9{JBm=Lfy_WOdny(<=wVqL<Vc-XiRF|%oQ8u}+B4y^z`;U?;
zH-h_c*v6tI@7%uWzH|`ZNa_QKd=$)7a0)XU<K(%8Q{s*}SJo_j0#3?YN4);u;--A^
z<f}3Q3Ge_9x~C{0g;*(+uo7a+<XQ}D*tQo==DmLsw&->@cFcIYgGi-oSqXG-1>lgL
zuW2-u3Qfw%T4lp4X@3DHZ#VpIZmCa&nB=Dgk_=H`NQ+n_wN!MCYY)S*oIb0<$M<9@
zB_URA_R*QsSG?lhQ{oaB6OYQuz5rW@9HE^2c6o*O%k&2A*pu^_m7LqFqD)d^RS}gb
zP`C++(|p~T2XR@;AwAd3&OTN4O&10piy@iVgDFp1Rht)nG#hrl*448nPHP}|Vlq;H
zgd(Y|Qw4+^u~K^zff(#$IYZ3%PhN$p{aa4mEbah>Fk34?g`(C4DWWygLNTpU+x3<G
zpy1ooh1;@%c82g-uy)mjTvQC@3J@uJG<kcIYi6#`ot$(R>?p}cC)b=iTI9_msK?kz
zH$Ua&R6$v3Y2{56rL|?qZ@pqJKY&aszMFGvMm6&=G!EoEp?6^g$eD@uXI`=w-#@!?
zwema_R9Gg|fADpQ;*hAM+r-){Caw|ZmL*78_nbFG0dk7HsXZC(v8T!!S{HY`k!31P
zKX&6oyi4gn;am1LlmWV=jNhBeB&43tvyI*#>+R~hY?KpJ12Nj(6<4~5rx96;dOMUH
zzVN9Zj{-w-p0^pw+-W6~ZhX+cW+<!wD5KYQzkfnM<K3jg<MF#WI6Mjzc{U)p?ya4j
zBM&C#@<nAjy52z95e}W?y`f-`mSPY-iCA8alV0TiYjZnv?M2Ao({|&cdi6_-f>jEZ
zTPT#;BMO$&wLkZzQOT`xUI3dOJ2@@3#@~TDRF<6K|L+$A7T6A^t2i0|Kx3Kvy#e!2
z4jKTvaIX=E%Z3Ct<wv~7Y>Ulsu-LF&UUS3$x=}Qg)rs6Ub$>H%&&{uf!sT^Hwj5l$
zn1d~ft>POV%KE?Plj(J0IFeG7@SZgpjfzdaKI>=5@&8?iIj65j@`tp{=Xw}>=C-l5
zz;A5WxbkU>_Wce%xjRqHOb>q86UpV5Sc|^AtM&M`tzTWZhrF?3(h2V^ylz;2b?3N8
z05)v#onz(Z`9f0L75}9*U0sx?HI|nG8QDhHUFDJ|{NDWs3f$}{lQ-cf7f**{vuAMI
zl43q|wIBWQut|{3cxFQVaxMrTf}we|9#U#%wIGo^@3D9cVaShAG<U{{a_jMAMX8Jz
zkDR=c2VwK6dAky~H)x5ZEIK5qucyTJtzvCnb%AZvwQ<tvj6`0qU72es#t!WRxVUP~
zVOM44l6FM5c})vtjo-;ylKo#gzXvK<>2%^=dZnTJ?0Vdcj+<Ts$@FTzE^cL`@_Y#>
vSSn*q95puX<Wg{47+6o@DaksB``-2DH~t#=20Yz|RBf9*vFPoP#*P0U8xNV%

literal 0
HcmV?d00001

diff --git a/a4d-python/pyproject.toml b/a4d-python/pyproject.toml
new file mode 100644
index 0000000..d959a09
--- /dev/null
+++ b/a4d-python/pyproject.toml
@@ -0,0 +1,80 @@
+[project]
+name = "a4d"
+version = "2.0.0"
+description = "A4D Medical Tracker Data Processing Pipeline (Python)"
+readme = "README.md"
+requires-python = ">=3.11"
+authors = [
+    {name = "Michael Aydinbas", email = "michael.aydinbas@gmail.com"}
+]
+license = {text = "MIT"}
+
+dependencies = [
+    "polars>=0.20.0",
+    "duckdb>=0.10.0",
+    "pydantic>=2.6.0",
+    "pydantic-settings>=2.2.0",
+    "pandera[polars]>=0.18.0",
+    "loguru>=0.7.0",
+    "openpyxl>=3.1.0",
+    "google-cloud-bigquery>=3.17.0",
+    "google-cloud-storage>=2.14.0",
+    "pyyaml>=6.0",
+    "typer>=0.9.0",
+    "rich>=13.7.0",
+    "tqdm>=4.66.0",
+    "python-dateutil>=2.8.0",
+    "fastexcel>=0.16.0",
+]
+
+
+[dependency-groups]
+dev = [
+    "pre-commit>=4.3.0",
+    "pytest>=8.4.2",
+    "pytest-cov>=7.0.0",
+    "pytest-mock>=3.15.1",
+    "ruff>=0.14.1",
+    "ty>=0.0.1a23",
+]
+
+[project.scripts]
+a4d = "a4d.cli:main"
+
+[build-system]
+requires = ["hatchling"]
+build-backend = "hatchling.build"
+
+[tool.ruff]
+line-length = 100
+target-version = "py311"
+lint.select = [
+    "E",   # pycodestyle errors
+    "W",   # pycodestyle warnings
+    "F",   # pyflakes
+    "I",   # isort
+    "N",   # pep8-naming
+    "UP",  # pyupgrade
+    "B",   # flake8-bugbear
+    "A",   # flake8-builtins
+    "C4",  # flake8-comprehensions
+    "PT",  # flake8-pytest-style
+]
+
+[tool.ruff.lint.per-file-ignores]
+"__init__.py" = ["F401"]  # Allow unused imports in __init__.py
+
+[tool.pytest.ini_options]
+testpaths = ["tests"]
+python_files = ["test_*.py"]
+python_functions = ["test_*"]
+markers = [
+    "slow: marks tests as slow (deselected by default)",
+    "integration: marks tests as integration tests requiring real tracker files",
+    "e2e: marks tests as end-to-end tests (extraction + cleaning)",
+]
+addopts = [
+    "--cov=src/a4d",
+    "--cov-report=term-missing",
+    "--cov-report=html",
+]
diff --git a/a4d-python/scripts/analyze_logs.sql b/a4d-python/scripts/analyze_logs.sql
new file mode 100644
index 0000000..708cc72
--- /dev/null
+++ b/a4d-python/scripts/analyze_logs.sql
@@ -0,0 +1,74 @@
+-- analyze_logs.sql
+.mode box.timer on -- Summary Statistics
+SELECT
+    'Log Summary' as section;
+
+SELECT
+    COUNT(*) as total_logs,
+    COUNT(DISTINCT file_name) as unique_trackers,
+    MIN(timestamp) as earliest,
+    MAX(timestamp) as latest
+FROM
+    '/Volumes/USB SanDisk 3.2Gen1 Media/a4d/a4dphase2_upload/output_python/tables/table_logs.parquet';
+
+-- Level Distribution
+SELECT
+    'Level Distribution' as section;
+
+SELECT
+    level,
+    COUNT(*) as count
+FROM
+    '/Volumes/USB SanDisk 3.2Gen1 Media/a4d/a4dphase2_upload/output_python/tables/table_logs.parquet'
+GROUP BY
+    level
+ORDER BY
+    count DESC;
+
+-- Top Errors
+SELECT
+    'Top 10 Files with Most Errors' as section;
+
+SELECT
+    file_name,
+    COUNT(*) as issues
+FROM
+    '/Volumes/USB SanDisk 3.2Gen1 Media/a4d/a4dphase2_upload/output_python/tables/table_logs.parquet'
+WHERE
+    level = 'ERROR'
+GROUP BY
+    file_name
+ORDER BY
+    issues DESC
+LIMIT
+    10;
+
+SELECT
+    file_name,
+    COUNT(*) as issues
+FROM
+    '/Volumes/USB SanDisk 3.2Gen1 Media/a4d/a4dphase2_upload/output_python/tables/table_logs.parquet'
+WHERE
+    level = 'WARNING'
+GROUP BY
+    file_name
+ORDER BY
+    issues DESC
+LIMIT
+    10;
+
+-- Exception Summary
+SELECT
+    'Exception Types' as section;
+
+SELECT
+    exception_type,
+    COUNT(*) as count
+FROM
+    '/Volumes/USB SanDisk 3.2Gen1 Media/a4d/a4dphase2_upload/output_python/tables/table_logs.parquet'
+WHERE
+    has_exception = true
+GROUP BY
+    exception_type
+ORDER BY
+    count DESC;
\ No newline at end of file
diff --git a/a4d-python/scripts/check_sheets.py b/a4d-python/scripts/check_sheets.py
new file mode 100644
index 0000000..0037efb
--- /dev/null
+++ b/a4d-python/scripts/check_sheets.py
@@ -0,0 +1,79 @@
+#!/usr/bin/env python3
+"""Check which sheets are being processed by R vs Python."""
+
+from pathlib import Path
+
+import polars as pl
+
+
+def check_sheets():
+    """Compare which sheets were processed."""
+
+    r_file = Path("output/patient_data_raw/R/2024_Sibu Hospital A4D Tracker_patient_raw.parquet")
+    python_file = Path(
+        "output/patient_data_raw/Python/2024_Sibu Hospital A4D Tracker_patient_raw.parquet"
+    )
+
+    df_r = pl.read_parquet(r_file)
+    df_python = pl.read_parquet(python_file)
+
+    print("=" * 80)
+    print("SHEET ANALYSIS")
+    print("=" * 80)
+
+    # R sheets
+    r_sheets = df_r["sheet_name"].unique().sort().to_list()
+    r_counts = df_r.group_by("sheet_name").count().sort("sheet_name")
+
+    print("\nR PIPELINE:")
+    print(f"Total rows: {len(df_r)}")
+    print(f"Sheets: {r_sheets}")
+    print("\nRow counts per sheet:")
+    print(r_counts)
+
+    # Python sheets
+    py_sheets = df_python["sheet_name"].unique().sort().to_list()
+    py_counts = df_python.group_by("sheet_name").count().sort("sheet_name")
+
+    print("\n" + "=" * 80)
+    print("PYTHON PIPELINE:")
+    print(f"Total rows: {len(df_python)}")
+    print(f"Sheets: {py_sheets}")
+    print("\nRow counts per sheet:")
+    print(py_counts)
+
+    # Compare
+    print("\n" + "=" * 80)
+    print("COMPARISON")
+    print("=" * 80)
+
+    r_set = set(r_sheets)
+    py_set = set(py_sheets)
+
+    only_r = r_set - py_set
+    only_py = py_set - r_set
+    common = r_set & py_set
+
+    print(f"\nCommon sheets ({len(common)}): {sorted(common)}")
+    if only_r:
+        print(f"Only in R ({len(only_r)}): {sorted(only_r)}")
+    if only_py:
+        print(f"Only in Python ({len(only_py)}): {sorted(only_py)}")
+
+    # Check month order
+    print("\n" + "=" * 80)
+    print("MONTH ORDER CHECK")
+    print("=" * 80)
+
+    r_months = df_r.select(["sheet_name", "tracker_month"]).unique().sort("sheet_name")
+    py_months = df_python.select(["sheet_name", "tracker_month"]).unique().sort("sheet_name")
+
+    print("\nR month mapping:")
+    print(r_months)
+
+    print("\nPython month mapping:")
+    print(py_months)
+
+
+if __name__ == "__main__":
+    check_sheets()
diff --git a/a4d-python/scripts/compare_r_vs_python.py b/a4d-python/scripts/compare_r_vs_python.py
new file mode 100644
index 0000000..43e6a8b
--- /dev/null
+++ b/a4d-python/scripts/compare_r_vs_python.py
@@ -0,0 +1,530 @@
+#!/usr/bin/env python3
+"""Compare R vs Python cleaned parquet outputs for migration validation.
+
+This script performs detailed comparison of cleaned patient data from
+R and Python pipelines to verify the migration produces equivalent results.
+
+Usage:
+    uv run python scripts/compare_r_vs_python.py \
+        --file "2018_CDA A4D Tracker_patient_cleaned.parquet"
+    uv run python scripts/compare_r_vs_python.py \
+        -f "2018_CDA A4D Tracker_patient_cleaned.parquet"
+"""
+
+from pathlib import Path
+
+import polars as pl
+import typer
+from rich import box
+from rich.console import Console
+from rich.panel import Panel
+from rich.table import Table
+
+console = Console()
+app = typer.Typer()
+
+# Fixed base directories for R and Python outputs
+R_OUTPUT_BASE = Path("/Volumes/USB SanDisk 3.2Gen1 Media/a4d/output_r/patient_data_cleaned")
+PYTHON_OUTPUT_BASE = Path(
+    "/Volumes/USB SanDisk 3.2Gen1 Media/a4d/output_python/patient_data_cleaned"
+)
+
+
+def display_basic_stats(r_df: pl.DataFrame, py_df: pl.DataFrame, file_name: str):
+    """Display basic statistics about both datasets."""
+    console.print(Panel(f"[bold]Comparing: {file_name}[/bold]", expand=False))
+
+    stats_table = Table(title="Basic Statistics", box=box.ROUNDED)
+    stats_table.add_column("Metric", style="cyan")
+    stats_table.add_column("R Output", style="white", justify="right")
+    stats_table.add_column("Python Output", style="white", justify="right")
+    stats_table.add_column("Difference", justify="right")
+
+    # Record counts
+    r_count = len(r_df)
+    py_count = len(py_df)
+    diff_count = py_count - r_count
+    diff_pct = (diff_count / r_count * 100) if r_count > 0 else 0
+    diff_style = "green" if diff_count == 0 else "yellow" if abs(diff_pct) < 5 else "red"
+
+    stats_table.add_row(
+        "Records",
+        f"{r_count:,}",
+        f"{py_count:,}",
+        f"[{diff_style}]{diff_count:+,} ({diff_pct:+.1f}%)[/{diff_style}]",
+    )
+
+    # Column counts
+    r_cols = len(r_df.columns)
+    py_cols = len(py_df.columns)
+    col_diff = py_cols - r_cols
+    col_style = "green" if col_diff == 0 else "yellow"
+
+    stats_table.add_row(
+        "Columns", f"{r_cols:,}", f"{py_cols:,}", f"[{col_style}]{col_diff:+,}[/{col_style}]"
+    )
+
+    console.print(stats_table)
+    console.print()
+
+
+def compare_schemas(r_df: pl.DataFrame, py_df: pl.DataFrame):
+    """Compare column schemas between R and Python outputs."""
+    console.print(Panel("[bold]Schema Comparison[/bold]", expand=False))
+
+    r_cols = set(r_df.columns)
+    py_cols = set(py_df.columns)
+    common_cols = sorted(r_cols & py_cols)
+    only_r = sorted(r_cols - py_cols)
+    only_py = sorted(py_cols - r_cols)
+
+    # Summary
+    summary_table = Table(title="Column Summary", box=box.ROUNDED)
+    summary_table.add_column("Category", style="cyan")
+    summary_table.add_column("Count", justify="right", style="magenta")
+
+    summary_table.add_row("Common columns", f"{len(common_cols):,}")
+    summary_table.add_row("Only in R", f"{len(only_r):,}")
+    summary_table.add_row("Only in Python", f"{len(only_py):,}")
+
+    console.print(summary_table)
+    console.print()
+
+    # Columns only in R
+    if only_r:
+        console.print("[red]Columns missing in Python output:[/red]")
+        for col in only_r[:20]:  # Limit to first 20
+            r_type = str(r_df[col].dtype)
+            null_count = r_df[col].is_null().sum()
+            null_pct = (null_count / len(r_df)) * 100
+            console.print(f"  • {col:40s} ({r_type:15s}, {null_pct:.1f}% null)")
+        if len(only_r) > 20:
+            console.print(f"  [dim]... and {len(only_r) - 20} more columns[/dim]")
+        console.print()
+
+    # Columns only in Python
+    if only_py:
+        console.print("[yellow]Extra columns in Python output:[/yellow]")
+        for col in only_py[:20]:
+            py_type = str(py_df[col].dtype)
+            null_count = py_df[col].is_null().sum()
+            null_pct = (null_count / len(py_df)) * 100
+            console.print(f"  • {col:40s} ({py_type:15s}, {null_pct:.1f}% null)")
+        if len(only_py) > 20:
+            console.print(f"  [dim]... and {len(only_py) - 20} more columns[/dim]")
+        console.print()
+
+    # Type mismatches for common columns
+    type_mismatches = []
+    for col in common_cols:
+        r_type = str(r_df[col].dtype)
+        py_type = str(py_df[col].dtype)
+        if r_type != py_type:
+            type_mismatches.append((col, r_type, py_type))
+
+    if type_mismatches:
+        console.print("[yellow]Data type mismatches:[/yellow]")
+        type_table = Table(box=box.SIMPLE)
+        type_table.add_column("Column", style="cyan")
+        type_table.add_column("R Type", style="white")
+        type_table.add_column("Python Type", style="white")
+
+        for col, r_type, py_type in type_mismatches[:20]:
+            type_table.add_row(col, r_type, py_type)
+
+        console.print(type_table)
+        if len(type_mismatches) > 20:
+            console.print(f"  [dim]... and {len(type_mismatches) - 20} more mismatches[/dim]")
+        console.print()
+    else:
+        console.print("[green]✓ All data types match for common columns[/green]\n")
+
+
+def compare_metadata_fields(r_df: pl.DataFrame, py_df: pl.DataFrame):
+    """Compare critical metadata fields."""
+    console.print(Panel("[bold]Metadata Fields Comparison[/bold]", expand=False))
+
+    # Key metadata fields that must be identical
+    metadata_fields = [
+        "tracker_year",
+        "tracker_month",
+        "tracker_date",
+        "file_name",
+        "sheet_name",
+        "patient_id",
+    ]
+
+    existing_fields = [f for f in metadata_fields if f in r_df.columns and f in py_df.columns]
+
+    if not existing_fields:
+        console.print("[yellow]No common metadata fields found to compare[/yellow]\n")
+        return
+
+    for field in existing_fields:
+        console.print(f"[bold cyan]{field}:[/bold cyan]")
+
+        r_unique = r_df[field].unique().sort()
+        py_unique = py_df[field].unique().sort()
+
+        if r_unique.equals(py_unique):
+            console.print(f"  [green]✓ Match ({len(r_unique):,} unique values)[/green]")
+            # Show sample
+            sample = r_unique.head(3).to_list()
+            console.print(f"    Sample: {sample}")
+        else:
+            console.print("  [red]✗ Mismatch![/red]")
+            console.print(f"    R has {len(r_unique):,} unique values")
+            console.print(f"    Python has {len(py_unique):,} unique values")
+
+            r_set = set(r_unique.to_list())
+            py_set = set(py_unique.to_list())
+
+            only_r = r_set - py_set
+            only_py = py_set - r_set
+
+            if only_r:
+                console.print(f"    [yellow]Only in R:[/yellow] {list(only_r)[:5]}")
+            if only_py:
+                console.print(f"    [yellow]Only in Python:[/yellow] {list(only_py)[:5]}")
+
+        console.print()
+
+
+def compare_patient_records(r_df: pl.DataFrame, py_df: pl.DataFrame, n_samples: int = 5):
+    """Compare sample patient records in detail."""
+    console.print(Panel(f"[bold]Sample Patient Records (first {n_samples})[/bold]", expand=False))
+
+    if "patient_id" not in r_df.columns or "patient_id" not in py_df.columns:
+        console.print("[yellow]Cannot compare records: patient_id column missing[/yellow]\n")
+        return
+
+    # Get first n patient_ids from R
+    sample_ids = r_df["patient_id"].head(n_samples).to_list()
+
+    for idx, patient_id in enumerate(sample_ids, 1):
+        console.print(f"\n[bold]Patient {idx}:[/bold] {patient_id}")
+
+        py_records = py_df.filter(pl.col("patient_id") == patient_id)
+
+        if len(py_records) == 0:
+            console.print("[red]  ✗ Not found in Python output![/red]")
+            continue
+        elif len(py_records) > 1:
+            console.print(f"[yellow]  ⚠ Multiple records in Python ({len(py_records)})[/yellow]")
+
+        # Compare key fields
+        r_record = r_df.filter(pl.col("patient_id") == patient_id).head(1).to_dicts()[0]
+        py_record = py_records.head(1).to_dicts()[0]
+
+        comparison_fields = [
+            "tracker_year",
+            "tracker_month",
+            "tracker_date",
+            "sheet_name",
+            "sex",
+            "age",
+            "dob",
+            "status",
+            "province",
+        ]
+
+        comp_table = Table(box=box.SIMPLE, show_header=False)
+        comp_table.add_column("Field", style="cyan", width=20)
+        comp_table.add_column("R", style="white", width=25)
+        comp_table.add_column("Python", style="white", width=25)
+        comp_table.add_column("", justify="center", width=3)
+
+        for field in comparison_fields:
+            if field in r_record and field in py_record:
+                r_val = r_record[field]
+                py_val = py_record[field]
+                match = "✓" if r_val == py_val else "✗"
+                match_style = "green" if match == "✓" else "red"
+
+                comp_table.add_row(
+                    field,
+                    str(r_val)[:25],
+                    str(py_val)[:25],
+                    f"[{match_style}]{match}[/{match_style}]",
+                )
+
+        console.print(comp_table)
+
+    console.print()
+
+
+def find_value_mismatches(r_df: pl.DataFrame, py_df: pl.DataFrame):
+    """Find all value differences for common records."""
+    console.print(Panel("[bold]Value Mismatches Analysis[/bold]", expand=False))
+
+    if "patient_id" not in r_df.columns or "patient_id" not in py_df.columns:
+        console.print("[yellow]Cannot analyze values: patient_id column missing[/yellow]\n")
+        return
+
+    # Join on patient_id + sheet_name to match same month records
+    # (patients can have multiple records across different months)
+    join_keys = ["patient_id", "sheet_name"]
+    if not all(key in r_df.columns and key in py_df.columns for key in join_keys):
+        console.print(f"[yellow]Cannot analyze values: missing join keys {join_keys}[/yellow]\n")
+        return
+
+    try:
+        joined = r_df.join(py_df, on=join_keys, how="inner", suffix="_py")
+        console.print(
+            f"[cyan]Analyzing {len(joined):,} common records "
+            f"(matched on {'+'.join(join_keys)})[/cyan]\n"
+        )
+    except Exception as e:
+        console.print(f"[red]Error joining datasets: {e}[/red]\n")
+        return
+
+    # Find columns in both datasets (excluding join keys)
+    common_cols = set(r_df.columns) & set(py_df.columns) - set(join_keys)
+
+    mismatches = {}
+
+    # Tolerance for floating point comparisons
+    # Use relative tolerance of 1e-9 (about 9 decimal places)
+    float_rel_tol = 1e-9
+    float_abs_tol = 1e-12
+
+    for col in sorted(common_cols):
+        col_py = f"{col}_py"
+        if col in joined.columns and col_py in joined.columns:
+            try:
+                # Check if column is numeric (float or int)
+                col_dtype = joined[col].dtype
+                is_numeric = col_dtype in [
+                    pl.Float32,
+                    pl.Float64,
+                    pl.Int8,
+                    pl.Int16,
+                    pl.Int32,
+                    pl.Int64,
+                    pl.UInt8,
+                    pl.UInt16,
+                    pl.UInt32,
+                    pl.UInt64,
+                ]
+
+                if is_numeric:
+                    # For numeric columns, use approximate comparison
+                    # Two values are equal if:
+                    # |a - b| <= max(rel_tol * max(|a|, |b|), abs_tol)
+
+                    # Add columns for comparison logic
+                    comparison_df = joined.with_columns(
+                        [
+                            # Calculate absolute difference
+                            ((pl.col(col) - pl.col(col_py)).abs()).alias("_abs_diff"),
+                            # Calculate tolerance threshold
+                            pl.max_horizontal(
+                                [
+                                    float_rel_tol
+                                    * pl.max_horizontal([pl.col(col).abs(), pl.col(col_py).abs()]),
+                                    pl.lit(float_abs_tol),
+                                ]
+                            ).alias("_tolerance"),
+                            # Check null status
+                            pl.col(col).is_null().alias("_col_null"),
+                            pl.col(col_py).is_null().alias("_col_py_null"),
+                        ]
+                    )
+
+                    # Find mismatches
+                    # Mismatch if: (1) null status differs OR
+                    # (2) both not null and differ by more than tolerance
+                    mismatched_rows = comparison_df.filter(
+                        (pl.col("_col_null") != pl.col("_col_py_null"))  # Null mismatch
+                        | (
+                            (~pl.col("_col_null")) & (pl.col("_abs_diff") > pl.col("_tolerance"))
+                        )  # Value mismatch
+                    )
+                else:
+                    # For non-numeric columns, use exact comparison
+                    mismatched_rows = joined.filter(pl.col(col) != pl.col(col_py))
+
+                mismatch_count = len(mismatched_rows)
+
+                if mismatch_count > 0:
+                    mismatch_pct = (mismatch_count / len(joined)) * 100
+                    # Include patient_id and sheet_name in examples for debugging
+                    examples_with_ids = mismatched_rows.select(
+                        ["patient_id", "sheet_name", col, col_py]
+                    )
+                    mismatches[col] = {
+                        "count": mismatch_count,
+                        "percentage": mismatch_pct,
+                        "examples": mismatched_rows.select([col, col_py]).head(3),
+                        "examples_with_ids": examples_with_ids,
+                    }
+            except Exception as e:
+                # Some columns might not support comparison
+                console.print(f"[dim]Skipped column '{col}': {e}[/dim]")
+                pass
+
+    if mismatches:
+        mismatch_table = Table(title="Value Mismatches for Common Records", box=box.ROUNDED)
+        mismatch_table.add_column("Column", style="cyan")
+        mismatch_table.add_column("Mismatches", justify="right", style="red")
+        mismatch_table.add_column("%", justify="right")
+        mismatch_table.add_column("Priority", justify="center")
+
+        for col, stats in sorted(
+            mismatches.items(), key=lambda x: x[1]["percentage"], reverse=True
+        ):
+            # Determine priority
+            if col in [
+                "patient_id",
+                "tracker_year",
+                "tracker_month",
+                "tracker_date",
+                "file_name",
+                "sheet_name",
+            ]:
+                priority = "[red]HIGH[/red]"
+            elif stats["percentage"] > 10:
+                priority = "[yellow]MEDIUM[/yellow]"
+            else:
+                priority = "[dim]LOW[/dim]"
+
+            mismatch_table.add_row(
+                col, f"{stats['count']:,}", f"{stats['percentage']:.1f}%", priority
+            )
+
+        console.print(mismatch_table)
+
+        # Show ALL mismatched columns with patient_id and sheet_name
+        console.print("\n[bold]Detailed Mismatches (showing ALL errors):[/bold]")
+        for col, stats in sorted(
+            mismatches.items(), key=lambda x: x[1]["percentage"], reverse=True
+        ):
+            console.print(
+                f"\n[bold cyan]{col}:[/bold cyan] "
+                f"{stats['count']} mismatches ({stats['percentage']:.1f}%)"
+            )
+            # Include patient_id and sheet_name in examples
+            examples_with_ids = stats["examples_with_ids"]
+            console.print(examples_with_ids)
+
+    else:
+        console.print("[green]✓ All values match for common records![/green]")
+
+    console.print()
+
+
+def display_summary(r_df: pl.DataFrame, py_df: pl.DataFrame):
+    """Display final summary with actionable insights."""
+    console.print(Panel("[bold]Summary & Recommendations[/bold]", expand=False))
+
+    r_count = len(r_df)
+    py_count = len(py_df)
+    record_match = r_count == py_count
+
+    r_cols = set(r_df.columns)
+    py_cols = set(py_df.columns)
+    schema_match = r_cols == py_cols
+
+    summary_table = Table(box=box.ROUNDED)
+    summary_table.add_column("Check", style="cyan")
+    summary_table.add_column("Status", justify="center")
+    summary_table.add_column("Details")
+
+    # Record counts
+    record_icon = "[green]✓[/green]" if record_match else "[red]✗[/red]"
+    record_detail = (
+        f"Both have {r_count:,} records"
+        if record_match
+        else f"R: {r_count:,}, Python: {py_count:,}"
+    )
+    summary_table.add_row("Record counts", record_icon, record_detail)
+
+    # Schema
+    schema_icon = "[green]✓[/green]" if schema_match else "[yellow]⚠[/yellow]"
+    schema_detail = (
+        f"Both have {len(r_cols)} columns"
+        if schema_match
+        else f"R: {len(r_cols)}, Python: {len(py_cols)}"
+    )
+    summary_table.add_row("Schema match", schema_icon, schema_detail)
+
+    console.print(summary_table)
+    console.print()
+
+    # Recommendations
+    if not record_match or not schema_match:
+        console.print("[bold]Recommendations:[/bold]")
+        if not record_match:
+            console.print("  1. [yellow]Investigate record count differences[/yellow]")
+            console.print("     - Check data filtering logic")
+            console.print("     - Review cleaning validation rules")
+        if not schema_match:
+            console.print("  2. [yellow]Review schema differences[/yellow]")
+            console.print("     - Ensure all R columns are mapped in Python")
+            console.print("     - Validate extra Python columns are intentional")
+    else:
+        console.print("[green]✓ Basic validation passed! Record counts and schemas match.[/green]")
+        console.print("[dim]Review value mismatches above to ensure data quality.[/dim]")
+
+    console.print()
+
+
+@app.command()
+def compare(
+    file_name: str = typer.Option(
+        ...,
+        "--file",
+        "-f",
+        help="Parquet filename (e.g., '2018_CDA A4D Tracker_patient_cleaned.parquet')",
+    ),
+):
+    """Compare R vs Python cleaned patient data outputs.
+
+    The script looks for the file in fixed base directories:
+    - R output: /Volumes/USB SanDisk 3.2Gen1 Media/a4d/output_r/patient_data_cleaned/
+    - Python output: /Volumes/USB SanDisk 3.2Gen1 Media/a4d/output_python/patient_data_cleaned/
+    """
+
+    console.print("\n[bold blue]A4D Migration Validation: R vs Python Comparison[/bold blue]\n")
+
+    # Construct full paths
+    r_parquet = R_OUTPUT_BASE / file_name
+    python_parquet = PYTHON_OUTPUT_BASE / file_name
+
+    console.print(f"[dim]R path: {r_parquet}[/dim]")
+    console.print(f"[dim]Python path: {python_parquet}[/dim]")
+    console.print()
+
+    # Read data
+    console.print("[bold]Loading data...[/bold]")
+
+    try:
+        r_df = pl.read_parquet(r_parquet)
+        console.print(f"  ✓ R output: {len(r_df):,} records, {len(r_df.columns)} columns")
+    except Exception as e:
+        console.print(f"[red]  ✗ Failed to read R parquet: {e}[/red]")
+        raise typer.Exit(1) from e
+
+    try:
+        py_df = pl.read_parquet(python_parquet)
+        console.print(f"  ✓ Python output: {len(py_df):,} records, {len(py_df.columns)} columns")
+    except Exception as e:
+        console.print(f"[red]  ✗ Failed to read Python parquet: {e}[/red]")
+        raise typer.Exit(1) from e
+
+    console.print()
+
+    # Run comparisons
+    display_basic_stats(r_df, py_df, file_name)
+    compare_schemas(r_df, py_df)
+    compare_metadata_fields(r_df, py_df)
+    compare_patient_records(r_df, py_df, n_samples=3)
+    find_value_mismatches(r_df, py_df)
+    display_summary(r_df, py_df)
+
+    console.print(Panel("[bold green]Comparison Complete[/bold green]", expand=False))
+    console.print()
+
+
+if __name__ == "__main__":
+    app()
diff --git a/a4d-python/scripts/export_single_tracker.py b/a4d-python/scripts/export_single_tracker.py
new file mode 100644
index 0000000..7fda054
--- /dev/null
+++ b/a4d-python/scripts/export_single_tracker.py
@@ -0,0 +1,55 @@
+#!/usr/bin/env python3
+"""Export a single tracker for comparison with R pipeline output.
+
+Usage:
+    uv run python scripts/export_single_tracker.py <tracker_file> <output_dir>
+
+Example:
+    uv run python scripts/export_single_tracker.py \\
+        "/Volumes/USB SanDisk 3.2Gen1 Media/A4D/data/\\
+        a4dphase2_upload/Malaysia/SBU/\\
+        2024_Sibu Hospital A4D Tracker.xlsx" \\
+        output/patient_data_raw
+"""
+
+import sys
+from pathlib import Path
+
+from loguru import logger
+
+from a4d.extract.patient import export_patient_raw, read_all_patient_sheets
+
+
+def main():
+    """Extract and export a single tracker."""
+    if len(sys.argv) != 3:
+        print(__doc__)
+        sys.exit(1)
+
+    tracker_file = Path(sys.argv[1])
+    output_dir = Path(sys.argv[2])
+
+    if not tracker_file.exists():
+        logger.error(f"Tracker file not found: {tracker_file}")
+        sys.exit(1)
+
+    logger.info(f"Extracting patient data from: {tracker_file}")
+    logger.info(f"Output directory: {output_dir}")
+
+    # Extract patient data
+    df = read_all_patient_sheets(tracker_file)
+    logger.info(f"Extracted {len(df)} rows from {tracker_file.name}")
+
+    # Export to parquet
+    output_path = export_patient_raw(df, tracker_file, output_dir)
+    logger.success(f"✓ Successfully exported to: {output_path}")
+
+    # Summary
+    unique_months = df["tracker_month"].unique().to_list()
+    logger.info(f"Summary: {len(df)} patients across {len(unique_months)} months")
+    logger.info(f"Clinic ID: {df['clinic_id'][0]}")
+    logger.info(f"Tracker year: {df['tracker_year'][0]}")
+
+
+if __name__ == "__main__":
+    main()
diff --git a/a4d-python/scripts/profile_extraction.py b/a4d-python/scripts/profile_extraction.py
new file mode 100644
index 0000000..8c58e8e
--- /dev/null
+++ b/a4d-python/scripts/profile_extraction.py
@@ -0,0 +1,77 @@
+"""Profile patient data extraction to identify performance bottlenecks."""
+
+import cProfile
+import pstats
+from pathlib import Path
+from pstats import SortKey
+
+from a4d.extract.patient import extract_patient_data
+
+# Test with both 2019 and 2024 trackers
+TRACKER_2024 = Path(
+    "/Volumes/USB SanDisk 3.2Gen1 Media/A4D/data/a4dphase2_upload/"
+    "Malaysia/SBU/2024_Sibu Hospital A4D Tracker.xlsx"
+)
+TRACKER_2019 = Path(
+    "/Volumes/USB SanDisk 3.2Gen1 Media/A4D/data/a4dphase2_upload/"
+    "Malaysia/PNG/2019_Penang General Hospital A4D Tracker_DC.xlsx"
+)
+
+
+def profile_extraction():
+    """Run extraction with profiling."""
+    print("=" * 80)
+    print("Profiling 2024 tracker (Jan24)")
+    print("=" * 80)
+
+    profiler_2024 = cProfile.Profile()
+    profiler_2024.enable()
+
+    df_2024 = extract_patient_data(TRACKER_2024, "Jan24", 2024)
+
+    profiler_2024.disable()
+
+    print(f"\nExtracted: {len(df_2024)} rows × {len(df_2024.columns)} columns")
+    print("\nTop 20 functions by cumulative time:")
+    print("-" * 80)
+
+    stats_2024 = pstats.Stats(profiler_2024)
+    stats_2024.strip_dirs()
+    stats_2024.sort_stats(SortKey.CUMULATIVE)
+    stats_2024.print_stats(20)
+
+    print("\n" + "=" * 80)
+    print("Profiling 2019 tracker (Feb19 - largest sheet)")
+    print("=" * 80)
+
+    profiler_2019 = cProfile.Profile()
+    profiler_2019.enable()
+
+    df_2019 = extract_patient_data(TRACKER_2019, "Feb19", 2019)
+
+    profiler_2019.disable()
+
+    print(f"\nExtracted: {len(df_2019)} rows × {len(df_2019.columns)} columns")
+    print("\nTop 20 functions by cumulative time:")
+    print("-" * 80)
+
+    stats_2019 = pstats.Stats(profiler_2019)
+    stats_2019.strip_dirs()
+    stats_2019.sort_stats(SortKey.CUMULATIVE)
+    stats_2019.print_stats(20)
+
+    # Save detailed stats to file
+    output_dir = Path(__file__).parent.parent / "profiling"
+    output_dir.mkdir(exist_ok=True)
+
+    stats_2024.dump_stats(output_dir / "extraction_2024.prof")
+    stats_2019.dump_stats(output_dir / "extraction_2019.prof")
+
+    print("\n" + "=" * 80)
+    print(f"Detailed profiling data saved to {output_dir}/")
+    print("View with: python -m pstats profiling/extraction_2024.prof")
+    print("=" * 80)
+
+
+if __name__ == "__main__":
+    profile_extraction()
diff --git a/a4d-python/scripts/profile_extraction_detailed.py b/a4d-python/scripts/profile_extraction_detailed.py
new file mode 100644
index 0000000..c8d0148
--- /dev/null
+++ b/a4d-python/scripts/profile_extraction_detailed.py
@@ -0,0 +1,193 @@
+"""Detailed timing breakdown of extraction phases."""
+
+import time
+from pathlib import Path
+
+from openpyxl import load_workbook
+
+TRACKER_2024 = Path(
+    "/Volumes/USB SanDisk 3.2Gen1 Media/A4D/data/a4dphase2_upload/"
+    "Malaysia/SBU/2024_Sibu Hospital A4D Tracker.xlsx"
+)
+TRACKER_2019 = Path(
+    "/Volumes/USB SanDisk 3.2Gen1 Media/A4D/data/a4dphase2_upload/"
+    "Malaysia/PNG/2019_Penang General Hospital A4D Tracker_DC.xlsx"
+)
+
+
+def profile_extraction_phases(tracker_file, sheet_name, year):
+    """Profile each phase of extraction separately.
+
+    NOTE: This is the OPTIMIZED single-pass version that matches the current implementation.
+    """
+    print(f"\n{'=' * 80}")
+    print(f"Profiling: {tracker_file.name} - {sheet_name}")
+    print("=" * 80)
+
+    timings = {}
+
+    # Phase 1: Load workbook (read-only for optimal performance)
+    t0 = time.perf_counter()
+    wb = load_workbook(
+        tracker_file,
+        read_only=True,
+        data_only=True,
+        keep_vba=False,
+        keep_links=False,
+    )
+    ws = wb[sheet_name]
+    t1 = time.perf_counter()
+    timings["1. Load workbook (read-only)"] = t1 - t0
+
+    # Phase 2: Find data start row
+    t0 = time.perf_counter()
+    data_start_row = None
+    for row_idx, (cell_value,) in enumerate(
+        ws.iter_rows(min_col=1, max_col=1, values_only=True), start=1
+    ):
+        if cell_value is not None:
+            data_start_row = row_idx
+            break
+    t1 = time.perf_counter()
+    timings["2. Find data start row"] = t1 - t0
+
+    # Phase 3: Read headers
+    t0 = time.perf_counter()
+    header_row_1 = data_start_row - 1
+    header_row_2 = data_start_row - 2
+
+    max_cols = 100
+    header_1_raw = list(
+        ws.iter_rows(
+            min_row=header_row_1,
+            max_row=header_row_1,
+            min_col=1,
+            max_col=max_cols,
+            values_only=True,
+        )
+    )[0]
+    header_2_raw = list(
+        ws.iter_rows(
+            min_row=header_row_2,
+            max_row=header_row_2,
+            min_col=1,
+            max_col=max_cols,
+            values_only=True,
+        )
+    )[0]
+
+    # Trim to actual width
+    last_col = max_cols
+    for i in range(len(header_1_raw) - 1, -1, -1):
+        if header_1_raw[i] is not None or header_2_raw[i] is not None:
+            last_col = i + 1
+            break
+
+    header_1 = list(header_1_raw[:last_col])
+    header_2 = list(header_2_raw[:last_col])
+    t1 = time.perf_counter()
+    timings["3. Read headers"] = t1 - t0
+
+    # Phase 4: Merge headers with forward-fill logic
+    t0 = time.perf_counter()
+    import re
+
+    headers = []
+    prev_h2 = None  # Track previous h2 for horizontal merges
+
+    for h1, h2 in zip(header_1, header_2, strict=True):
+        if h1 and h2:
+            headers.append(f"{h2} {h1}".strip())
+            prev_h2 = h2
+        elif h2:
+            headers.append(str(h2).strip())
+            prev_h2 = h2
+        elif h1:
+            if prev_h2:
+                # Horizontally merged cell: fill forward
+                headers.append(f"{prev_h2} {h1}".strip())
+            else:
+                headers.append(str(h1).strip())
+        else:
+            headers.append(None)
+            prev_h2 = None
+
+    headers = [re.sub(r"\s+", " ", h.replace("\n", " ")) if h else None for h in headers]
+    t1 = time.perf_counter()
+    timings["4. Merge headers"] = t1 - t0
+
+    # Phase 5: Read data rows
+    t0 = time.perf_counter()
+    data = []
+    for row in ws.iter_rows(
+        min_row=data_start_row,
+        max_row=ws.max_row,
+        min_col=1,
+        max_col=len(headers),
+        values_only=True,
+    ):
+        if all(cell is None for cell in row):
+            break
+        if row[0] is None:
+            continue
+        data.append(row)
+    t1 = time.perf_counter()
+    timings["5. Read data rows"] = t1 - t0
+
+    # Phase 6: Close workbook
+    t0 = time.perf_counter()
+    wb.close()
+    t1 = time.perf_counter()
+    timings["6. Close workbook"] = t1 - t0
+
+    # Phase 7: Build DataFrame
+    t0 = time.perf_counter()
+    import polars as pl
+
+    valid_cols = [(i, h) for i, h in enumerate(headers) if h]
+    valid_indices = [i for i, _ in valid_cols]
+    valid_headers = [h for _, h in valid_cols]
+    filtered_data = [[row[i] for i in valid_indices] for row in data]
+
+    df = pl.DataFrame(
+        {
+            header: [str(row[i]) if row[i] is not None else None for row in filtered_data]
+            for i, header in enumerate(valid_headers)
+        }
+    )
+    t1 = time.perf_counter()
+    timings["7. Build Polars DataFrame"] = t1 - t0
+
+    # Print results
+    total_time = sum(timings.values())
+    print(f"\nExtracted: {len(df)} rows × {len(df.columns)} columns")
+    print(f"Total time: {total_time:.3f}s\n")
+    print(f"{'Phase':<40} {'Time (s)':<12} {'% of Total':<12}")
+    print("-" * 64)
+
+    for phase, duration in timings.items():
+        pct = (duration / total_time) * 100
+        print(f"{phase:<40} {duration:>10.3f}s  {pct:>10.1f}%")
+
+    return timings, total_time
+
+
+if __name__ == "__main__":
+    # Test 2024 tracker
+    timings_2024, total_2024 = profile_extraction_phases(TRACKER_2024, "Jan24", 2024)
+
+    # Test 2019 tracker
+    timings_2019, total_2019 = profile_extraction_phases(TRACKER_2019, "Feb19", 2019)
+
+    print("\n" + "=" * 80)
+    print("SUMMARY")
+    print("=" * 80)
+    print(f"2024 tracker total: {total_2024:.3f}s")
+    print(f"2019 tracker total: {total_2019:.3f}s")
+    print("\nSlowest phases across both trackers:")
+    all_timings = {}
+    for phase in timings_2024:
+        all_timings[phase] = (timings_2024[phase] + timings_2019[phase]) / 2
+
+    for phase, avg_time in sorted(all_timings.items(), key=lambda x: x[1], reverse=True)[:5]:
+        print(f"  {phase:<40} avg: {avg_time:.3f}s")
diff --git a/a4d-python/scripts/reprocess_tracker.py b/a4d-python/scripts/reprocess_tracker.py
new file mode 100644
index 0000000..dfd3f3b
--- /dev/null
+++ b/a4d-python/scripts/reprocess_tracker.py
@@ -0,0 +1,16 @@
+#!/usr/bin/env python3
+"""Quick script to re-process a single tracker."""
+
+from pathlib import Path
+
+from a4d.pipeline.tracker import process_tracker_patient
+
+tracker_file = Path(
+    "/Volumes/USB SanDisk 3.2Gen1 Media/a4d/a4dphase2_upload/Cambodia/CDA/2025_06_CDA A4D Tracker.xlsx"  # noqa: E501
+)
+output_root = Path("/Volumes/USB SanDisk 3.2Gen1 Media/a4d/output_python")
+
+result = process_tracker_patient(tracker_file, output_root)
+print(f"Success: {result.success}")
+print(f"Cleaned output: {result.cleaned_output}")
+print(f"Cleaning errors: {result.cleaning_errors}")
diff --git a/a4d-python/scripts/test_cleaning.py b/a4d-python/scripts/test_cleaning.py
new file mode 100644
index 0000000..118c83c
--- /dev/null
+++ b/a4d-python/scripts/test_cleaning.py
@@ -0,0 +1,87 @@
+#!/usr/bin/env python3
+"""Test cleaning pipeline on Sibu Hospital 2024 tracker."""
+
+from pathlib import Path
+
+import polars as pl
+
+from a4d.clean.patient import clean_patient_data
+from a4d.errors import ErrorCollector
+
+
+def test_cleaning():
+    """Test cleaning on real tracker data."""
+
+    # Read the raw parquet we generated in Phase 2
+    raw_path = Path(
+        "output/patient_data_raw/Python/2024_Sibu Hospital A4D Tracker_patient_raw.parquet"
+    )
+
+    if not raw_path.exists():
+        print(f"❌ Raw parquet not found: {raw_path}")
+        print("Please run patient extraction first")
+        return
+
+    print("=" * 80)
+    print("CLEANING TEST - Sibu Hospital 2024")
+    print("=" * 80)
+
+    # Read raw data
+    df_raw = pl.read_parquet(raw_path)
+    print("\n📥 Raw data loaded:")
+    print(f"   Rows: {len(df_raw)}")
+    print(f"   Columns: {len(df_raw.columns)}")
+    print(f"   Columns: {df_raw.columns[:10]}...")
+
+    # Create error collector
+    collector = ErrorCollector()
+
+    # Clean data
+    print("\n🧹 Cleaning data...")
+    df_clean = clean_patient_data(df_raw, collector)
+
+    print("\n📤 Cleaned data:")
+    print(f"   Rows: {len(df_clean)}")
+    print(f"   Columns: {len(df_clean.columns)}")
+
+    # Show schema
+    print("\n📋 Schema (first 20 columns):")
+    for i, (col, dtype) in enumerate(df_clean.schema.items()):
+        if i < 20:
+            null_count = df_clean[col].null_count()
+            print(f"   {col:50s} {str(dtype):15s} ({null_count:2d} nulls)")
+    print(f"   ... and {len(df_clean.columns) - 20} more columns")
+
+    # Show errors
+    print(f"\n⚠️  Errors collected: {len(collector)}")
+    if len(collector) > 0:
+        errors_df = collector.to_dataframe()
+        print("\n   Error breakdown by column:")
+        error_counts = errors_df.group_by("column").count().sort("count", descending=True)
+        for row in error_counts.iter_rows(named=True):
+            print(f"      {row['column']:40s}: {row['count']:3d} errors")
+
+        print("\n   First 5 errors:")
+        print(errors_df.head(5))
+
+    # Write output
+    output_dir = Path("output/patient_data_clean/Python")
+    output_dir.mkdir(parents=True, exist_ok=True)
+    output_path = output_dir / "2024_Sibu Hospital A4D Tracker_patient_clean.parquet"
+
+    df_clean.write_parquet(output_path)
+    print(f"\n✅ Cleaned data written to: {output_path}")
+
+    # Sample data check
+    print("\n🔍 Sample row (first non-null patient):")
+    sample = df_clean.filter(pl.col("patient_id").is_not_null()).head(1)
+    for col in sample.columns[:15]:
+        print(f"   {col:40s}: {sample[col][0]}")
+
+    print("\n" + "=" * 80)
+    print("✅ CLEANING TEST COMPLETE")
+    print("=" * 80)
+
+
+if __name__ == "__main__":
+    test_cleaning()
diff --git a/a4d-python/scripts/test_extended_trackers.py b/a4d-python/scripts/test_extended_trackers.py
new file mode 100644
index 0000000..b4b5741
--- /dev/null
+++ b/a4d-python/scripts/test_extended_trackers.py
@@ -0,0 +1,142 @@
+#!/usr/bin/env python3
+"""Extended end-to-end tests on older tracker files (2018-2021)."""
+
+# Disable logging for clean output
+import logging
+import sys
+from pathlib import Path
+
+from a4d.clean.patient import clean_patient_data
+from a4d.errors import ErrorCollector
+from a4d.extract.patient import read_all_patient_sheets
+
+logging.disable(logging.CRITICAL)
+
+test_files = [
+    (
+        "2021_Siriraj_Thailand",
+        Path(
+            "/Volumes/USB SanDisk 3.2Gen1 Media/a4d/a4dphase2_upload/Thailand/SRJ/2021_Siriraj Hospital A4D Tracker.xlsx"  # noqa: E501
+        ),
+    ),
+    (
+        "2021_UdonThani_Thailand",
+        Path(
+            "/Volumes/USB SanDisk 3.2Gen1 Media/a4d/a4dphase2_upload/Thailand/UTH/2021_Udon Thani Hospital A4D Tracker.xlsx"  # noqa: E501
+        ),
+    ),
+    (
+        "2020_VNC_Vietnam",
+        Path(
+            "/Volumes/USB SanDisk 3.2Gen1 Media/a4d/a4dphase2_upload/Vietnam/VNC/2020_Vietnam National Children's Hospital A4D Tracker.xlsx"  # noqa: E501
+        ),
+    ),
+    (
+        "2019_Penang_Malaysia",
+        Path(
+            "/Volumes/USB SanDisk 3.2Gen1 Media/a4d/a4dphase2_upload/Malaysia/PNG/2019_Penang General Hospital A4D Tracker_DC.xlsx"  # noqa: E501
+        ),
+    ),
+    (
+        "2019_Mandalay_Myanmar",
+        Path(
+            "/Volumes/USB SanDisk 3.2Gen1 Media/a4d/a4dphase2_upload/Myanmar/MCH/2019_Mandalay Children's Hospital A4D Tracker.xlsx"  # noqa: E501
+        ),
+    ),
+    (
+        "2018_Yangon_Myanmar",
+        Path(
+            "/Volumes/USB SanDisk 3.2Gen1 Media/a4d/a4dphase2_upload/Myanmar/YCH/2018_Yangon Children's Hospital A4D Tracker.xlsx"  # noqa: E501
+        ),
+    ),
+]
+
+print("=" * 100)
+print("EXTENDED END-TO-END TESTING: Older Trackers (2018-2021)")
+print("=" * 100)
+
+results = []
+
+for name, tracker_path in test_files:
+    print(f"\n📁 {name}")
+    print("-" * 100)
+
+    if not tracker_path.exists():
+        print(f"  ❌ File not found: {tracker_path}")
+        results.append((name, "MISSING", {}))
+        continue
+
+    try:
+        # Extract
+        df_raw = read_all_patient_sheets(tracker_path)
+
+        # Get metadata
+        year = (
+            df_raw["tracker_year"][0]
+            if len(df_raw) > 0 and "tracker_year" in df_raw.columns
+            else "N/A"
+        )
+        months = (
+            df_raw["tracker_month"].unique().sort().to_list()
+            if "tracker_month" in df_raw.columns
+            else []
+        )
+
+        print(
+            f"  ✅ EXTRACTION: {len(df_raw)} rows, "
+            f"{len(df_raw.columns)} cols, year={year}, months={months}"
+        )
+
+        # Clean
+        collector = ErrorCollector()
+        df_clean = clean_patient_data(df_raw, collector)
+
+        # Validate schema
+        if len(df_clean.columns) != 83:
+            print(f"  ⚠️  Schema: Expected 83 columns, got {len(df_clean.columns)}")
+
+        # Check key columns
+        stats = {
+            "insulin_type": df_clean["insulin_type"].is_not_null().sum()
+            if "insulin_type" in df_clean.columns
+            else 0,
+            "insulin_total_units": df_clean["insulin_total_units"].is_not_null().sum()
+            if "insulin_total_units" in df_clean.columns
+            else 0,
+        }
+
+        print(
+            f"  ✅ CLEANING: {len(df_clean)} rows, "
+            f"{len(df_clean.columns)} cols, {len(collector)} errors"
+        )
+        print(
+            f"     Key columns: insulin_type={stats['insulin_type']}/{len(df_clean)}, "
+            + f"insulin_total={stats['insulin_total_units']}/{len(df_clean)}"
+        )
+
+        results.append((name, "PASS", stats))
+
+    except Exception as e:
+        print(f"  ❌ ERROR: {type(e).__name__}: {str(e)[:150]}")
+        results.append((name, "FAIL", {"error": str(e)[:100]}))
+
+# Summary
+print("\n" + "=" * 100)
+print("SUMMARY")
+print("=" * 100)
+
+passed = sum(1 for _, status, _ in results if status == "PASS")
+failed = sum(1 for _, status, _ in results if status == "FAIL")
+missing = sum(1 for _, status, _ in results if status == "MISSING")
+
+print(f"\nTotal: {len(results)} trackers")
+print(f"  ✅ Passed: {passed}")
+print(f"  ❌ Failed: {failed}")
+print(f"  ⚠️  Missing: {missing}")
+
+if passed == len(results):
+    print("\n✨ All older trackers processed successfully!")
+    sys.exit(0)
+else:
+    print("\n⚠️  Some trackers failed - review output above")
+    sys.exit(1)
diff --git a/a4d-python/scripts/test_multiple_trackers.py b/a4d-python/scripts/test_multiple_trackers.py
new file mode 100644
index 0000000..3e992ea
--- /dev/null
+++ b/a4d-python/scripts/test_multiple_trackers.py
@@ -0,0 +1,128 @@
+#!/usr/bin/env python3
+"""Test extraction + cleaning on multiple trackers for end-to-end validation."""
+
+# Disable logging for clean output
+import logging
+import sys
+from pathlib import Path
+
+from a4d.clean.patient import clean_patient_data
+from a4d.errors import ErrorCollector
+from a4d.extract.patient import read_all_patient_sheets
+
+logging.disable(logging.CRITICAL)
+
+test_files = [
+    (
+        "2024_ISDFI",
+        Path(
+            "/Volumes/USB SanDisk 3.2Gen1 Media/a4d/a4dphase2_upload/Philippines/ISD/2024_ISDFI A4D Tracker.xlsx"  # noqa: E501
+        ),
+    ),
+    (
+        "2024_Penang",
+        Path(
+            "/Volumes/USB SanDisk 3.2Gen1 Media/a4d/a4dphase2_upload/Malaysia/PNG/2024_Penang General Hospital A4D Tracker.xlsx"  # noqa: E501
+        ),
+    ),
+    (
+        "2023_Sibu",
+        Path(
+            "/Volumes/USB SanDisk 3.2Gen1 Media/a4d/a4dphase2_upload/Malaysia/SBU/2023_Sibu Hospital A4D Tracker.xlsx"  # noqa: E501
+        ),
+    ),
+    (
+        "2022_Penang",
+        Path(
+            "/Volumes/USB SanDisk 3.2Gen1 Media/a4d/a4dphase2_upload/Malaysia/PNG/2022_Penang General Hospital A4D Tracker.xlsx"  # noqa: E501
+        ),
+    ),
+]
+
+print("=" * 100)
+print("END-TO-END TESTING: Extraction + Cleaning")
+print("=" * 100)
+
+results = []
+
+for name, tracker_path in test_files:
+    print(f"\n📁 {name}")
+    print("-" * 100)
+
+    if not tracker_path.exists():
+        print(f"  ❌ File not found: {tracker_path}")
+        results.append((name, "MISSING", {}))
+        continue
+
+    try:
+        # Extract
+        df_raw = read_all_patient_sheets(tracker_path)
+
+        # Get metadata
+        sheets = df_raw["sheet_name"].unique().to_list() if "sheet_name" in df_raw.columns else []
+        months = (
+            df_raw["tracker_month"].unique().sort().to_list()
+            if "tracker_month" in df_raw.columns
+            else []
+        )
+        year = (
+            df_raw["tracker_year"][0]
+            if len(df_raw) > 0 and "tracker_year" in df_raw.columns
+            else "N/A"
+        )
+
+        print(
+            f"  ✅ EXTRACTION: {len(df_raw)} rows, "
+            f"{len(df_raw.columns)} cols, year={year}, months={months}"
+        )
+
+        # Clean
+        collector = ErrorCollector()
+        df_clean = clean_patient_data(df_raw, collector)
+
+        # Validate schema
+        if len(df_clean.columns) != 83:
+            print(f"  ⚠️  Schema: Expected 83 columns, got {len(df_clean.columns)}")
+
+        # Check key columns
+        stats = {
+            "insulin_type": df_clean["insulin_type"].is_not_null().sum(),
+            "insulin_total_units": df_clean["insulin_total_units"].is_not_null().sum(),
+            "fbg_updated_mg": df_clean["fbg_updated_mg"].is_not_null().sum(),
+            "hba1c_updated": df_clean["hba1c_updated"].is_not_null().sum(),
+        }
+
+        print(f"  ✅ CLEANING: {len(df_clean)} rows, 83 cols, {len(collector)} errors")
+        print(
+            f"     Key columns: insulin_type={stats['insulin_type']}/{len(df_clean)}, "
+            + f"insulin_total={stats['insulin_total_units']}/{len(df_clean)}, "
+            + f"fbg_mg={stats['fbg_updated_mg']}/{len(df_clean)}, "
+            + f"hba1c={stats['hba1c_updated']}/{len(df_clean)}"
+        )
+
+        results.append((name, "PASS", stats))
+
+    except Exception as e:
+        print(f"  ❌ ERROR: {type(e).__name__}: {str(e)[:150]}")
+        results.append((name, "FAIL", {"error": str(e)[:100]}))
+
+# Summary
+print("\n" + "=" * 100)
+print("SUMMARY")
+print("=" * 100)
+
+passed = sum(1 for _, status, _ in results if status == "PASS")
+failed = sum(1 for _, status, _ in results if status == "FAIL")
+missing = sum(1 for _, status, _ in results if status == "MISSING")
+
+print(f"\nTotal: {len(results)} trackers")
+print(f"  ✅ Passed: {passed}")
+print(f"  ❌ Failed: {failed}")
+print(f"  ⚠️  Missing: {missing}")
+
+if passed == len(results):
+    print("\n✨ All trackers processed successfully!")
+    sys.exit(0)
+else:
+    print("\n⚠️  Some trackers failed - review output above")
+    sys.exit(1)
diff --git a/a4d-python/scripts/verify_fixes.py b/a4d-python/scripts/verify_fixes.py
new file mode 100644
index 0000000..f0636c1
--- /dev/null
+++ b/a4d-python/scripts/verify_fixes.py
@@ -0,0 +1,122 @@
+#!/usr/bin/env python3
+"""Verify that the Python fixes are working correctly by analyzing the output."""
+
+from pathlib import Path
+
+import polars as pl
+
+
+def verify_python_output():
+    """Verify Python output has correct types and column ordering."""
+
+    python_file = Path(
+        "output/patient_data_raw/Python/2024_Sibu Hospital A4D Tracker_patient_raw.parquet"
+    )
+
+    if not python_file.exists():
+        print(f"❌ Python file not found: {python_file}")
+        return False
+
+    print("=" * 80)
+    print("VERIFYING PYTHON OUTPUT FIXES")
+    print("=" * 80)
+
+    df = pl.read_parquet(python_file)
+
+    # Check 1: Column ordering
+    print("\n1. COLUMN ORDERING")
+    print("-" * 80)
+    priority_cols = ["tracker_year", "tracker_month", "clinic_id", "patient_id"]
+    first_n = min(10, len(df.columns))
+    actual_first_cols = df.columns[:first_n]
+
+    print(f"First {first_n} columns: {actual_first_cols}")
+
+    # Check which priority columns are at the start
+    for i, expected_col in enumerate(priority_cols):
+        if expected_col in df.columns:
+            actual_pos = df.columns.index(expected_col)
+            if actual_pos == i:
+                print(f"  ✅ {expected_col}: position {actual_pos} (expected {i})")
+            else:
+                print(f"  ❌ {expected_col}: position {actual_pos} (expected {i})")
+        else:
+            print(f"  ⚠️  {expected_col}: not found in columns")
+
+    # Check 2: Data types (all should be String)
+    print("\n2. DATA TYPES")
+    print("-" * 80)
+
+    dtypes = df.schema
+    non_string_cols = [
+        (name, dtype) for name, dtype in dtypes.items() if str(dtype) not in ["String", "Utf8"]
+    ]
+
+    if non_string_cols:
+        print(f"❌ Found {len(non_string_cols)} non-String columns:")
+        for col, dtype in non_string_cols[:10]:
+            print(f"  - {col}: {dtype}")
+        if len(non_string_cols) > 10:
+            print(f"  ... and {len(non_string_cols) - 10} more")
+    else:
+        print("✅ All columns are String type")
+
+    # Check 3: No Null dtype columns
+    null_cols = [(name, dtype) for name, dtype in dtypes.items() if str(dtype) == "Null"]
+
+    if null_cols:
+        print(f"\n❌ Found {len(null_cols)} Null-type columns (should be String):")
+        for col, dtype in null_cols:
+            print(f"  - {col}: {dtype}")
+    else:
+        print("✅ No Null-type columns found")
+
+    # Check 4: Sample data
+    print("\n3. SAMPLE DATA (first 3 rows)")
+    print("-" * 80)
+    print(df.head(3))
+
+    # Check 5: Dimensions
+    print("\n4. DIMENSIONS")
+    print("-" * 80)
+    print(f"Rows: {df.height}")
+    print(f"Columns: {df.width}")
+    print(f"Column names: {df.columns[:20]}")
+    if df.width > 20:
+        print(f"... and {df.width - 20} more")
+
+    # Summary
+    print("\n" + "=" * 80)
+    print("SUMMARY")
+    print("=" * 80)
+
+    issues = []
+    if non_string_cols:
+        issues.append(f"{len(non_string_cols)} non-String columns")
+    if null_cols:
+        issues.append(f"{len(null_cols)} Null-type columns")
+
+    # Check column ordering
+    priority_check_failed = False
+    for i, expected_col in enumerate(priority_cols):
+        if expected_col in df.columns:
+            if df.columns.index(expected_col) != i:
+                priority_check_failed = True
+                break
+
+    if priority_check_failed:
+        issues.append("Column ordering incorrect")
+
+    if issues:
+        print(f"❌ Issues found: {', '.join(issues)}")
+        return False
+    else:
+        print("✅ All checks passed!")
+        return True
+
+
+if __name__ == "__main__":
+    import sys
+
+    success = verify_python_output()
+    sys.exit(0 if success else 1)
diff --git a/a4d-python/src/a4d/__init__.py b/a4d-python/src/a4d/__init__.py
new file mode 100644
index 0000000..733bf4a
--- /dev/null
+++ b/a4d-python/src/a4d/__init__.py
@@ -0,0 +1,15 @@
+"""A4D Medical Tracker Data Processing Pipeline."""
+
+from a4d.config import settings
+from a4d.errors import DataError, ErrorCollector
+from a4d.logging import file_logger, setup_logging
+
+__version__ = "0.1.0"
+
+__all__ = [
+    "settings",
+    "setup_logging",
+    "file_logger",
+    "ErrorCollector",
+    "DataError",
+]
diff --git a/a4d-python/src/a4d/__main__.py b/a4d-python/src/a4d/__main__.py
new file mode 100644
index 0000000..e82ca3c
--- /dev/null
+++ b/a4d-python/src/a4d/__main__.py
@@ -0,0 +1,6 @@
+"""Make package executable with 'python -m a4d'."""
+
+from a4d.cli import main
+
+if __name__ == "__main__":
+    main()
diff --git a/a4d-python/src/a4d/clean/__init__.py b/a4d-python/src/a4d/clean/__init__.py
new file mode 100644
index 0000000..e821633
--- /dev/null
+++ b/a4d-python/src/a4d/clean/__init__.py
@@ -0,0 +1,15 @@
+"""Data cleaning and transformation modules."""
+
+from a4d.clean.converters import (
+    correct_decimal_sign,
+    cut_numeric_value,
+    safe_convert_column,
+    safe_convert_multiple_columns,
+)
+
+__all__ = [
+    "safe_convert_column",
+    "safe_convert_multiple_columns",
+    "correct_decimal_sign",
+    "cut_numeric_value",
+]
diff --git a/a4d-python/src/a4d/clean/converters.py b/a4d-python/src/a4d/clean/converters.py
new file mode 100644
index 0000000..8f9a4fc
--- /dev/null
+++ b/a4d-python/src/a4d/clean/converters.py
@@ -0,0 +1,349 @@
+"""Type conversion utilities with error tracking.
+
+This module provides vectorized type conversion functions that track failures
+in an ErrorCollector. This replaces R's rowwise() conversion approach with
+much faster vectorized operations.
+
+The pattern is:
+1. Try vectorized conversion (fast, handles 95%+ of data)
+2. Detect failures (nulls after conversion but not before)
+3. Log only failed rows to ErrorCollector
+4. Replace failures with error value
+"""
+
+import polars as pl
+
+from a4d.clean.date_parser import parse_date_flexible
+from a4d.config import settings
+from a4d.errors import ErrorCollector
+
+
+def safe_convert_column(
+    df: pl.DataFrame,
+    column: str,
+    target_type: pl.DataType,
+    error_collector: ErrorCollector,
+    error_value: float | str | None = None,
+    file_name_col: str = "file_name",
+    patient_id_col: str = "patient_id",
+) -> pl.DataFrame:
+    """Convert column to target type with vectorized error tracking.
+
+    This function attempts vectorized type conversion and tracks any failures
+    in the ErrorCollector. Much faster than R's rowwise() approach.
+
+    Args:
+        df: Input DataFrame
+        column: Column name to convert
+        target_type: Target Polars data type (pl.Int32, pl.Float64, etc.)
+        error_collector: ErrorCollector instance to track failures
+        error_value: Value to use for failed conversions (default from settings)
+        file_name_col: Column containing file name for error tracking
+        patient_id_col: Column containing patient ID for error tracking
+
+    Returns:
+        DataFrame with converted column (failures replaced with error_value)
+
+    Example:
+        >>> collector = ErrorCollector()
+        >>> df = safe_convert_column(
+        ...     df=df,
+        ...     column="age",
+        ...     target_type=pl.Int32,
+        ...     error_collector=collector,
+        ... )
+        >>> # Failures are logged in collector, replaced with ERROR_VAL_NUMERIC
+    """
+    # Determine error value based on target type if not provided
+    if error_value is None:
+        if target_type in (pl.Int32, pl.Int64, pl.Float32, pl.Float64):
+            error_value = settings.error_val_numeric
+        elif target_type in (pl.Utf8, pl.Categorical, pl.String):
+            error_value = settings.error_val_character
+        elif target_type == pl.Date:
+            error_value = settings.error_val_date
+        elif target_type == pl.Boolean:
+            error_value = False  # Default for boolean conversion failures
+        else:
+            raise ValueError(f"Cannot determine error value for type {target_type}")
+
+    # Skip if column doesn't exist
+    if column not in df.columns:
+        return df
+
+    # Normalize empty/whitespace/missing-value strings to null BEFORE conversion
+    # This ensures missing data stays null rather than becoming error values
+    # Matches R behavior where these values → NA (not conversion error)
+    if df[column].dtype in (pl.Utf8, pl.String):
+        # Common missing value representations to treat as null
+        missing_values = ["", "N/A", "NA", "n/a", "na", "-", ".", "None", "none", "NULL", "null"]
+        df = df.with_columns(
+            pl.when(
+                pl.col(column).str.strip_chars().is_in(missing_values)
+                | (pl.col(column).str.strip_chars().str.len_chars() == 0)
+            )
+            .then(None)
+            .otherwise(pl.col(column))
+            .alias(column)
+        )
+
+    # Store original values for error reporting
+    df = df.with_columns(pl.col(column).alias(f"_orig_{column}"))
+
+    # Try vectorized conversion (strict=False allows nulls for failures)
+    df = df.with_columns(pl.col(column).cast(target_type, strict=False).alias(f"_conv_{column}"))
+
+    # Detect failures: became null but wasn't null before
+    failed_mask = pl.col(f"_conv_{column}").is_null() & pl.col(f"_orig_{column}").is_not_null()
+
+    # Extract failed rows for error logging
+    failed_rows = df.filter(failed_mask)
+
+    # Log each failure
+    if len(failed_rows) > 0:
+        for row in failed_rows.iter_rows(named=True):
+            error_collector.add_error(
+                file_name=row.get(file_name_col) or "unknown",
+                patient_id=row.get(patient_id_col) or "unknown",
+                column=column,
+                original_value=row[f"_orig_{column}"],
+                error_message=f"Could not convert to {target_type}",
+                error_code="type_conversion",
+                function_name="safe_convert_column",
+            )
+
+    # Replace failures with error value (cast to target type)
+    df = df.with_columns(
+        pl.when(failed_mask)
+        .then(pl.lit(error_value).cast(target_type))
+        .otherwise(pl.col(f"_conv_{column}"))
+        .alias(column)
+    )
+
+    # Clean up temporary columns
+    df = df.drop([f"_orig_{column}", f"_conv_{column}"])
+
+    return df
+
+
+def parse_date_column(
+    df: pl.DataFrame,
+    column: str,
+    error_collector: ErrorCollector,
+    file_name_col: str = "file_name",
+    patient_id_col: str = "patient_id",
+) -> pl.DataFrame:
+    """Parse date column using flexible date parser.
+
+    Uses parse_date_flexible() to handle various date formats including:
+    - Standard formats (ISO, DD/MM/YYYY, etc.)
+    - Abbreviated month-year (Mar-18, Jan-20)
+    - Excel serial numbers
+    - 4-letter month names
+
+    Args:
+        df: Input DataFrame
+        column: Column name to parse
+        error_collector: ErrorCollector instance to track failures
+        file_name_col: Column containing file name for error tracking
+        patient_id_col: Column containing patient ID for error tracking
+
+    Returns:
+        DataFrame with parsed date column
+
+    Example:
+        >>> df = parse_date_column(
+        ...     df=df,
+        ...     column="hba1c_updated_date",
+        ...     error_collector=collector,
+        ... )
+    """
+    if column not in df.columns:
+        return df
+
+    # Store original values for error reporting
+    df = df.with_columns(pl.col(column).alias(f"_orig_{column}"))
+
+    # Apply parse_date_flexible to each value
+    # NOTE: Using list-based approach instead of map_elements() because
+    # map_elements() with return_dtype=pl.Date fails when ALL values are None
+    # (all-NA columns like hospitalisation_date).
+    # Explicit Series creation with dtype=pl.Date works because it doesn't
+    # require non-null values.
+    column_values = df[column].cast(pl.Utf8).to_list()
+    parsed_dates = [
+        parse_date_flexible(val, error_val=settings.error_val_date) for val in column_values
+    ]
+    parsed_series = pl.Series(f"_parsed_{column}", parsed_dates, dtype=pl.Date)
+    df = df.with_columns(parsed_series)
+
+    # Detect failures: parsed to error date
+    error_date = pl.lit(settings.error_val_date).str.to_date()
+    failed_mask = (
+        pl.col(f"_parsed_{column}").is_not_null()
+        & (pl.col(f"_parsed_{column}") == error_date)
+        & pl.col(f"_orig_{column}").is_not_null()
+    )
+
+    # Extract failed rows for error logging
+    failed_rows = df.filter(failed_mask)
+
+    # Log each failure
+    if len(failed_rows) > 0:
+        for row in failed_rows.iter_rows(named=True):
+            error_collector.add_error(
+                file_name=row.get(file_name_col) or "unknown",
+                patient_id=row.get(patient_id_col) or "unknown",
+                column=column,
+                original_value=row[f"_orig_{column}"],
+                error_message="Could not parse date",
+                error_code="type_conversion",
+                function_name="parse_date_column",
+            )
+
+    # Use parsed values
+    df = df.with_columns(pl.col(f"_parsed_{column}").alias(column))
+
+    # Clean up temporary columns
+    df = df.drop([f"_orig_{column}", f"_parsed_{column}"])
+
+    return df
+
+
+def correct_decimal_sign(df: pl.DataFrame, column: str) -> pl.DataFrame:
+    """Replace comma decimal separator with dot.
+
+    Some trackers use European decimal format (1,5 instead of 1.5).
+
+    Args:
+        df: Input DataFrame
+        column: Column name to correct
+
+    Returns:
+        DataFrame with corrected decimal signs
+
+    Example:
+        >>> df = correct_decimal_sign(df, "weight")
+    """
+    if column not in df.columns:
+        return df
+
+    df = df.with_columns(pl.col(column).cast(pl.Utf8).str.replace(",", ".").alias(column))
+
+    return df
+
+
+def cut_numeric_value(
+    df: pl.DataFrame,
+    column: str,
+    min_val: float,
+    max_val: float,
+    error_collector: ErrorCollector,
+    file_name_col: str = "file_name",
+    patient_id_col: str = "patient_id",
+) -> pl.DataFrame:
+    """Replace out-of-range numeric values with error value.
+
+    Args:
+        df: Input DataFrame
+        column: Column name to check
+        min_val: Minimum allowed value
+        max_val: Maximum allowed value
+        error_collector: ErrorCollector instance to track violations
+        file_name_col: Column containing file name for error tracking
+        patient_id_col: Column containing patient ID for error tracking
+
+    Returns:
+        DataFrame with out-of-range values replaced
+
+    Example:
+        >>> df = cut_numeric_value(
+        ...     df=df,
+        ...     column="age",
+        ...     min_val=0,
+        ...     max_val=25,
+        ...     error_collector=collector,
+        ... )
+    """
+    if column not in df.columns:
+        return df
+
+    # Find values outside allowed range (excluding nulls and existing error values)
+    invalid_mask = (
+        pl.col(column).is_not_null()
+        & (pl.col(column) != settings.error_val_numeric)
+        & ((pl.col(column) < min_val) | (pl.col(column) > max_val))
+    )
+
+    # Extract invalid rows for error logging
+    invalid_rows = df.filter(invalid_mask)
+
+    # Log each invalid value
+    if len(invalid_rows) > 0:
+        for row in invalid_rows.iter_rows(named=True):
+            error_collector.add_error(
+                file_name=row.get(file_name_col) or "unknown",
+                patient_id=row.get(patient_id_col) or "unknown",
+                column=column,
+                original_value=row[column],
+                error_message=f"Value {row[column]} outside allowed range [{min_val}, {max_val}]",
+                error_code="invalid_value",
+                function_name="cut_numeric_value",
+            )
+
+    # Replace invalid values with error value
+    df = df.with_columns(
+        pl.when(invalid_mask)
+        .then(pl.lit(settings.error_val_numeric))
+        .otherwise(pl.col(column))
+        .alias(column)
+    )
+
+    return df
+
+
+def safe_convert_multiple_columns(
+    df: pl.DataFrame,
+    columns: list[str],
+    target_type: pl.DataType,
+    error_collector: ErrorCollector,
+    error_value: float | str | None = None,
+    file_name_col: str = "file_name",
+    patient_id_col: str = "patient_id",
+) -> pl.DataFrame:
+    """Convert multiple columns to the same target type.
+
+    Convenience function for batch conversion of columns.
+
+    Args:
+        df: Input DataFrame
+        columns: List of column names to convert
+        target_type: Target Polars data type
+        error_collector: ErrorCollector instance
+        error_value: Value to use for failed conversions
+        file_name_col: Column containing file name for error tracking
+        patient_id_col: Column containing patient ID for error tracking
+
+    Returns:
+        DataFrame with all specified columns converted
+
+    Example:
+        >>> df = safe_convert_multiple_columns(
+        ...     df=df,
+        ...     columns=["age", "height", "weight"],
+        ...     target_type=pl.Float64,
+        ...     error_collector=collector,
+        ... )
+    """
+    for column in columns:
+        df = safe_convert_column(
+            df=df,
+            column=column,
+            target_type=target_type,
+            error_collector=error_collector,
+            error_value=error_value,
+            file_name_col=file_name_col,
+            patient_id_col=patient_id_col,
+        )
+
+    return df
diff --git a/a4d-python/src/a4d/clean/date_parser.py b/a4d-python/src/a4d/clean/date_parser.py
new file mode 100644
index 0000000..896216f
--- /dev/null
+++ b/a4d-python/src/a4d/clean/date_parser.py
@@ -0,0 +1,123 @@
+"""Flexible date parsing for A4D tracker data.
+
+Matches R's parse_dates() function (script2_helper_patient_data_fix.R:174-211).
+Handles various date formats found in legacy trackers including:
+- Standard formats: "28/8/2017", "01-03-2018"
+- Abbreviated month-year: "Mar-18", "Jan-20"
+- Full month-year: "March-2018", "January-20"
+- Excel serial numbers: "45341.0" (days since 1899-12-30)
+- Year only: "2018", "18"
+"""
+
+import re
+from datetime import date, datetime, timedelta
+
+from dateutil import parser as date_parser
+from loguru import logger
+
+# Excel epoch: dates stored as days since this date
+EXCEL_EPOCH = date(1899, 12, 30)
+
+
+def parse_date_flexible(date_str: str | None, error_val: str = "9999-09-09") -> date | None:
+    """Parse date strings flexibly using Python's dateutil.parser.
+
+    Handles common edge cases from A4D tracker data:
+    - NA/None/empty values → None
+    - Excel serial numbers (e.g., "45341.0") → converted from days since 1899-12-30
+    - 4-letter month names (e.g., "March") → truncated to 3 letters before parsing
+    - All standard date formats via dateutil.parser (very flexible)
+
+    Examples:
+        "Mar-18" → 2018-03-01
+        "28/8/2017" → 2017-08-28
+        "45341.0" → 2024-01-13 (Excel serial)
+        "January-20" → 2020-01-01
+
+    Args:
+        date_str: Date string to parse
+        error_val: Value to parse and return on failure (default "9999-09-09")
+
+    Returns:
+        Parsed date, None for NA/empty, or error date if parsing fails
+    """
+    # Handle None, empty, or NA strings
+    if (
+        date_str is None
+        or date_str == ""
+        or str(date_str).strip().lower() in ["na", "nan", "null", "none"]
+    ):
+        return None
+
+    date_str = str(date_str).strip()
+
+    # Handle Excel serial numbers
+    # Excel stores dates as number of days since 1899-12-30
+    try:
+        numeric_val = float(date_str)
+        if 1 < numeric_val < 100000:  # Reasonable range for Excel dates (1900-2173)
+            days = int(numeric_val)
+            result = EXCEL_EPOCH + timedelta(days=days)
+            logger.debug(f"Parsed Excel serial {date_str} → {result}")
+            return result
+    except ValueError:
+        pass  # Not a number, continue with text parsing
+
+    # Truncate 4-letter month names to 3 letters for better parsing
+    # "March" → "Mar", "January" → "Jan", etc.
+    if re.search(r"[a-zA-Z]{4}", date_str):
+        date_str = re.sub(r"([a-zA-Z]{3})[a-zA-Z]", r"\1", date_str)
+
+    # Special handling for month-year formats (e.g., "Mar-18", "Jan-20", "May18")
+    # These should be interpreted as "Mar 2018", "Jan 2020", not "Mar day-18 of current year"
+    # Separator (hyphen/space) is optional to handle both "May-18" and "May18"
+    month_year_pattern = r"^([A-Za-z]{3})[-\s]?(\d{2})$"
+    match = re.match(month_year_pattern, date_str)
+    if match:
+        month_abbr, year_2digit = match.groups()
+        # Convert 2-digit year to 4-digit: 00-68 → 2000-2068, 69-99 → 1969-1999
+        year_int = int(year_2digit)
+        if year_int <= 68:
+            year_4digit = 2000 + year_int
+        else:
+            year_4digit = 1900 + year_int
+        # Parse as "Mon YYYY" format, defaults to first day of month
+        date_str_full = f"{month_abbr} {year_4digit}"
+        try:
+            result = datetime.strptime(date_str_full, "%b %Y").date()
+            logger.debug(f"Parsed month-year '{date_str}' → {result}")
+            return result
+        except ValueError:
+            pass  # Fall through to general parser
+
+    # Try explicit DD/MM/YYYY and DD-MM-YYYY formats first (Southeast Asian standard)
+    # This is more reliable than dateutil.parser's dayfirst=True parameter
+    for fmt in [
+        "%d/%m/%Y",  # 06/05/2013 → 2013-05-06 (6th May)
+        "%d-%m-%Y",  # 06-05-2013 → 2013-05-06
+        "%d/%m/%y",  # 06/05/13 → 2013-05-06
+        "%d-%m-%y",  # 06-05-13 → 2013-05-06
+        "%Y-%m-%d",  # 2013-05-06 (ISO format from Excel)
+        "%d/%m/%Y %H:%M:%S",  # With time component
+        "%Y-%m-%d %H:%M:%S",  # ISO with time
+    ]:
+        try:
+            result = datetime.strptime(date_str, fmt).date()
+            logger.debug(f"Parsed '{date_str}' using format {fmt} → {result}")
+            return result
+        except ValueError:
+            continue
+
+    # Fall back to dateutil.parser for other formats (month names, etc.)
+    # dayfirst=True is still useful for remaining ambiguous cases
+    try:
+        result = date_parser.parse(date_str, dayfirst=True).date()
+        logger.debug(f"Parsed '{date_str}' with dateutil → {result}")
+        return result
+    except (ValueError, date_parser.ParserError) as e:
+        # If parsing fails, log warning and return error date
+        logger.warning(f"Could not parse date '{date_str}': {e}. Returning error value {error_val}")
+        try:
+            return datetime.strptime(error_val, "%Y-%m-%d").date()
+        except ValueError:
+            return None
diff --git a/a4d-python/src/a4d/clean/patient.py b/a4d-python/src/a4d/clean/patient.py
new file mode 100644
index 0000000..321ae37
--- /dev/null
+++ b/a4d-python/src/a4d/clean/patient.py
@@ -0,0 +1,933 @@
+"""Patient data cleaning pipeline.
+
+This module orchestrates the complete cleaning pipeline for patient data,
+following the R pipeline's meta schema approach (script2_process_patient_data.R):
+
+1. Load raw patient data
+2. Apply legacy format fixes
+3. Apply transformations
+4. Type conversions
+5. Validation
+6. Apply meta schema (ensure all columns exist, consistent output)
+"""
+
+from pathlib import Path
+
+import polars as pl
+from loguru import logger
+
+from a4d.clean.converters import (
+    correct_decimal_sign,
+    cut_numeric_value,
+    parse_date_column,
+    safe_convert_column,
+)
+from a4d.clean.schema import (
+    apply_schema,
+    get_date_columns,
+    get_patient_data_schema,
+)
+from a4d.clean.transformers import extract_regimen
+from a4d.clean.validators import validate_all_columns
+from a4d.config import settings
+from a4d.errors import ErrorCollector
+
+
+def clean_patient_data(
+    df_raw: pl.DataFrame,
+    error_collector: ErrorCollector,
+) -> pl.DataFrame:
+    """Clean raw patient data following the complete pipeline.
+
+    This function orchestrates all cleaning steps and ensures the output
+    conforms to the meta schema, regardless of which columns exist in input.
+
+    Args:
+        df_raw: Raw patient data from extraction
+        error_collector: ErrorCollector instance for tracking errors
+
+    Returns:
+        Cleaned DataFrame with complete meta schema applied
+
+    Example:
+        >>> from a4d.extract.patient import extract_patient_data
+        >>> from a4d.errors import ErrorCollector
+        >>>
+        >>> collector = ErrorCollector()
+        >>> df_raw = extract_patient_data(tracker_file)
+        >>> df_clean = clean_patient_data(df_raw, collector)
+        >>> # df_clean has ALL schema columns, with consistent types
+    """
+    logger.info(
+        f"Starting patient data cleaning: {len(df_raw)} rows, {len(df_raw.columns)} columns"
+    )
+
+    # Step 1: Legacy format fixes
+    df = _apply_legacy_fixes(df_raw)
+
+    # Step 2: Pre-processing transformations
+    df = _apply_preprocessing(df)
+
+    # Step 3: Data transformations (regimen extraction, lowercasing, etc.)
+    df = _apply_transformations(df)
+
+    # Step 4: Apply meta schema EARLY (like R does) to ensure all columns exist before conversions
+    # This allows unit conversions to work on columns that don't exist in raw data
+    df = apply_schema(df)
+
+    # Step 5: Type conversions
+    df = _apply_type_conversions(df, error_collector)
+
+    # Step 5.5: Fix age from DOB (like R pipeline does)
+    # Must happen after type conversions so DOB is a proper date
+    # Must happen before range validation so validated age is correct
+    df = _fix_age_from_dob(df, error_collector)
+
+    # Step 5.5b: Calculate t1d_diagnosis_age from dob and t1d_diagnosis_date
+    # Replaces any existing value (including Excel errors like #NUM!)
+    df = _fix_t1d_diagnosis_age(df)
+
+    # Step 5.6: Validate dates (replace future dates with error value)
+    # Must happen after type conversions so dates are proper date types
+    df = _validate_dates(df, error_collector)
+
+    # Step 5.7: Calculate BMI from weight and height (like R does)
+    # Must happen after type conversions and before range validation
+    df = _calculate_bmi(df)
+
+    # Step 6: Range validation and cleanup
+    df = _apply_range_validation(df, error_collector)
+
+    # Step 7: Allowed values validation
+    df = validate_all_columns(df, error_collector)
+
+    # Step 8: Unit conversions (requires schema to be applied first!)
+    df = _apply_unit_conversions(df)
+
+    # Step 9: Create tracker_date from year/month
+    df = _add_tracker_date(df)
+
+    # Step 10: Sort by tracker_date and patient_id
+    df = df.sort(["tracker_date", "patient_id"])
+
+    logger.info(f"Cleaning complete: {len(df)} rows, {len(df.columns)} columns")
+    logger.info(f"Errors collected: {len(error_collector)}")
+
+    return df
+
+
+def _extract_date_from_measurement(df: pl.DataFrame, col_name: str) -> pl.DataFrame:
+    """Extract date from measurement values in legacy trackers.
+
+    Matches R's extract_date_from_measurement() (script2_helper_patient_data_fix.R:115).
+
+    For pre-2019 trackers, values and dates are combined in format:
+    - "14.5 (Jan-20)" → value="14.5 ", date="Jan-20"
+    - ">14 (Mar-18)" → value=">14 ", date="Mar-18"
+    - "148 mg/dl   (Mar-18)" → value="148 mg/dl   ", date="Mar-18"
+
+    Args:
+        df: Input DataFrame
+        col_name: Column name containing combined value+date
+
+    Returns:
+        DataFrame with extracted date in {col_name}_date column
+    """
+    if col_name not in df.columns:
+        return df
+
+    date_col_name = col_name.replace("_mg", "").replace("_mmol", "") + "_date"
+
+    # Check if date column already exists (2019+ trackers)
+    if date_col_name in df.columns:
+        return df
+
+    # Extract value before '(' and date between '(' and ')'
+    # Using regex: everything before '(', then '(', then capture date, then optional ')'
+    df = df.with_columns(
+        [
+            # Extract value (everything before parenthesis, or entire value if no parenthesis)
+            pl.col(col_name).str.extract(r"^([^(]+)", 1).str.strip_chars().alias(col_name),
+            # Extract date (everything between parentheses, if present)
+            pl.col(col_name).str.extract(r"\(([^)]+)\)", 1).alias(date_col_name),
+        ]
+    )
+
+    logger.debug(f"Extracted date from {col_name} into {date_col_name}")
+
+    return df
+
+
+def _apply_legacy_fixes(df: pl.DataFrame) -> pl.DataFrame:
+    """Apply fixes for legacy tracker formats (pre-2024).
+
+    Legacy trackers may have:
+    - Combined date+value columns (e.g., hba1c_updated contains both)
+    - Combined blood pressure values (sys/dias in one column)
+    - Different column structures
+
+    Matches R's legacy handling in script2_process_patient_data.R:30-66.
+
+    Args:
+        df: Input DataFrame
+
+    Returns:
+        DataFrame with legacy fixes applied
+    """
+    # Extract dates from measurement columns for pre-2019 trackers
+    # R checks if *_date column exists, if not, extracts from measurement column
+    df = _extract_date_from_measurement(df, "hba1c_updated")
+    df = _extract_date_from_measurement(df, "fbg_updated_mg")
+    df = _extract_date_from_measurement(df, "fbg_updated_mmol")
+
+    # Split blood pressure for pre-2024 trackers (R line 72)
+    if "blood_pressure_mmhg" in df.columns:
+        from a4d.clean.transformers import split_bp_in_sys_and_dias
+
+        df = split_bp_in_sys_and_dias(df)
+
+    return df
+
+
+def _fix_fbg_column(col: pl.Expr) -> pl.Expr:
+    """Fix FBG column text values to numeric equivalents.
+
+    Matches R's fix_fbg() function (script2_helper_patient_data_fix.R:551-567).
+    Converts qualitative text to numeric values and removes DKA markers.
+
+    Conversions (based on CDC guidelines):
+    - "high", "bad", "hi", "hight" (typo) → "200"
+    - "medium", "med" → "170"
+    - "low", "good", "okay" → "140"
+    - Remove "(DKA)" text, "mg/dl", "mmol/l" suffixes
+    - Trim whitespace
+
+    Args:
+        col: Polars expression for FBG column
+
+    Returns:
+        Polars expression with fixed values
+    """
+    return (
+        col.str.to_lowercase()
+        # Remove unit suffixes (from legacy trackers like 2018)
+        .str.replace_all(r"\s*mg/dl\s*", "", literal=False)
+        .str.replace_all(r"\s*mmol/l\s*", "", literal=False)
+        # Use case-when to match full words, not substrings
+        .str.replace_all(r"^(high|hight|bad|hi)$", "200")  # Anchored to full string
+        .str.replace_all(r"^(med|medium)$", "170")
+        .str.replace_all(r"^(low|good|okay)$", "140")
+        .str.replace_all(r"\(DKA\)", "", literal=True)
+        .str.strip_chars()
+    )
+
+
+def _apply_preprocessing(df: pl.DataFrame) -> pl.DataFrame:
+    """Apply preprocessing transformations before type conversion.
+
+    This includes:
+    - Normalizing patient_id (remove transfer clinic suffix)
+    - Removing > and < signs from HbA1c values (but tracking them)
+    - Fixing FBG text values (high/medium/low → numeric, removing (DKA))
+    - Replacing "-" with "N" in Y/N columns
+    - Deriving insulin_type and insulin_subtype from individual columns (2024+)
+
+    Args:
+        df: Input DataFrame
+
+    Returns:
+        DataFrame with preprocessing applied
+    """
+    # Normalize patient_id: Keep only COUNTRY_ID part, remove transfer clinic suffix
+    # Pattern: "MY_SM003_SB" → "MY_SM003" (keep first two underscore-separated parts)
+    # Also normalizes hyphens first: "LA-MH093_LF" → "LA_MH093_LF" → "LA_MH093"
+    # This ensures consistent patient linking across years when patients transfer clinics
+    if "patient_id" in df.columns:
+        df = df.with_columns(
+            # First normalize hyphens to underscores
+            pl.col("patient_id").str.replace_all("-", "_").alias("_patient_id_normalized")
+        )
+        df = df.with_columns(
+            pl.when(pl.col("_patient_id_normalized").str.contains("_"))
+            .then(pl.col("_patient_id_normalized").str.extract(r"^([A-Z]+_[^_]+)", 1))
+            .otherwise(pl.col("_patient_id_normalized"))
+            .alias("patient_id")
+        )
+        df = df.drop("_patient_id_normalized")
+
+    # Track HbA1c exceeds markers (> or <)
+    if "hba1c_baseline" in df.columns:
+        df = df.with_columns(
+            pl.col("hba1c_baseline")
+            .str.contains(r"[><]")
+            .fill_null(False)
+            .alias("hba1c_baseline_exceeds")
+        )
+        df = df.with_columns(
+            pl.col("hba1c_baseline").str.replace_all(r"[><]", "").alias("hba1c_baseline")
+        )
+
+    if "hba1c_updated" in df.columns:
+        df = df.with_columns(
+            pl.col("hba1c_updated")
+            .str.contains(r"[><]")
+            .fill_null(False)
+            .alias("hba1c_updated_exceeds")
+        )
+        df = df.with_columns(
+            pl.col("hba1c_updated").str.replace_all(r"[><]", "").alias("hba1c_updated")
+        )
+
+    # Fix FBG text values (R: script2_helper_patient_data_fix.R:551-567)
+    # Convert qualitative values to numeric: high→200, medium→170, low→140
+    # Source: https://www.cdc.gov/diabetes/basics/getting-tested.html
+    if "fbg_updated_mg" in df.columns:
+        df = df.with_columns(_fix_fbg_column(pl.col("fbg_updated_mg")).alias("fbg_updated_mg"))
+
+    if "fbg_updated_mmol" in df.columns:
+        df = df.with_columns(_fix_fbg_column(pl.col("fbg_updated_mmol")).alias("fbg_updated_mmol"))
+
+    # Replace "-" with "N" in Y/N columns (2024+ trackers use "-" for No)
+    yn_columns = [
+        "analog_insulin_long_acting",
+        "analog_insulin_rapid_acting",
+        "human_insulin_intermediate_acting",
+        "human_insulin_pre_mixed",
+        "human_insulin_short_acting",
+    ]
+
+    for col in yn_columns:
+        if col in df.columns:
+            df = df.with_columns(pl.col(col).str.replace("-", "N").alias(col))
+
+    # Derive insulin_type and insulin_subtype from individual columns (2024+)
+    # R's validation will convert insulin_type to Title Case and insulin_subtype to "Undefined"
+    if "human_insulin_pre_mixed" in df.columns:
+        df = _derive_insulin_fields(df)
+
+    return df
+
+
+def _derive_insulin_fields(df: pl.DataFrame) -> pl.DataFrame:
+    """Derive insulin_type and insulin_subtype from individual columns.
+
+    Based on R's logic from script2_process_patient_data.R:91-111 but with corrections:
+    - Uses lowercase values (R does this, validation converts to Title Case later)
+    - FIXES R's typo: Uses "rapid-acting" (correct) instead of R's "rapic-acting" (typo)
+
+    For 2024+ trackers:
+    - insulin_type: "human insulin" if any human column is Y, else "analog insulin"
+    - insulin_subtype: Comma-separated list like "pre-mixed,rapid-acting,long-acting"
+      (will be replaced with "Undefined" by validation since
+      comma-separated values aren't in allowed_values)
+
+    NOTE: Python is CORRECT here. Comparison with R will show differences because R has a typo.
+
+    Args:
+        df: Input DataFrame with individual insulin columns
+
+    Returns:
+        DataFrame with insulin_type and insulin_subtype derived
+    """
+    # Determine insulin_type (lowercase to match R)
+    # Important: R's ifelse returns NA when all conditions are NA/None
+    # So we only derive insulin_type when at least one column is not None
+    df = df.with_columns(
+        pl.when(
+            # Only derive if at least one insulin column is not null
+            pl.col("human_insulin_pre_mixed").is_not_null()
+            | pl.col("human_insulin_short_acting").is_not_null()
+            | pl.col("human_insulin_intermediate_acting").is_not_null()
+            | pl.col("analog_insulin_rapid_acting").is_not_null()
+            | pl.col("analog_insulin_long_acting").is_not_null()
+        )
+        .then(
+            # Now check which type
+            pl.when(
+                (pl.col("human_insulin_pre_mixed") == "Y")
+                | (pl.col("human_insulin_short_acting") == "Y")
+                | (pl.col("human_insulin_intermediate_acting") == "Y")
+            )
+            .then(pl.lit("human insulin"))
+            .otherwise(pl.lit("analog insulin"))
+        )
+        .otherwise(None)  # Return None if all columns are None (matches R's NA)
+        .alias("insulin_type")
+    )
+
+    # Build insulin_subtype as comma-separated list (lowercase to match R)
+    # CORRECTED: Use "rapid-acting" (correct) instead of R's "rapic-acting" (typo)
+    df = df.with_columns(
+        pl.concat_list(
+            [
+                pl.when(pl.col("human_insulin_pre_mixed") == "Y")
+                .then(pl.lit("pre-mixed"))
+                .otherwise(pl.lit(None)),
+                pl.when(pl.col("human_insulin_short_acting") == "Y")
+                .then(pl.lit("short-acting"))
+                .otherwise(pl.lit(None)),
+                pl.when(pl.col("human_insulin_intermediate_acting") == "Y")
+                .then(pl.lit("intermediate-acting"))
+                .otherwise(pl.lit(None)),
+                pl.when(pl.col("analog_insulin_rapid_acting") == "Y")
+                .then(pl.lit("rapid-acting"))  # CORRECTED from R's typo
+                .otherwise(pl.lit(None)),
+                pl.when(pl.col("analog_insulin_long_acting") == "Y")
+                .then(pl.lit("long-acting"))
+                .otherwise(pl.lit(None)),
+            ]
+        )
+        .list.drop_nulls()
+        .list.join(",")
+        .alias("insulin_subtype")
+    )
+
+    return df
+
+
+def _apply_transformations(df: pl.DataFrame) -> pl.DataFrame:
+    """Apply data transformations.
+
+    Transformations are explicit Python code (not config-driven):
+    - Lowercase status for case-insensitive validation
+    - Standardize insulin regimen descriptions
+    - Map sex synonyms to M/F
+    - Correct European decimal format
+
+    Args:
+        df: Input DataFrame
+
+    Returns:
+        DataFrame with transformations applied
+    """
+    # Status should keep original case to match R pipeline
+    # R validation is case-insensitive but preserves original values
+
+    # Standardize insulin regimen
+    if "insulin_regimen" in df.columns:
+        df = extract_regimen(df)
+
+    # Map sex synonyms to M/F (matching R's fix_sex)
+    if "sex" in df.columns:
+        from a4d.clean.transformers import fix_sex
+
+        df = fix_sex(df)
+
+    # Fix testing frequency ranges (R line 258)
+    if "testing_frequency" in df.columns:
+        from a4d.clean.transformers import fix_testing_frequency
+
+        df = fix_testing_frequency(df)
+
+    # Correct European decimal format (comma → dot)
+    numeric_cols = [
+        "hba1c_baseline",
+        "hba1c_updated",
+        "fbg_updated_mg",
+        "fbg_updated_mmol",
+        "weight",
+        "height",
+        "bmi",
+    ]
+
+    for col in numeric_cols:
+        if col in df.columns:
+            df = correct_decimal_sign(df, col)
+
+    return df
+
+
+def _apply_type_conversions(df: pl.DataFrame, error_collector: ErrorCollector) -> pl.DataFrame:
+    """Convert columns to target types using safe_convert_column.
+
+    Only converts columns that exist in both the DataFrame and the schema.
+
+    Special handling:
+    - Date columns: Use flexible date parser (handles Mar-18, Excel serials, etc.)
+    - Integer columns: Convert via Float64 first to handle decimals
+
+    Args:
+        df: Input DataFrame
+        error_collector: ErrorCollector for tracking conversion failures
+
+    Returns:
+        DataFrame with types converted
+    """
+    schema = get_patient_data_schema()
+
+    # Convert each column that exists
+    for col, target_type in schema.items():
+        if col not in df.columns:
+            continue
+
+        # Skip if already the correct type (happens when schema adds NULL columns)
+        if df[col].dtype == target_type:
+            continue
+
+        # Special handling for Date columns: use flexible date parser
+        if target_type == pl.Date:
+            # Strip time component if present (e.g., "2009-04-17 00:00:00" → "2009-04-17")
+            # Use split on space instead of slice(0,10) to handle "dd-Mon-yyyy" format (11 chars)
+            df = df.with_columns(
+                pl.col(col).cast(pl.Utf8).str.split(" ").list.first().alias(col)
+            )
+            # Use custom date parser for flexibility (handles Mar-18, Excel serials, etc.)
+            df = parse_date_column(df, col, error_collector)
+        # Special handling for Int32: convert via Float64 first (handles "14.0" → 14.0 → 14)
+        elif target_type == pl.Int32:
+            df = safe_convert_column(df, col, pl.Float64, error_collector)
+            df = df.with_columns(pl.col(col).round(0).cast(pl.Int32, strict=False).alias(col))
+        else:
+            df = safe_convert_column(
+                df=df,
+                column=col,
+                target_type=target_type,
+                error_collector=error_collector,
+            )
+
+    return df
+
+
+def _calculate_bmi(df: pl.DataFrame) -> pl.DataFrame:
+    """Calculate BMI from weight and height.
+
+    Matches R's fix_bmi() function (script2_helper_patient_data_fix.R:401).
+    This REPLACES any existing BMI value with calculated BMI = weight / height^2.
+
+    Must be called after type conversions (so weight/height are numeric)
+    and before range validation (so calculated BMI gets validated).
+
+    Args:
+        df: Input DataFrame
+
+    Returns:
+        DataFrame with calculated BMI column
+    """
+    from a4d.clean.transformers import fix_bmi
+
+    return fix_bmi(df)
+
+
+def _apply_range_validation(df: pl.DataFrame, error_collector: ErrorCollector) -> pl.DataFrame:
+    """Apply range validation and value cleanup.
+
+    This includes:
+    - Height: 0-2.3m (convert cm to m if needed)
+    - Weight: 0-200kg
+    - BMI: 4-60
+    - Age: 0-25 years
+    - HbA1c: 4-18%
+    - FBG: 0-136.5 mmol/l
+
+    Args:
+        df: Input DataFrame
+        error_collector: ErrorCollector for tracking violations
+
+    Returns:
+        DataFrame with range validation applied
+    """
+    # Height: convert cm to m if > 2.3 (likely in cm), then validate
+    if "height" in df.columns:
+        df = df.with_columns(
+            pl.when(pl.col("height") > 2.3)
+            .then(pl.col("height") / 100.0)
+            .otherwise(pl.col("height"))
+            .alias("height")
+        )
+        df = cut_numeric_value(df, "height", 0, 2.3, error_collector)
+
+    # Weight: 0-200 kg
+    if "weight" in df.columns:
+        df = cut_numeric_value(df, "weight", 0, 200, error_collector)
+
+    # BMI: 4-60
+    if "bmi" in df.columns:
+        df = cut_numeric_value(df, "bmi", 10, 80, error_collector)
+
+    # Age: 0-25 years
+    if "age" in df.columns:
+        df = cut_numeric_value(df, "age", 0, 100, error_collector)
+
+    # HbA1c baseline: 4-18%
+    if "hba1c_baseline" in df.columns:
+        df = cut_numeric_value(df, "hba1c_baseline", 0, 25, error_collector)
+
+    # HbA1c updated: 4-18%
+    if "hba1c_updated" in df.columns:
+        df = cut_numeric_value(df, "hba1c_updated", 0, 25, error_collector)
+
+    # FBG updated mmol: 0-136.5 (world record)
+    if "fbg_updated_mmol" in df.columns:
+        df = cut_numeric_value(df, "fbg_updated_mmol", 0, 150, error_collector)
+
+    return df
+
+
+def _apply_unit_conversions(df: pl.DataFrame) -> pl.DataFrame:
+    """Apply unit conversions.
+
+    - FBG mmol/l ↔ mg/dl conversion (18x factor)
+    - Only convert if one is missing but the other exists
+
+    Args:
+        df: Input DataFrame
+
+    Returns:
+        DataFrame with unit conversions applied
+    """
+    # Convert fbg_updated_mg to mmol if mmol is all NULL
+    if "fbg_updated_mmol" in df.columns and "fbg_updated_mg" in df.columns:
+        if df["fbg_updated_mmol"].is_null().all():
+            df = df.with_columns(
+                pl.when(pl.col("fbg_updated_mg") != settings.error_val_numeric)
+                .then(pl.col("fbg_updated_mg") / 18.0)
+                .otherwise(None)
+                .alias("fbg_updated_mmol")
+            )
+
+    # Convert fbg_updated_mmol to mg if mg is all NULL
+    if "fbg_updated_mg" in df.columns and "fbg_updated_mmol" in df.columns:
+        if df["fbg_updated_mg"].is_null().all():
+            df = df.with_columns(
+                pl.when(pl.col("fbg_updated_mmol") != settings.error_val_numeric)
+                .then(pl.col("fbg_updated_mmol") * 18.0)
+                .otherwise(None)
+                .alias("fbg_updated_mg")
+            )
+
+    return df
+
+
+def _fix_age_from_dob(df: pl.DataFrame, error_collector: ErrorCollector) -> pl.DataFrame:
+    """Fix age by calculating from DOB and tracker date.
+
+    Matches R pipeline's fix_age() function (script2_helper_patient_data_fix.R:329).
+    Always uses calculated age from DOB rather than trusting Excel value.
+
+    Logic:
+    1. Calculate age: tracker_year - birth_year
+    2. Adjust if birthday hasn't occurred yet: if tracker_month < birth_month: age -= 1
+    3. If calculated age differs from Excel age, log warning and use calculated
+    4. If calculated age is negative, use error value and log warning
+
+    Args:
+        df: DataFrame with age, dob, tracker_year, tracker_month, patient_id columns
+        error_collector: ErrorCollector for tracking data quality issues
+
+    Returns:
+        DataFrame with corrected age values
+
+    Example:
+        >>> df = pl.DataFrame({
+        ...     "patient_id": ["P001"],
+        ...     "age": [21.0],  # Wrong value from Excel
+        ...     "dob": [date(2006, 8, 8)],
+        ...     "tracker_year": [2025],
+        ...     "tracker_month": [2]
+        ... })
+        >>> collector = ErrorCollector()
+        >>> fixed = _fix_age_from_dob(df, collector)
+        >>> fixed["age"][0]  # Should be 18, not 21
+        18.0
+    """
+    # Only fix if we have the necessary columns
+    required_cols = ["age", "dob", "tracker_year", "tracker_month", "patient_id"]
+    if not all(col in df.columns for col in required_cols):
+        logger.debug("Skipping age fix: missing required columns")
+        return df
+
+    logger.info("Fixing age values from DOB (matching R pipeline logic)")
+
+    error_date = pl.lit(settings.error_val_date).str.to_date()
+
+    # Only calculate if dob is valid (not null, not error date)
+    valid_dob = pl.col("dob").is_not_null() & (pl.col("dob") != error_date)
+
+    # Calculate age from DOB
+    # calc_age = tracker_year - year(dob)
+    # if tracker_month < month(dob): calc_age -= 1
+    df = df.with_columns(
+        pl.when(valid_dob)
+        .then(
+            pl.col("tracker_year")
+            - pl.col("dob").dt.year()
+            - pl.when(pl.col("tracker_month") < pl.col("dob").dt.month()).then(1).otherwise(0)
+        )
+        .otherwise(None)
+        .alias("_calc_age")
+    )
+
+    # Track which ages were fixed
+    ages_fixed = 0
+    ages_missing = 0
+    ages_negative = 0
+
+    # For each row where calc_age differs from age, log and fix
+    for row in df.filter(
+        pl.col("_calc_age").is_not_null()
+        & ((pl.col("age").is_null()) | (pl.col("age") != pl.col("_calc_age")))
+    ).iter_rows(named=True):
+        patient_id = row["patient_id"]
+        file_name = row.get("file_name") or "unknown"
+        excel_age = row["age"]
+        calc_age = row["_calc_age"]
+
+        if excel_age is None or (excel_age == settings.error_val_numeric):
+            logger.warning(
+                f"Patient {patient_id}: age is missing. "
+                f"Using calculated age {calc_age} instead of original age."
+            )
+            error_collector.add_error(
+                file_name=file_name,
+                patient_id=patient_id,
+                column="age",
+                original_value=excel_age if excel_age is not None else "NULL",
+                error_message=f"Age missing, calculated from DOB as {calc_age}",
+                error_code="missing_value",
+                function_name="_fix_age_from_dob",
+            )
+            ages_missing += 1
+        elif calc_age < 0:
+            logger.warning(
+                f"Patient {patient_id}: calculated age is negative ({calc_age}). "
+                f"Please check this manually. Using error value instead."
+            )
+            error_collector.add_error(
+                file_name=file_name,
+                patient_id=patient_id,
+                column="age",
+                original_value=str(excel_age),
+                error_message=f"Calculated age is negative ({calc_age}), check DOB",
+                error_code="invalid_value",
+                function_name="_fix_age_from_dob",
+            )
+            ages_negative += 1
+        else:
+            logger.warning(
+                f"Patient {patient_id}: age {excel_age} is different "
+                f"from calculated age {calc_age}. "
+                f"Using calculated age instead of original age."
+            )
+            error_collector.add_error(
+                file_name=file_name,
+                patient_id=patient_id,
+                column="age",
+                original_value=str(excel_age),
+                error_message=(
+                    f"Age mismatch: Excel={excel_age}, "
+                    f"Calculated={calc_age}. Using calculated age."
+                ),
+                error_code="invalid_value",
+                function_name="_fix_age_from_dob",
+            )
+            ages_fixed += 1
+
+    # Apply fixes:
+    # 1. Use calculated age when available and non-negative
+    # 2. Use error value for negative ages
+    df = df.with_columns(
+        pl.when(pl.col("_calc_age").is_not_null())
+        .then(
+            pl.when(pl.col("_calc_age") < 0)
+            .then(pl.lit(settings.error_val_numeric))
+            .otherwise(pl.col("_calc_age"))
+        )
+        .otherwise(pl.col("age"))
+        .alias("age")
+    )
+
+    # Drop temporary column
+    df = df.drop("_calc_age")
+
+    if ages_fixed > 0 or ages_missing > 0 or ages_negative > 0:
+        logger.info(
+            f"Age fixes applied: {ages_fixed} corrected, "
+            f"{ages_missing} filled from DOB, "
+            f"{ages_negative} negative (set to error)"
+        )
+
+    return df
+
+
+def _fix_t1d_diagnosis_age(df: pl.DataFrame) -> pl.DataFrame:
+    """Calculate t1d_diagnosis_age from dob and t1d_diagnosis_date.
+
+    If both dates are valid (not null, not error date), calculates age at diagnosis.
+    If either date is missing or is error date, result is null.
+
+    Args:
+        df: DataFrame with dob, t1d_diagnosis_date, t1d_diagnosis_age columns
+
+    Returns:
+        DataFrame with calculated t1d_diagnosis_age
+    """
+    required_cols = ["dob", "t1d_diagnosis_date", "t1d_diagnosis_age"]
+    if not all(col in df.columns for col in required_cols):
+        return df
+
+    error_date = pl.lit(settings.error_val_date).str.to_date()
+
+    # Only calculate if both dates are valid (not null, not error date)
+    valid_dob = pl.col("dob").is_not_null() & (pl.col("dob") != error_date)
+    valid_diagnosis = pl.col("t1d_diagnosis_date").is_not_null() & (
+        pl.col("t1d_diagnosis_date") != error_date
+    )
+
+    # Calculate age at diagnosis: year(diagnosis_date) - year(dob)
+    # Adjust if birthday hasn't occurred yet in diagnosis year
+    df = df.with_columns(
+        pl.when(valid_dob & valid_diagnosis)
+        .then(
+            pl.col("t1d_diagnosis_date").dt.year()
+            - pl.col("dob").dt.year()
+            - pl.when(pl.col("t1d_diagnosis_date").dt.month() < pl.col("dob").dt.month())
+            .then(1)
+            .otherwise(0)
+        )
+        .otherwise(None)
+        .cast(pl.Int32)
+        .alias("t1d_diagnosis_age")
+    )
+
+    return df
+
+
+def _validate_dates(df: pl.DataFrame, error_collector: ErrorCollector) -> pl.DataFrame:
+    """Validate date columns and replace future dates with error value.
+
+    Dates beyond the tracker year are considered invalid and replaced with
+    the error date value (9999-09-09). This matches R pipeline behavior.
+
+    Args:
+        df: Input DataFrame with date columns
+        error_collector: ErrorCollector for tracking validation errors
+
+    Returns:
+        DataFrame with invalid dates replaced
+    """
+    date_columns = get_date_columns()
+    dates_fixed = 0
+
+    # Get the error date as a date type
+    error_date = pl.lit(settings.error_val_date).str.to_date()
+
+    for col in date_columns:
+        if col not in df.columns:
+            continue
+
+        # Skip tracker_date as it's derived and shouldn't be validated
+        if col == "tracker_date":
+            continue
+
+        # Create a date representing end of tracker year (December 31)
+        # Find invalid dates and log them
+        temp_df = df.with_columns(pl.date(pl.col("tracker_year"), 12, 31).alias("_max_valid_date"))
+
+        invalid_dates = temp_df.filter(
+            pl.col(col).is_not_null() & (pl.col(col) > pl.col("_max_valid_date"))
+        )
+
+        # Log each error
+        for row in invalid_dates.iter_rows(named=True):
+            patient_id = row.get("patient_id", "UNKNOWN")
+            file_name = row.get("file_name", "UNKNOWN")
+            original_date = row.get(col)
+            tracker_year = row.get("tracker_year")
+
+            logger.warning(
+                f"Patient {patient_id}: {col} = {original_date} "
+                f"is beyond tracker year {tracker_year}. "
+                f"Replacing with error date."
+            )
+            error_collector.add_error(
+                file_name=file_name,
+                patient_id=patient_id,
+                column=col,
+                original_value=str(original_date),
+                error_message=f"Date {original_date} is beyond tracker year {tracker_year}",
+                error_code="invalid_value",
+                function_name="_validate_dates",
+            )
+            dates_fixed += 1
+
+        # Replace invalid dates with error date (using inline expression)
+        df = temp_df.with_columns(
+            pl.when(pl.col(col).is_not_null() & (pl.col(col) > pl.col("_max_valid_date")))
+            .then(error_date)
+            .otherwise(pl.col(col))
+            .alias(col)
+        ).drop("_max_valid_date")
+
+    if dates_fixed > 0:
+        logger.info(f"Date validation: {dates_fixed} future dates replaced with error value")
+
+    return df
+
+
+def _add_tracker_date(df: pl.DataFrame) -> pl.DataFrame:
+    """Create tracker_date from tracker_year and tracker_month.
+
+    Args:
+        df: Input DataFrame
+
+    Returns:
+        DataFrame with tracker_date column
+    """
+    if "tracker_year" in df.columns and "tracker_month" in df.columns:
+        # Parse year-month to date (first day of month)
+        # Cast to string first since they're now Int32
+        df = df.with_columns(
+            pl.concat_str(
+                [
+                    pl.col("tracker_year").cast(pl.String),
+                    pl.lit("-"),
+                    pl.col("tracker_month").cast(pl.String),
+                    pl.lit("-01"),
+                ]
+            )
+            .str.to_date("%Y-%m-%d")
+            .alias("tracker_date")
+        )
+
+    return df
+
+
+def clean_patient_file(
+    raw_parquet_path: Path,
+    output_parquet_path: Path,
+    error_collector: ErrorCollector | None = None,
+) -> None:
+    """Clean a single patient data parquet file.
+
+    This is the main entry point for cleaning a tracker file.
+
+    Args:
+        raw_parquet_path: Path to raw patient parquet (from extraction)
+        output_parquet_path: Path to write cleaned parquet
+        error_collector: Optional ErrorCollector (creates new one if not provided)
+
+    Example:
+        >>> from pathlib import Path
+        >>> raw_path = Path("output/patient_data_raw/2024_Hospital_patient_raw.parquet")
+        >>> clean_path = Path("output/patient_data_clean/2024_Hospital_patient_clean.parquet")
+        >>> clean_patient_file(raw_path, clean_path)
+    """
+    if error_collector is None:
+        error_collector = ErrorCollector()
+
+    logger.info(f"Cleaning patient file: {raw_parquet_path}")
+
+    # Read raw parquet
+    df_raw = pl.read_parquet(raw_parquet_path)
+
+    # Clean data
+    df_clean = clean_patient_data(df_raw, error_collector)
+
+    # Create output directory if needed
+    output_parquet_path.parent.mkdir(parents=True, exist_ok=True)
+
+    # Write cleaned parquet
+    df_clean.write_parquet(output_parquet_path)
+
+    logger.info(f"Cleaned patient file written: {output_parquet_path}")
+    logger.info(f"Total errors: {len(error_collector)}")
diff --git a/a4d-python/src/a4d/clean/schema.py b/a4d-python/src/a4d/clean/schema.py
new file mode 100644
index 0000000..f767550
--- /dev/null
+++ b/a4d-python/src/a4d/clean/schema.py
@@ -0,0 +1,159 @@
+"""Meta schema definition for patient data - matches R pipeline exactly."""
+
+
+import polars as pl
+
+
+def get_patient_data_schema() -> dict[str, pl.DataType]:
+    """Get the complete meta schema for patient data.
+
+    This schema EXACTLY matches the R pipeline's schema in script2_process_patient_data.R.
+    Column order matches R's alphabetical order.
+
+    Returns:
+        Dictionary mapping column names to Polars data types
+    """
+    return {
+        "age": pl.Int32,  # integer() in R
+        "analog_insulin_long_acting": pl.String,  # character() in R
+        "analog_insulin_rapid_acting": pl.String,
+        "blood_pressure_dias_mmhg": pl.Int32,
+        "blood_pressure_sys_mmhg": pl.Int32,
+        "blood_pressure_updated": pl.Date,
+        "bmi": pl.Float64,  # numeric() in R
+        "bmi_date": pl.Date,
+        "clinic_id": pl.String,
+        "clinic_visit": pl.String,
+        "complication_screening_eye_exam_date": pl.Date,
+        "complication_screening_eye_exam_value": pl.String,
+        "complication_screening_foot_exam_date": pl.Date,
+        "complication_screening_foot_exam_value": pl.String,
+        "complication_screening_kidney_test_date": pl.Date,
+        "complication_screening_kidney_test_value": pl.String,
+        "complication_screening_lipid_profile_cholesterol_value": pl.String,
+        "complication_screening_lipid_profile_date": pl.Date,
+        "complication_screening_lipid_profile_hdl_mmol_value": pl.Float64,
+        "complication_screening_lipid_profile_hdl_mg_value": pl.Float64,
+        "complication_screening_lipid_profile_ldl_mmol_value": pl.Float64,
+        "complication_screening_lipid_profile_ldl_mg_value": pl.Float64,
+        "complication_screening_lipid_profile_triglycerides_value": pl.Float64,
+        "complication_screening_remarks": pl.String,
+        "complication_screening_thyroid_test_date": pl.Date,
+        "complication_screening_thyroid_test_ft4_pmol_value": pl.Float64,
+        "complication_screening_thyroid_test_ft4_ng_value": pl.Float64,
+        "complication_screening_thyroid_test_tsh_value": pl.Float64,
+        "dm_complication_eye": pl.String,
+        "dm_complication_kidney": pl.String,
+        "dm_complication_others": pl.String,
+        "dm_complication_remarks": pl.String,
+        "dob": pl.Date,
+        "edu_occ": pl.String,
+        "edu_occ_updated": pl.Date,
+        "family_history": pl.String,
+        "fbg_baseline_mg": pl.Float64,
+        "fbg_baseline_mmol": pl.Float64,
+        "fbg_updated_date": pl.Date,
+        "fbg_updated_mg": pl.Float64,
+        "fbg_updated_mmol": pl.Float64,
+        "file_name": pl.String,
+        "hba1c_baseline": pl.Float64,
+        "hba1c_baseline_exceeds": pl.Boolean,  # logical() in R
+        "hba1c_updated": pl.Float64,
+        "hba1c_updated_exceeds": pl.Boolean,
+        "hba1c_updated_date": pl.Date,
+        "height": pl.Float64,
+        "hospitalisation_cause": pl.String,
+        "hospitalisation_date": pl.Date,
+        "human_insulin_intermediate_acting": pl.String,
+        "human_insulin_pre_mixed": pl.String,
+        "human_insulin_short_acting": pl.String,
+        "insulin_injections": pl.Float64,
+        "insulin_regimen": pl.String,
+        "insulin_total_units": pl.Float64,
+        "insulin_type": pl.String,
+        "insulin_subtype": pl.String,
+        "last_clinic_visit_date": pl.Date,
+        "last_remote_followup_date": pl.Date,
+        "lost_date": pl.Date,
+        "name": pl.String,
+        "observations": pl.String,
+        "observations_category": pl.String,
+        "other_issues": pl.String,
+        "patient_consent": pl.String,
+        "patient_id": pl.String,
+        "province": pl.String,
+        "recruitment_date": pl.Date,
+        "remote_followup": pl.String,
+        "sex": pl.String,
+        "sheet_name": pl.String,
+        "status": pl.String,
+        "status_out": pl.String,
+        "support_level": pl.String,
+        "t1d_diagnosis_age": pl.Int32,
+        "t1d_diagnosis_date": pl.Date,
+        "t1d_diagnosis_with_dka": pl.String,
+        "testing_frequency": pl.Int32,
+        "tracker_date": pl.Date,
+        "tracker_month": pl.Int32,
+        "tracker_year": pl.Int32,
+        "weight": pl.Float64,
+    }
+
+
+def apply_schema(df: pl.DataFrame) -> pl.DataFrame:
+    """Apply the meta schema to a DataFrame.
+
+    This function:
+    1. Adds missing columns with NULL values
+    2. Casts existing columns to target types (if they exist)
+    3. Reorders columns to match schema order
+    4. Returns a DataFrame with the exact schema
+
+    Args:
+        df: Input DataFrame (may be missing columns)
+
+    Returns:
+        DataFrame with complete schema applied
+    """
+    schema = get_patient_data_schema()
+
+    # Start with existing columns
+    df_result = df
+
+    # Add missing columns with NULL values
+    missing_cols = set(schema.keys()) - set(df.columns)
+    for col in missing_cols:
+        df_result = df_result.with_columns(pl.lit(None, dtype=schema[col]).alias(col))
+
+    # Reorder columns to match schema order
+    df_result = df_result.select(list(schema.keys()))
+
+    return df_result
+
+
+def get_numeric_columns() -> list[str]:
+    """Get list of numeric columns from schema."""
+    schema = get_patient_data_schema()
+    return [
+        col
+        for col, dtype in schema.items()
+        if dtype in (pl.Int32, pl.Int64, pl.Float32, pl.Float64)
+    ]
+
+
+def get_date_columns() -> list[str]:
+    """Get list of date columns from schema."""
+    schema = get_patient_data_schema()
+    return [col for col, dtype in schema.items() if dtype == pl.Date]
+
+
+def get_boolean_columns() -> list[str]:
+    """Get list of boolean columns from schema."""
+    schema = get_patient_data_schema()
+    return [col for col, dtype in schema.items() if dtype == pl.Boolean]
+
+
+def get_string_columns() -> list[str]:
+    """Get list of string columns from schema."""
+    schema = get_patient_data_schema()
+    return [col for col, dtype in schema.items() if dtype == pl.String]
diff --git a/a4d-python/src/a4d/clean/schema_old.py b/a4d-python/src/a4d/clean/schema_old.py
new file mode 100644
index 0000000..6d91d28
--- /dev/null
+++ b/a4d-python/src/a4d/clean/schema_old.py
@@ -0,0 +1,202 @@
+"""Meta schema definition for patient data.
+
+This module defines the complete target schema for the patient_data table.
+All cleaned patient data will conform to this schema, with missing columns
+filled with NULL values.
+
+This mirrors the R pipeline's meta schema approach (script2_process_patient_data.R)
+where a complete schema is defined upfront, and only columns that exist in the
+raw data are processed - the rest are left empty.
+"""
+
+
+import polars as pl
+
+
+def get_patient_data_schema() -> dict[str, pl.DataType]:
+    """Get the complete meta schema for patient data.
+
+    This schema defines ALL columns that should exist in the final
+    patient_data table, along with their target data types.
+
+    Returns:
+        Dictionary mapping column names to Polars data types
+
+    Note:
+        - Not all columns will exist in every tracker file
+        - Missing columns will be filled with NULL
+        - All columns in output will match this schema exactly
+    """
+    return {
+        # Metadata columns (always present from extraction)
+        "file_name": pl.String,
+        "clinic_id": pl.String,
+        "tracker_year": pl.Int32,
+        "tracker_month": pl.Int32,
+        "sheet_name": pl.String,
+        "patient_id": pl.String,
+        "tracker_date": pl.Date,
+        # Patient demographics
+        "name": pl.String,
+        "age": pl.Int32,
+        "dob": pl.Date,
+        "sex": pl.String,
+        "province": pl.String,
+        "edu_occ": pl.String,
+        "edu_occ_updated": pl.Date,
+        "family_history": pl.String,
+        # Patient status
+        "status": pl.String,
+        "status_out": pl.String,
+        "patient_consent": pl.String,
+        "recruitment_date": pl.Date,
+        "lost_date": pl.Date,
+        # Diagnosis
+        "t1d_diagnosis_date": pl.Date,
+        "t1d_diagnosis_age": pl.Int32,
+        "t1d_diagnosis_with_dka": pl.String,
+        # Physical measurements
+        "height": pl.Float64,
+        "weight": pl.Float64,
+        "bmi": pl.Float64,
+        "bmi_date": pl.Date,
+        # Blood pressure
+        "blood_pressure_sys_mmhg": pl.Int32,
+        "blood_pressure_dias_mmhg": pl.Int32,
+        "blood_pressure_updated": pl.Date,
+        # HbA1c
+        "hba1c_baseline": pl.Float64,
+        "hba1c_baseline_exceeds": pl.Boolean,
+        "hba1c_updated": pl.Float64,
+        "hba1c_updated_exceeds": pl.Boolean,
+        "hba1c_updated_date": pl.Date,
+        # FBG (Fasting Blood Glucose)
+        "fbg_baseline_mg": pl.Float64,
+        "fbg_baseline_mmol": pl.Float64,
+        "fbg_updated_mg": pl.Float64,
+        "fbg_updated_mmol": pl.Float64,
+        "fbg_updated_date": pl.Date,
+        # Testing
+        "testing_frequency": pl.Int32,
+        # Insulin type and regimen
+        "insulin_type": pl.String,
+        "insulin_subtype": pl.String,
+        "insulin_regimen": pl.String,
+        "insulin_injections": pl.Float64,
+        "insulin_total_units": pl.Float64,
+        # Human insulin (2024+ trackers)
+        "human_insulin_pre_mixed": pl.String,
+        "human_insulin_short_acting": pl.String,
+        "human_insulin_intermediate_acting": pl.String,
+        # Analog insulin (2024+ trackers)
+        "analog_insulin_rapid_acting": pl.String,
+        "analog_insulin_long_acting": pl.String,
+        # Support
+        "support_level": pl.String,
+        # Clinic visits
+        "clinic_visit": pl.String,
+        "last_clinic_visit_date": pl.Date,
+        "remote_followup": pl.String,
+        "last_remote_followup_date": pl.Date,
+        # Hospitalisation
+        "hospitalisation_cause": pl.String,
+        "hospitalisation_date": pl.Date,
+        # DM Complications
+        "dm_complication_eye": pl.String,
+        "dm_complication_kidney": pl.String,
+        "dm_complication_others": pl.String,
+        "dm_complication_remarks": pl.String,
+        # Complication screening - Eye
+        "complication_screening_eye_exam_date": pl.Date,
+        "complication_screening_eye_exam_value": pl.String,
+        # Complication screening - Foot
+        "complication_screening_foot_exam_date": pl.Date,
+        "complication_screening_foot_exam_value": pl.String,
+        # Complication screening - Kidney
+        "complication_screening_kidney_test_date": pl.Date,
+        "complication_screening_kidney_test_value": pl.String,
+        # Complication screening - Lipid profile
+        "complication_screening_lipid_profile_date": pl.Date,
+        "complication_screening_lipid_profile_cholesterol_value": pl.String,
+        "complication_screening_lipid_profile_hdl_mmol_value": pl.Float64,
+        "complication_screening_lipid_profile_hdl_mg_value": pl.Float64,
+        "complication_screening_lipid_profile_ldl_mmol_value": pl.Float64,
+        "complication_screening_lipid_profile_ldl_mg_value": pl.Float64,
+        "complication_screening_lipid_profile_triglycerides_value": pl.Float64,
+        # Complication screening - Thyroid
+        "complication_screening_thyroid_test_date": pl.Date,
+        "complication_screening_thyroid_test_tsh_value": pl.Float64,
+        "complication_screening_thyroid_test_ft4_pmol_value": pl.Float64,
+        "complication_screening_thyroid_test_ft4_ng_value": pl.Float64,
+        # Complication screening - General
+        "complication_screening_remarks": pl.String,
+        # Other
+        "other_issues": pl.String,
+        # Observations
+        "observations_category": pl.String,
+        "observations": pl.String,
+    }
+
+
+def apply_schema(df: pl.DataFrame) -> pl.DataFrame:
+    """Apply the meta schema to a DataFrame.
+
+    This function:
+    1. Adds missing columns with NULL values
+    2. Casts existing columns to target types (if they exist)
+    3. Reorders columns to match schema order
+    4. Returns a DataFrame with the exact schema
+
+    Args:
+        df: Input DataFrame (may be missing columns)
+
+    Returns:
+        DataFrame with complete schema applied
+
+    Example:
+        >>> schema = get_patient_data_schema()
+        >>> df_clean = apply_schema(df_raw)
+        >>> # Now df_clean has ALL schema columns, missing ones are NULL
+    """
+    schema = get_patient_data_schema()
+
+    # Start with existing columns
+    df_result = df
+
+    # Add missing columns with NULL values
+    missing_cols = set(schema.keys()) - set(df.columns)
+    for col in missing_cols:
+        df_result = df_result.with_columns(pl.lit(None, dtype=schema[col]).alias(col))
+
+    # Reorder columns to match schema order
+    df_result = df_result.select(list(schema.keys()))
+
+    return df_result
+
+
+def get_numeric_columns() -> list[str]:
+    """Get list of numeric columns from schema."""
+    schema = get_patient_data_schema()
+    return [
+        col
+        for col, dtype in schema.items()
+        if dtype in (pl.Int32, pl.Int64, pl.Float32, pl.Float64)
+    ]
+
+
+def get_date_columns() -> list[str]:
+    """Get list of date columns from schema."""
+    schema = get_patient_data_schema()
+    return [col for col, dtype in schema.items() if dtype == pl.Date]
+
+
+def get_boolean_columns() -> list[str]:
+    """Get list of boolean columns from schema."""
+    schema = get_patient_data_schema()
+    return [col for col, dtype in schema.items() if dtype == pl.Boolean]
+
+
+def get_string_columns() -> list[str]:
+    """Get list of string columns from schema."""
+    schema = get_patient_data_schema()
+    return [col for col, dtype in schema.items() if dtype == pl.String]
diff --git a/a4d-python/src/a4d/clean/transformers.py b/a4d-python/src/a4d/clean/transformers.py
new file mode 100644
index 0000000..b952023
--- /dev/null
+++ b/a4d-python/src/a4d/clean/transformers.py
@@ -0,0 +1,388 @@
+"""Data transformation functions for cleaning.
+
+This module provides transformation functions that are applied before validation.
+These functions standardize values, fix legacy formats, and normalize data.
+
+Transformations are referenced in reference_data/data_cleaning.yaml with
+type: basic_function.
+"""
+
+
+import polars as pl
+
+from a4d.config import settings
+
+
+def extract_regimen(df: pl.DataFrame, column: str = "insulin_regimen") -> pl.DataFrame:
+    """Extract and standardize insulin regimen values.
+
+    This function applies regex pattern matching to standardize insulin regimen
+    descriptions into canonical forms. Matches are case-insensitive.
+
+    Transformations:
+    - Contains "basal" → "Basal-bolus (MDI)"
+    - Contains "premixed" → "Premixed 30/70 BD"
+    - Contains "self-mixed" → "Self-mixed BD"
+    - Contains "conventional" → "Modified conventional TID"
+
+    Args:
+        df: Input DataFrame
+        column: Column name to transform (default: "insulin_regimen")
+
+    Returns:
+        DataFrame with standardized insulin regimen values
+
+    Example:
+        >>> df = extract_regimen(df)
+        >>> # "Basal-bolus" → "Basal-bolus (MDI)"
+        >>> # "PREMIXED 30/70" → "Premixed 30/70 BD"
+    """
+    if column not in df.columns:
+        return df
+
+    # Apply regex transformations in order (matching R's behavior)
+    df = df.with_columns(
+        pl.col(column)
+        .str.to_lowercase()
+        .str.replace(r"^.*basal.*$", "Basal-bolus (MDI)")
+        .str.replace(r"^.*premixed.*$", "Premixed 30/70 BD")
+        .str.replace(r"^.*self-mixed.*$", "Self-mixed BD")
+        .str.replace(r"^.*conventional.*$", "Modified conventional TID")
+        .alias(column)
+    )
+
+    return df
+
+
+def fix_sex(df: pl.DataFrame, column: str = "sex") -> pl.DataFrame:
+    """Map sex synonyms to canonical values (M/F) or error value.
+
+    Matches R's fix_sex() function behavior:
+    - Female synonyms: female, girl, woman, fem, feminine, f → "F"
+    - Male synonyms: male, boy, man, masculine, m → "M"
+    - Anything else → "Undefined" (error value)
+
+    Args:
+        df: Input DataFrame
+        column: Column name to transform (default: "sex")
+
+    Returns:
+        DataFrame with sex values normalized to M/F or Undefined
+
+    Example:
+        >>> df = fix_sex(df)
+        >>> # "Female" → "F"
+        >>> # "MALE" → "M"
+        >>> # "invalid" → "Undefined"
+    """
+    if column not in df.columns:
+        return df
+
+    # Define synonyms matching R's fix_sex function
+    synonyms_female = ["female", "girl", "woman", "fem", "feminine", "f"]
+    synonyms_male = ["male", "boy", "man", "masculine", "m"]
+
+    # Build expression using pl.when().then().when().then()... chain
+    # Start with null/empty handling
+    expr = pl.when(pl.col(column).is_null() | (pl.col(column) == "")).then(None)
+
+    # Add female synonyms
+    for synonym in synonyms_female:
+        expr = expr.when(pl.col(column).str.to_lowercase() == synonym).then(pl.lit("F"))
+
+    # Add male synonyms
+    for synonym in synonyms_male:
+        expr = expr.when(pl.col(column).str.to_lowercase() == synonym).then(pl.lit("M"))
+
+    # Default: anything else becomes Undefined
+    expr = expr.otherwise(pl.lit(settings.error_val_character))
+
+    df = df.with_columns(expr.alias(column))
+
+    return df
+
+
+def fix_bmi(df: pl.DataFrame) -> pl.DataFrame:
+    """Calculate BMI from weight and height.
+
+    Matches R's fix_bmi() function behavior:
+    - If weight or height is null → BMI becomes null
+    - If weight or height is error value → BMI becomes error value
+    - Otherwise: BMI = weight / height^2
+
+    Height is converted from cm to m if > 50 (R's transform_cm_to_m threshold).
+    This ensures correct BMI regardless of whether height is in cm or m.
+
+    This calculation REPLACES any existing BMI value, matching R's behavior.
+
+    Args:
+        df: Input DataFrame (must have weight and height columns)
+
+    Returns:
+        DataFrame with calculated BMI column
+
+    Example:
+        >>> df = fix_bmi(df)
+        >>> # weight=70, height=1.75 → bmi=22.86
+        >>> # weight=30.7, height=135.5 (cm) → height_m=1.355, bmi=16.72
+    """
+    if "weight" not in df.columns or "height" not in df.columns:
+        return df
+
+    # Convert height from cm to m if > 50 (R's transform_cm_to_m threshold)
+    height_m = (
+        pl.when(pl.col("height") > 50)
+        .then(pl.col("height") / 100.0)
+        .otherwise(pl.col("height"))
+    )
+
+    # Calculate BMI: weight / height^2
+    # Match R's case_when logic exactly
+    df = df.with_columns(
+        pl.when(pl.col("weight").is_null() | pl.col("height").is_null())
+        .then(None)
+        .when(
+            (pl.col("weight") == settings.error_val_numeric)
+            | (pl.col("height") == settings.error_val_numeric)
+        )
+        .then(pl.lit(settings.error_val_numeric))
+        .otherwise(pl.col("weight") / height_m.pow(2))
+        .alias("bmi")
+    )
+
+    return df
+
+
+def str_to_lower(df: pl.DataFrame, column: str) -> pl.DataFrame:
+    """Convert column values to lowercase.
+
+    This is used for case-insensitive validation. For example, the "status"
+    column may have mixed case values like "Active", "ACTIVE", "active" which
+    should all be normalized to lowercase before validation.
+
+    Args:
+        df: Input DataFrame
+        column: Column name to transform
+
+    Returns:
+        DataFrame with lowercase column values
+
+    Example:
+        >>> df = str_to_lower(df, "status")
+        >>> # "ACTIVE" → "active"
+        >>> # "Inactive" → "inactive"
+    """
+    if column not in df.columns:
+        return df
+
+    df = df.with_columns(pl.col(column).str.to_lowercase().alias(column))
+
+    return df
+
+
+def apply_transformation(
+    df: pl.DataFrame,
+    column: str,
+    function_name: str,
+) -> pl.DataFrame:
+    """Apply a named transformation function to a column.
+
+    This is the dispatcher function that maps function names from
+    data_cleaning.yaml to actual transformation functions.
+
+    Args:
+        df: Input DataFrame
+        column: Column name to transform
+        function_name: Name of transformation function (from YAML)
+
+    Returns:
+        DataFrame with transformation applied
+
+    Raises:
+        ValueError: If function_name is not recognized
+
+    Example:
+        >>> df = apply_transformation(df, "status", "stringr::str_to_lower")
+        >>> df = apply_transformation(df, "insulin_regimen", "extract_regimen")
+    """
+    # Map R function names to Python implementations
+    function_mapping = {
+        "extract_regimen": lambda df, col: extract_regimen(df, col),
+        "stringr::str_to_lower": lambda df, col: str_to_lower(df, col),
+        "str_to_lower": lambda df, col: str_to_lower(df, col),
+    }
+
+    if function_name not in function_mapping:
+        raise ValueError(f"Unknown transformation function: {function_name}")
+
+    return function_mapping[function_name](df, column)
+
+
+def correct_decimal_sign_multiple(
+    df: pl.DataFrame,
+    columns: list[str],
+) -> pl.DataFrame:
+    """Replace comma decimal separator with dot for multiple columns.
+
+    Some trackers use European decimal format (1,5 instead of 1.5).
+    This function fixes that for multiple numeric columns.
+
+    Args:
+        df: Input DataFrame
+        columns: List of column names to correct
+
+    Returns:
+        DataFrame with corrected decimal signs
+
+    Example:
+        >>> df = correct_decimal_sign_multiple(df, ["weight", "height", "hba1c"])
+    """
+    from a4d.clean.converters import correct_decimal_sign
+
+    for column in columns:
+        df = correct_decimal_sign(df, column)
+
+    return df
+
+
+def replace_range_with_mean(x: str) -> float:
+    """Calculate mean of a range string.
+
+    Matches R's replace_range_with_mean() function behavior.
+    Splits string on "-", converts parts to numeric, returns mean.
+
+    Args:
+        x: Range string (e.g., "0-2", "2-3")
+
+    Returns:
+        Mean of the range values
+
+    Example:
+        >>> replace_range_with_mean("0-2")
+        1.0
+        >>> replace_range_with_mean("2-3")
+        2.5
+    """
+    parts = x.split("-")
+    numbers = [float(p) for p in parts]
+    return sum(numbers) / len(numbers)
+
+
+def fix_testing_frequency(df: pl.DataFrame) -> pl.DataFrame:
+    """Fix testing_frequency column by replacing ranges with mean values.
+
+    Matches R's fix_testing_frequency() function behavior:
+    - Replaces ranges like "0-2" with mean "1"
+    - Preserves null and empty values as null
+    - Logs warning when ranges are detected
+
+    Args:
+        df: Input DataFrame
+
+    Returns:
+        DataFrame with testing_frequency ranges replaced by mean values
+
+    Example:
+        >>> df = fix_testing_frequency(df)
+        >>> # "0-2" → "1"
+        >>> # "2-3" → "2.5"
+        >>> # "2" → "2" (unchanged)
+    """
+    if "testing_frequency" not in df.columns:
+        return df
+
+    from loguru import logger
+
+    # Track if we logged warnings
+    has_ranges = False
+
+    def fix_value(value: str | None) -> str | None:
+        """Fix a single testing_frequency value."""
+        nonlocal has_ranges
+
+        if value is None or value == "":
+            return None
+
+        if "-" in value:
+            has_ranges = True
+
+            try:
+                mean_value = replace_range_with_mean(value)
+                # Return as string, remove trailing .0 for whole numbers
+                if mean_value == int(mean_value):
+                    return str(int(mean_value))
+                return str(mean_value)
+            except Exception:
+                # If replacement fails, return None
+                return None
+
+        return value
+
+    # Apply transformation
+    df = df.with_columns(
+        pl.col("testing_frequency")
+        .map_elements(fix_value, return_dtype=pl.String)
+        .alias("testing_frequency")
+    )
+
+    # Log warning if any ranges were found
+    if has_ranges:
+        logger.warning("Found ranges in testing_frequency column. Replacing with mean values.")
+
+    return df
+
+
+def split_bp_in_sys_and_dias(df: pl.DataFrame) -> pl.DataFrame:
+    """Split blood_pressure_mmhg into systolic and diastolic columns.
+
+    Matches R's split_bp_in_sys_and_dias() function behavior:
+    - Splits "120/80" format into two columns
+    - Invalid formats (without "/") are replaced with error value
+    - Logs warning for invalid values
+
+    Args:
+        df: Input DataFrame with blood_pressure_mmhg column
+
+    Returns:
+        DataFrame with blood_pressure_sys_mmhg and blood_pressure_dias_mmhg columns
+
+    Example:
+        >>> df = split_bp_in_sys_and_dias(df)
+        >>> # "96/55" → sys="96", dias="55"
+        >>> # "96" → sys="999999", dias="999999" (invalid)
+    """
+    if "blood_pressure_mmhg" not in df.columns:
+        return df
+
+    from loguru import logger
+
+    # First, replace invalid values (those without "/") with error format
+    error_val_int = int(settings.error_val_numeric)
+    df = df.with_columns(
+        pl.when(~pl.col("blood_pressure_mmhg").str.contains("/", literal=True))
+        .then(pl.lit(f"{error_val_int}/{error_val_int}"))
+        .otherwise(pl.col("blood_pressure_mmhg"))
+        .alias("blood_pressure_mmhg")
+    )
+
+    # Check if any invalid values were found
+    error_pattern = f"{error_val_int}/{error_val_int}"
+    has_errors = df.filter(pl.col("blood_pressure_mmhg") == error_pattern).height > 0
+
+    if has_errors:
+        logger.warning(
+            "Found invalid values for column blood_pressure_mmhg "
+            f"that do not follow the format X/Y. "
+            f"Values were replaced with {error_val_int}."
+        )
+
+    # Split the column
+    df = df.with_columns(
+        pl.col("blood_pressure_mmhg").str.split("/").list.get(0).alias("blood_pressure_sys_mmhg"),
+        pl.col("blood_pressure_mmhg").str.split("/").list.get(1).alias("blood_pressure_dias_mmhg"),
+    )
+
+    # Drop the original combined column
+    df = df.drop("blood_pressure_mmhg")
+
+    return df
diff --git a/a4d-python/src/a4d/clean/validators.py b/a4d-python/src/a4d/clean/validators.py
new file mode 100644
index 0000000..f279d52
--- /dev/null
+++ b/a4d-python/src/a4d/clean/validators.py
@@ -0,0 +1,423 @@
+"""Schema and validation utilities for data cleaning.
+
+This module provides functions for validating DataFrame columns against
+allowed values defined in reference_data/validation_rules.yaml.
+
+The validation pattern is:
+1. Load validation rules from YAML
+2. Check column values against allowed values
+3. Log invalid values to ErrorCollector
+4. Replace invalid values with error value (if configured)
+
+Note: Data transformations are NOT in the YAML - they are hardcoded in
+transformers.py for better type safety and maintainability.
+"""
+
+import re
+from typing import Any
+
+import polars as pl
+
+from a4d.config import settings
+from a4d.errors import ErrorCollector
+from a4d.reference.loaders import get_reference_data_path, load_yaml
+
+
+def sanitize_str(text: str) -> str:
+    """Sanitize string for case-insensitive matching.
+
+    Matches R's sanitize_str function:
+    1. Convert to lowercase
+    2. Remove spaces
+    3. Remove special characters (keep only alphanumeric)
+
+    Args:
+        text: String to sanitize
+
+    Returns:
+        Sanitized string
+
+    Example:
+        >>> sanitize_str("Active - Remote")
+        'activeremote'
+        >>> sanitize_str("Lost Follow Up")
+        'lostfollowup'
+    """
+    if not isinstance(text, str):
+        return text
+    return re.sub(r"[^a-z0-9]", "", text.lower())
+
+
+def load_validation_rules() -> dict[str, Any]:
+    """Load validation rules from validation_rules.yaml.
+
+    Returns:
+        Dictionary mapping column names to their validation rules.
+        Structure: {column_name: {allowed_values: [...], replace_invalid: bool}}
+
+    Example:
+        >>> rules = load_validation_rules()
+        >>> rules["status"]["allowed_values"]
+        ['active', 'inactive', ...]
+        >>> rules["status"]["replace_invalid"]
+        True
+    """
+    yaml_path = get_reference_data_path("validation_rules.yaml")
+    return load_yaml(yaml_path)
+
+
+def validate_allowed_values(
+    df: pl.DataFrame,
+    column: str,
+    allowed_values: list[str],
+    error_collector: ErrorCollector,
+    replace_invalid: bool = True,
+    file_name_col: str = "file_name",
+    patient_id_col: str = "patient_id",
+) -> pl.DataFrame:
+    """Validate column against allowed values with case-insensitive matching.
+
+    Matches R's validation behavior:
+    1. Sanitize both input values and allowed values for matching
+    2. If matched, replace with canonical value from allowed_values
+    3. If not matched, replace with error value (if replace_invalid=True)
+
+    Args:
+        df: Input DataFrame
+        column: Column name to validate
+        allowed_values: List of canonical allowed values (e.g., ["Active", "Inactive"])
+        error_collector: ErrorCollector instance to track violations
+        replace_invalid: If True, replace invalid values with error value
+        file_name_col: Column containing file name for error tracking
+        patient_id_col: Column containing patient ID for error tracking
+
+    Returns:
+        DataFrame with values normalized to canonical form or replaced
+
+    Example:
+        >>> collector = ErrorCollector()
+        >>> df = validate_allowed_values(
+        ...     df=df,
+        ...     column="status",
+        ...     allowed_values=["Active", "Inactive"],  # Canonical forms
+        ...     error_collector=collector,
+        ... )
+        >>> # "active", "ACTIVE", "Active" all become "Active"
+    """
+    if column not in df.columns:
+        return df
+
+    # Create mapping: {sanitized → canonical} like R does
+    # E.g., {"active": "Active", "activeremote": "Active - Remote"}
+    canonical_mapping = {sanitize_str(val): val for val in allowed_values}
+
+    # Get unique non-null values from the column
+    col_values = df.filter(pl.col(column).is_not_null()).select(column).unique()
+
+    # Track which values need replacement and their canonical forms
+    value_replacements = {}  # {original → canonical or error_value}
+
+    for row in col_values.iter_rows(named=True):
+        original_val = row[column]
+
+        # Skip if already the error value
+        if original_val == settings.error_val_character:
+            value_replacements[original_val] = original_val
+            continue
+
+        # Sanitize and lookup
+        sanitized = sanitize_str(original_val)
+
+        if sanitized in canonical_mapping:
+            # Valid - replace with canonical value
+            value_replacements[original_val] = canonical_mapping[sanitized]
+        else:
+            # Invalid - log error
+            error_collector.add_error(
+                file_name="unknown",  # Will be filled in bulk operations
+                patient_id="unknown",
+                column=column,
+                original_value=original_val,
+                error_message=f"Value '{original_val}' not in allowed values: {allowed_values}",
+                error_code="invalid_value",
+                function_name="validate_allowed_values",
+            )
+
+            if replace_invalid:
+                value_replacements[original_val] = settings.error_val_character
+            else:
+                value_replacements[original_val] = original_val
+
+    # Apply all replacements at once using pl.when().then() chain
+    # This ensures we replace with canonical values even if they match
+    if value_replacements:
+        expr = pl.col(column)
+        for original, replacement in value_replacements.items():
+            expr = pl.when(pl.col(column) == original).then(pl.lit(replacement)).otherwise(expr)
+
+        df = df.with_columns(expr.alias(column))
+
+    return df
+
+
+def validate_column_from_rules(
+    df: pl.DataFrame,
+    column: str,
+    rules: dict[str, Any],
+    error_collector: ErrorCollector,
+    file_name_col: str = "file_name",
+    patient_id_col: str = "patient_id",
+) -> pl.DataFrame:
+    """Validate column using rules from validation_rules.yaml.
+
+    Args:
+        df: Input DataFrame
+        column: Column name to validate
+        rules: Validation rules for this column (from validation_rules.yaml)
+                Structure: {allowed_values: [...], replace_invalid: bool}
+        error_collector: ErrorCollector instance
+        file_name_col: Column containing file name for error tracking
+        patient_id_col: Column containing patient ID for error tracking
+
+    Returns:
+        DataFrame with column validated and cleaned
+
+    Example:
+        >>> rules = load_validation_rules()
+        >>> collector = ErrorCollector()
+        >>> df = validate_column_from_rules(
+        ...     df=df,
+        ...     column="status",
+        ...     rules=rules["status"],
+        ...     error_collector=collector,
+        ... )
+    """
+    if column not in df.columns:
+        return df
+
+    # Extract validation parameters from simplified rules
+    allowed_values = rules.get("allowed_values", [])
+    replace_invalid = rules.get("replace_invalid", True)
+
+    df = validate_allowed_values(
+        df=df,
+        column=column,
+        allowed_values=allowed_values,
+        error_collector=error_collector,
+        replace_invalid=replace_invalid,
+        file_name_col=file_name_col,
+        patient_id_col=patient_id_col,
+    )
+
+    return df
+
+
+def validate_province(
+    df: pl.DataFrame,
+    error_collector: ErrorCollector,
+    file_name_col: str = "file_name",
+    patient_id_col: str = "patient_id",
+) -> pl.DataFrame:
+    """Validate province column against allowed provinces from YAML.
+
+    Uses the shared allowed_provinces.yaml file to validate province values.
+    Matches R's behavior: sanitizes values for comparison and sets invalid
+    provinces to "Undefined".
+
+    Args:
+        df: Input DataFrame
+        error_collector: ErrorCollector instance
+        file_name_col: Column containing file name for error tracking
+        patient_id_col: Column containing patient ID for error tracking
+
+    Returns:
+        DataFrame with province validated
+
+    Example:
+        >>> collector = ErrorCollector()
+        >>> df = validate_province(df, collector)
+    """
+    from a4d.reference.provinces import load_canonical_provinces
+
+    if "province" not in df.columns:
+        return df
+
+    # Load canonical province names (with proper casing) for validation
+    allowed_provinces = load_canonical_provinces()
+
+    # Use generic validator with loaded provinces
+    df = validate_allowed_values(
+        df=df,
+        column="province",
+        allowed_values=allowed_provinces,
+        error_collector=error_collector,
+        replace_invalid=True,
+        file_name_col=file_name_col,
+        patient_id_col=patient_id_col,
+    )
+
+    return df
+
+
+def validate_all_columns(
+    df: pl.DataFrame,
+    error_collector: ErrorCollector,
+    file_name_col: str = "file_name",
+    patient_id_col: str = "patient_id",
+) -> pl.DataFrame:
+    """Validate all columns that have rules in data_cleaning.yaml.
+
+    Args:
+        df: Input DataFrame
+        error_collector: ErrorCollector instance
+        file_name_col: Column containing file name for error tracking
+        patient_id_col: Column containing patient ID for error tracking
+
+    Returns:
+        DataFrame with all columns validated
+
+    Example:
+        >>> collector = ErrorCollector()
+        >>> df_clean = validate_all_columns(df, collector)
+        >>> len(collector)  # Number of validation errors found
+    """
+    rules = load_validation_rules()
+
+    for column, column_rules in rules.items():
+        if column in df.columns:
+            df = validate_column_from_rules(
+                df=df,
+                column=column,
+                rules=column_rules,
+                error_collector=error_collector,
+                file_name_col=file_name_col,
+                patient_id_col=patient_id_col,
+            )
+
+    # Validate province separately (not in validation_rules.yaml)
+    df = validate_province(
+        df=df,
+        error_collector=error_collector,
+        file_name_col=file_name_col,
+        patient_id_col=patient_id_col,
+    )
+
+    # Fix patient_id LAST (other functions use it for logging)
+    df = fix_patient_id(
+        df=df,
+        error_collector=error_collector,
+        patient_id_col=patient_id_col,
+    )
+
+    return df
+
+
+def fix_patient_id(
+    df: pl.DataFrame,
+    error_collector: ErrorCollector,
+    patient_id_col: str = "patient_id",
+) -> pl.DataFrame:
+    """Validate and fix patient ID format.
+
+    Matches R's fix_id() function behavior:
+    - Valid format: XX_YY### (e.g., "KD_EW004")
+      - 2 uppercase letters, underscore, 2 uppercase letters, 3 digits
+    - Normalizes hyphens to underscores: "KD-EW004" → "KD_EW004"
+    - Truncates if > 8 characters: "KD_EW004XY" → "KD_EW004"
+    - Replaces with error value if ≤ 8 chars and invalid format
+
+    This function should be called LAST in the validation pipeline because
+    other functions use patient_id for error logging.
+
+    Args:
+        df: Input DataFrame
+        error_collector: ErrorCollector for tracking validation errors
+        patient_id_col: Column name for patient ID (default: "patient_id")
+
+    Returns:
+        DataFrame with validated/fixed patient IDs
+
+    Example:
+        >>> df = fix_patient_id(df, error_collector)
+        >>> # "KD_EW004" → "KD_EW004" (valid)
+        >>> # "KD-EW004" → "KD_EW004" (normalized)
+        >>> # "KD_EW004XY" → "KD_EW004" (truncated)
+        >>> # "INVALID" → "Other" (replaced)
+    """
+    import re
+
+    from a4d.config import settings
+
+    if patient_id_col not in df.columns:
+        return df
+
+    # Store original values for error reporting
+    original_col = f"{patient_id_col}_original"
+    df = df.with_columns(pl.col(patient_id_col).alias(original_col))
+
+    # Valid format: XX_YY### (2 letters, underscore, 2 letters, 3 digits)
+    valid_pattern = re.compile(r"^[A-Z]{2}_[A-Z]{2}\d{3}$")
+
+    def fix_single_id(patient_id: str | None) -> str | None:
+        """Fix a single patient ID value."""
+        if patient_id is None:
+            return None
+
+        # Step 1: Replace hyphens with underscores
+        patient_id = patient_id.replace("-", "_")
+
+        # Step 2: Check if it matches the valid pattern
+        if valid_pattern.match(patient_id):
+            return patient_id
+
+        # Step 3: Invalid format - either truncate or replace
+        if len(patient_id) > 8:
+            # Truncate to 8 characters
+            return patient_id[:8]
+        else:
+            # Replace with error value
+            return settings.error_val_character
+
+    # Apply transformation
+    df = df.with_columns(
+        pl.col(patient_id_col)
+        .map_elements(fix_single_id, return_dtype=pl.String)
+        .alias(patient_id_col)
+    )
+
+    # Now collect errors for changed values
+    for row in df.iter_rows(named=True):
+        original = row[original_col]
+        fixed = row[patient_id_col]
+
+        if original != fixed and original is not None:
+            # Normalize original to check if it's just hyphen replacement
+            normalized = original.replace("-", "_")
+
+            if normalized != fixed:
+                # Not just normalization - either truncation or replacement
+                if len(original.replace("-", "_")) > 8:
+                    # Truncation
+                    error_collector.add_error(
+                        file_name="",
+                        patient_id=original,
+                        column=patient_id_col,
+                        original_value=original,
+                        error_message="Patient ID truncated (length > 8)",
+                        error_code="invalid_value",
+                    )
+                else:
+                    # Replacement
+                    error_collector.add_error(
+                        file_name="",
+                        patient_id=original,
+                        column=patient_id_col,
+                        original_value=original,
+                        error_message="Invalid patient ID format (expected XX_YY###)",
+                        error_code="invalid_value",
+                    )
+
+    # Drop the temporary column
+    df = df.drop(original_col)
+
+    return df
diff --git a/a4d-python/src/a4d/cli.py b/a4d-python/src/a4d/cli.py
new file mode 100644
index 0000000..6ab7cd7
--- /dev/null
+++ b/a4d-python/src/a4d/cli.py
@@ -0,0 +1,578 @@
+"""Command-line interface for A4D pipeline."""
+
+from pathlib import Path
+from typing import Annotated
+
+import polars as pl
+import typer
+from rich.console import Console
+from rich.table import Table
+
+from a4d.pipeline.patient import process_patient_tables, run_patient_pipeline
+from a4d.tables.logs import create_table_logs
+
+app = typer.Typer(
+    name="a4d", help="A4D medical tracker data processing pipeline", no_args_is_help=True
+)
+
+console = Console()
+
+
+def _display_tables_summary(tables: dict[str, Path]) -> None:
+    """Display summary table of created tables with record counts.
+
+    Args:
+        tables: Dictionary mapping table name to output path
+    """
+    if not tables:
+        return
+
+    console.print("\n[bold green]Created Tables:[/bold green]")
+    tables_table = Table(title="Created Tables")
+    tables_table.add_column("Table", style="cyan")
+    tables_table.add_column("Path", style="green")
+    tables_table.add_column("Records", justify="right", style="magenta")
+
+    # Add patient tables first, then logs table
+    for name in ["static", "monthly", "annual"]:
+        if name in tables:
+            path = tables[name]
+            try:
+                df = pl.read_parquet(path)
+                record_count = f"{len(df):,}"
+            except Exception:
+                record_count = "?"
+            tables_table.add_row(name, str(path.name), record_count)
+
+    # Add logs table last
+    if "logs" in tables:
+        path = tables["logs"]
+        try:
+            df = pl.read_parquet(path)
+            record_count = f"{len(df):,}"
+        except Exception:
+            record_count = "?"
+        tables_table.add_row("logs", str(path.name), record_count)
+
+    console.print(tables_table)
+    console.print()
+
+
+@app.command("process-patient")
+def process_patient_cmd(
+    file: Annotated[
+        Path | None,
+        typer.Option(
+            "--file",
+            "-f",
+            help="Process specific tracker file (if not set, processes all files in data_root)",
+        ),
+    ] = None,
+    workers: Annotated[
+        int, typer.Option("--workers", "-w", help="Number of parallel workers (1 = sequential)")
+    ] = 1,
+    skip_tables: Annotated[
+        bool, typer.Option("--skip-tables", help="Skip table creation (only extract + clean)")
+    ] = False,
+    force: Annotated[
+        bool, typer.Option("--force", help="Force reprocessing (ignore existing outputs)")
+    ] = False,
+    output_root: Annotated[
+        Path | None, typer.Option("--output", "-o", help="Output directory (default: from config)")
+    ] = None,
+):
+    """Process patient data pipeline.
+
+    \b
+    Examples:
+        # Process all trackers in data_root
+        uv run a4d process-patient
+
+        # Process specific file
+        uv run a4d process-patient --file /path/to/tracker.xlsx
+
+        # Parallel processing with 8 workers
+        uv run a4d process-patient --workers 8
+
+        # Just extract + clean, skip tables
+        uv run a4d process-patient --skip-tables
+    """
+    console.print("\n[bold blue]A4D Patient Pipeline[/bold blue]\n")
+
+    # Prepare tracker files list
+    tracker_files = [file] if file else None
+
+    # Run pipeline with progress bar and minimal console logging
+    try:
+        result = run_patient_pipeline(
+            tracker_files=tracker_files,
+            max_workers=workers,
+            output_root=output_root,
+            skip_tables=skip_tables,
+            force=force,
+            show_progress=True,  # Show tqdm progress bar
+            console_log_level="ERROR",  # Only show errors in console
+        )
+
+        # Display results
+        console.print("\n[bold]Pipeline Results[/bold]\n")
+
+        # Calculate error statistics
+        total_errors = sum(tr.cleaning_errors for tr in result.tracker_results)
+        files_with_errors = sum(1 for tr in result.tracker_results if tr.cleaning_errors > 0)
+
+        summary_table = Table(title="Summary")
+        summary_table.add_column("Metric", style="cyan")
+        summary_table.add_column("Value", style="green")
+
+        summary_table.add_row("Total Trackers", str(result.total_trackers))
+        summary_table.add_row("Successful", str(result.successful_trackers))
+        summary_table.add_row("Failed", str(result.failed_trackers))
+        summary_table.add_row("Tables Created", str(len(result.tables)))
+        summary_table.add_row("", "")  # Spacer
+        summary_table.add_row("Data Quality Errors", f"{total_errors:,}")
+        summary_table.add_row("Files with Errors", str(files_with_errors))
+
+        console.print(summary_table)
+
+        # Show error type breakdown if there are errors
+        if total_errors > 0:
+            console.print("\n[bold yellow]Error Type Breakdown:[/bold yellow]")
+
+            # Aggregate error types across all trackers
+            error_type_totals: dict[str, int] = {}
+            for tr in result.tracker_results:
+                if tr.error_breakdown:
+                    for error_type, count in tr.error_breakdown.items():
+                        error_type_totals[error_type] = error_type_totals.get(error_type, 0) + count
+
+            # Create frequency table
+            error_type_table = Table()
+            error_type_table.add_column("Error Type", style="yellow")
+            error_type_table.add_column("Count", justify="right", style="red")
+            error_type_table.add_column("Percentage", justify="right", style="cyan")
+
+            # Sort by count (descending)
+            sorted_error_types = sorted(error_type_totals.items(), key=lambda x: x[1], reverse=True)
+
+            for error_type, count in sorted_error_types:
+                percentage = (count / total_errors) * 100
+                error_type_table.add_row(error_type, f"{count:,}", f"{percentage:.1f}%")
+
+            console.print(error_type_table)
+
+        # Show failed trackers if any
+        if result.failed_trackers > 0:
+            console.print("\n[bold yellow]Failed Trackers:[/bold yellow]")
+            failed_table = Table()
+            failed_table.add_column("File", style="red")
+            failed_table.add_column("Error")
+
+            for tr in result.tracker_results:
+                if not tr.success:
+                    failed_table.add_row(
+                        tr.tracker_file.name,
+                        str(tr.error)[:100],  # Truncate long errors
+                    )
+
+            console.print(failed_table)
+
+        # Show top files with most data quality errors (if any)
+        if total_errors > 0:
+            console.print("\n[bold yellow]Top Files by Error Count:[/bold yellow]")
+            # Sort by error count (descending) and take top 10
+            files_by_errors = sorted(
+                [
+                    (tr.tracker_file.name, tr.cleaning_errors)
+                    for tr in result.tracker_results
+                    if tr.cleaning_errors > 0
+                ],
+                key=lambda x: x[1],
+                reverse=True,
+            )[:10]
+
+            errors_table = Table()
+            errors_table.add_column("File", style="yellow")
+            errors_table.add_column("Errors", justify="right", style="red")
+
+            for filename, error_count in files_by_errors:
+                errors_table.add_row(filename, f"{error_count:,}")
+
+            console.print(errors_table)
+
+        # Show created tables
+        _display_tables_summary(result.tables)
+
+        # Exit status
+        if result.success:
+            console.print("\n[bold green]✓ Pipeline completed successfully![/bold green]\n")
+            raise typer.Exit(0)
+        else:
+            console.print(
+                f"\n[bold red]✗ Pipeline completed with "
+                f"{result.failed_trackers} failures[/bold red]\n"
+            )
+            raise typer.Exit(1)
+
+    except Exception as e:
+        console.print(f"\n[bold red]Error: {e}[/bold red]\n")
+        raise typer.Exit(1) from e
+
+
+@app.command("create-tables")
+def create_tables_cmd(
+    input_dir: Annotated[
+        Path, typer.Option("--input", "-i", help="Directory containing cleaned parquet files")
+    ],
+    output_dir: Annotated[
+        Path | None,
+        typer.Option(
+            "--output", "-o", help="Output directory for tables (default: input_dir/tables)"
+        ),
+    ] = None,
+):
+    """Create final tables from existing cleaned parquet files.
+
+    This command creates the patient tables (static, monthly, annual) and logs table
+    from existing cleaned parquet files, without running the full pipeline.
+
+    Useful for:
+    - Re-creating tables after fixing table creation logic
+    - Creating tables from manually cleaned data
+    - Testing table creation independently
+
+    \\b
+    Examples:
+        # Create tables from existing output
+        uv run a4d create-tables --input output/patient_data_cleaned
+
+        # Specify custom output directory
+        uv run a4d create-tables --input output/patient_data_cleaned --output custom_tables
+    """
+    console.print("\n[bold blue]A4D Table Creation[/bold blue]\n")
+
+    # Determine output directory
+    if output_dir is None:
+        output_dir = input_dir.parent / "tables"
+
+    console.print(f"Input directory: {input_dir}")
+    console.print(f"Output directory: {output_dir}\n")
+
+    # Find cleaned parquet files
+    cleaned_files = list(input_dir.glob("*_patient_cleaned.parquet"))
+    if not cleaned_files:
+        console.print(
+            f"[bold red]Error: No cleaned parquet files found in {input_dir}[/bold red]\n"
+        )
+        raise typer.Exit(1)
+
+    console.print(f"Found {len(cleaned_files)} cleaned parquet files\n")
+
+    try:
+        console.print("[bold]Creating tables...[/bold]")
+
+        # Create patient tables
+        tables = process_patient_tables(input_dir, output_dir)
+
+        # Create logs table separately (operational data)
+        logs_dir = input_dir.parent / "logs"
+        if logs_dir.exists():
+            console.print("  • Creating logs table...")
+            logs_table_path = create_table_logs(logs_dir, output_dir)
+            tables["logs"] = logs_table_path
+        else:
+            console.print(f"  [yellow]Warning: Logs directory not found at {logs_dir}[/yellow]")
+
+        # Display results
+        console.print("\n[bold green]✓ Tables created successfully![/bold green]")
+        _display_tables_summary(tables)
+
+    except Exception as e:
+        console.print(f"\n[bold red]Error creating tables: {e}[/bold red]\n")
+        raise typer.Exit(1) from e
+
+
+@app.command("upload-tables")
+def upload_tables_cmd(
+    tables_dir: Annotated[
+        Path,
+        typer.Option("--tables-dir", "-t", help="Directory containing parquet table files"),
+    ],
+    dataset: Annotated[
+        str | None,
+        typer.Option("--dataset", "-d", help="BigQuery dataset name (default: from config)"),
+    ] = None,
+    project_id: Annotated[
+        str | None,
+        typer.Option("--project", "-p", help="GCP project ID (default: from config)"),
+    ] = None,
+    append: Annotated[
+        bool,
+        typer.Option("--append", help="Append to existing tables instead of replacing"),
+    ] = False,
+):
+    """Upload pipeline output tables to BigQuery.
+
+    Loads parquet files from the tables directory into the configured
+    BigQuery dataset. By default, existing tables are replaced (matching
+    the R pipeline behavior).
+
+    \b
+    Examples:
+        # Upload tables from default output directory
+        uv run a4d upload-tables --tables-dir output/tables
+
+        # Upload to a specific dataset
+        uv run a4d upload-tables --tables-dir output/tables --dataset tracker_dev
+
+        # Append instead of replace
+        uv run a4d upload-tables --tables-dir output/tables --append
+    """
+    from a4d.gcp.bigquery import load_pipeline_tables
+
+    console.print("\n[bold blue]A4D BigQuery Upload[/bold blue]\n")
+    console.print(f"Tables directory: {tables_dir}")
+
+    if not tables_dir.exists():
+        console.print(f"[bold red]Error: Directory not found: {tables_dir}[/bold red]\n")
+        raise typer.Exit(1)
+
+    try:
+        results = load_pipeline_tables(
+            tables_dir=tables_dir,
+            dataset=dataset,
+            project_id=project_id,
+            replace=not append,
+        )
+
+        if results:
+            result_table = Table(title="Uploaded Tables")
+            result_table.add_column("Table", style="cyan")
+            result_table.add_column("Rows", justify="right", style="green")
+            result_table.add_column("Status", style="green")
+
+            for table_name, job in results.items():
+                result_table.add_row(
+                    table_name,
+                    f"{job.output_rows:,}" if job.output_rows else "?",
+                    "✓",
+                )
+
+            console.print(result_table)
+            console.print(
+                f"\n[bold green]✓ Uploaded {len(results)} tables to BigQuery[/bold green]\n"
+            )
+        else:
+            console.print("[bold yellow]No tables found to upload[/bold yellow]\n")
+
+    except Exception as e:
+        console.print(f"\n[bold red]Error: {e}[/bold red]\n")
+        raise typer.Exit(1) from e
+
+
+@app.command("download-trackers")
+def download_trackers_cmd(
+    destination: Annotated[
+        Path,
+        typer.Option("--destination", "-d", help="Local directory to download files to"),
+    ],
+    bucket: Annotated[
+        str | None,
+        typer.Option("--bucket", "-b", help="GCS bucket name (default: from config)"),
+    ] = None,
+):
+    """Download tracker files from Google Cloud Storage.
+
+    \b
+    Examples:
+        # Download to local directory
+        uv run a4d download-trackers --destination /data/trackers
+
+        # Download from specific bucket
+        uv run a4d download-trackers --destination /data/trackers --bucket my-bucket
+    """
+    from a4d.gcp.storage import download_tracker_files
+
+    console.print("\n[bold blue]A4D Tracker Download[/bold blue]\n")
+    console.print(f"Destination: {destination}")
+
+    try:
+        downloaded = download_tracker_files(destination=destination, bucket_name=bucket)
+        console.print(f"\n[bold green]✓ Downloaded {len(downloaded)} files[/bold green]\n")
+    except Exception as e:
+        console.print(f"\n[bold red]Error: {e}[/bold red]\n")
+        raise typer.Exit(1) from e
+
+
+@app.command("upload-output")
+def upload_output_cmd(
+    source_dir: Annotated[
+        Path,
+        typer.Option("--source", "-s", help="Output directory to upload"),
+    ],
+    bucket: Annotated[
+        str | None,
+        typer.Option("--bucket", "-b", help="GCS bucket name (default: from config)"),
+    ] = None,
+    prefix: Annotated[
+        str,
+        typer.Option("--prefix", help="Prefix for uploaded blob names"),
+    ] = "",
+):
+    """Upload pipeline output to Google Cloud Storage.
+
+    \b
+    Examples:
+        # Upload output directory
+        uv run a4d upload-output --source output/
+
+        # Upload with prefix
+        uv run a4d upload-output --source output/ --prefix 2024-01
+    """
+    from a4d.gcp.storage import upload_output
+
+    console.print("\n[bold blue]A4D Output Upload[/bold blue]\n")
+    console.print(f"Source: {source_dir}")
+
+    if not source_dir.exists():
+        console.print(f"[bold red]Error: Directory not found: {source_dir}[/bold red]\n")
+        raise typer.Exit(1)
+
+    try:
+        uploaded = upload_output(source_dir=source_dir, bucket_name=bucket, prefix=prefix)
+        console.print(f"\n[bold green]✓ Uploaded {len(uploaded)} files to GCS[/bold green]\n")
+    except Exception as e:
+        console.print(f"\n[bold red]Error: {e}[/bold red]\n")
+        raise typer.Exit(1) from e
+
+
+@app.command("run-pipeline")
+def run_pipeline_cmd(
+    workers: Annotated[
+        int, typer.Option("--workers", "-w", help="Number of parallel workers (1 = sequential)")
+    ] = 4,
+    force: Annotated[
+        bool, typer.Option("--force", help="Force reprocessing (ignore existing outputs)")
+    ] = False,
+    skip_upload: Annotated[
+        bool,
+        typer.Option("--skip-upload", help="Skip GCS and BigQuery uploads (local testing)"),
+    ] = False,
+):
+    """Run the full end-to-end A4D pipeline.
+
+    Executes all pipeline stages in sequence:
+      1. Download tracker files from Google Cloud Storage
+      2. Extract and clean all tracker files
+      3. Create final tables (static, monthly, annual)
+      4. Upload output files to Google Cloud Storage
+      5. Ingest tables into BigQuery
+
+    All configuration is read from environment variables (A4D_*) or a .env file.
+
+    \b
+    Examples:
+        # Full pipeline with 4 workers
+        uv run a4d run-pipeline
+
+        # Force reprocess all files
+        uv run a4d run-pipeline --force
+
+        # Local testing without GCS/BigQuery uploads
+        uv run a4d run-pipeline --skip-upload
+    """
+    from a4d.config import settings
+    from a4d.gcp.bigquery import load_pipeline_tables
+    from a4d.gcp.storage import download_tracker_files, upload_output
+
+    console.print("\n[bold blue]A4D Full Pipeline[/bold blue]\n")
+    console.print(f"Data root:   {settings.data_root}")
+    console.print(f"Output root: {settings.output_root}")
+    console.print(f"Workers:     {workers}")
+    console.print(f"Project:     {settings.project_id}")
+    console.print(f"Dataset:     {settings.dataset}\n")
+
+    # Step 1 – Download tracker files from GCS
+    if not skip_upload:
+        console.print("[bold]Step 1/5:[/bold] Downloading tracker files from GCS...")
+        try:
+            downloaded = download_tracker_files(destination=settings.data_root)
+            console.print(f"  ✓ Downloaded {len(downloaded)} files\n")
+        except Exception as e:
+            console.print(f"\n[bold red]Error during download: {e}[/bold red]\n")
+            raise typer.Exit(1) from e
+    else:
+        console.print("[bold]Step 1/5:[/bold] Skipping GCS download (--skip-upload)\n")
+
+    # Step 2+3 – Extract, clean and build tables
+    console.print("[bold]Steps 2–3/5:[/bold] Processing tracker files...\n")
+    try:
+        result = run_patient_pipeline(
+            max_workers=workers,
+            force=force,
+            show_progress=True,
+            console_log_level="WARNING",
+        )
+
+        console.print(
+            f"  ✓ Processed {result.total_trackers} trackers "
+            f"({result.successful_trackers} ok, {result.failed_trackers} failed)\n"
+        )
+
+        if result.failed_trackers > 0:
+            console.print("[bold yellow]Failed trackers:[/bold yellow]")
+            for tr in result.tracker_results:
+                if not tr.success:
+                    console.print(f"  • {tr.tracker_file.name}: {tr.error}")
+            console.print()
+
+        if not result.success:
+            console.print("[bold red]✗ Pipeline failed – aborting upload steps[/bold red]\n")
+            raise typer.Exit(1)
+
+    except Exception as e:
+        console.print(f"\n[bold red]Error during processing: {e}[/bold red]\n")
+        raise typer.Exit(1) from e
+
+    tables_dir = settings.output_root / "tables"
+
+    # Step 4 – Upload output to GCS
+    if not skip_upload:
+        console.print("[bold]Step 4/5:[/bold] Uploading output files to GCS...")
+        try:
+            uploaded = upload_output(source_dir=settings.output_root)
+            console.print(f"  ✓ Uploaded {len(uploaded)} files\n")
+        except Exception as e:
+            console.print(f"\n[bold red]Error during GCS upload: {e}[/bold red]\n")
+            raise typer.Exit(1) from e
+    else:
+        console.print("[bold]Step 4/5:[/bold] Skipping GCS upload (--skip-upload)\n")
+
+    # Step 5 – Ingest tables into BigQuery
+    if not skip_upload:
+        console.print("[bold]Step 5/5:[/bold] Ingesting tables into BigQuery...")
+        try:
+            bq_results = load_pipeline_tables(tables_dir=tables_dir)
+            console.print(f"  ✓ Loaded {len(bq_results)} tables into BigQuery\n")
+        except Exception as e:
+            console.print(f"\n[bold red]Error during BigQuery upload: {e}[/bold red]\n")
+            raise typer.Exit(1) from e
+    else:
+        console.print("[bold]Step 5/5:[/bold] Skipping BigQuery upload (--skip-upload)\n")
+
+    console.print("[bold green]✓ Full pipeline completed successfully![/bold green]\n")
+
+
+
+    """Show version information."""
+    console.print("[bold cyan]A4D Pipeline v0.1.0[/bold cyan]")
+    console.print("Python implementation of the A4D medical tracker processing pipeline")
+
+
+def main():
+    """Entry point for CLI."""
+    app()
+
+
+if __name__ == "__main__":
+    main()
diff --git a/a4d-python/src/a4d/config.py b/a4d-python/src/a4d/config.py
new file mode 100644
index 0000000..f32dadf
--- /dev/null
+++ b/a4d-python/src/a4d/config.py
@@ -0,0 +1,57 @@
+"""Application configuration using Pydantic Settings."""
+
+from pathlib import Path
+from typing import Literal
+
+from pydantic_settings import BaseSettings, SettingsConfigDict
+
+
+class Settings(BaseSettings):
+    """
+    Application configuration with environment variable support.
+
+    All settings can be overridden with environment variables prefixed with A4D_.
+    Example: A4D_DATA_ROOT=/path/to/data
+    """
+
+    model_config = SettingsConfigDict(
+        env_file=".env",
+        env_file_encoding="utf-8",
+        env_prefix="A4D_",
+        case_sensitive=False,
+    )
+
+    # Environment
+    environment: Literal["development", "production"] = "development"
+
+    # GCP Configuration
+    project_id: str = "a4dphase2"
+    dataset: str = "tracker"
+    download_bucket: str = "a4dphase2_upload"
+    upload_bucket: str = "a4dphase2_output"
+
+    # Paths
+    data_root: Path = Path("/Volumes/USB SanDisk 3.2Gen1 Media/a4d/a4dphase2_upload")
+    output_dir: Path = Path("output")
+
+    # Processing settings
+    max_workers: int = 4
+
+    # Error values (matching R pipeline constants)
+    error_val_numeric: float = 999999.0
+    error_val_character: str = "Undefined"
+    error_val_date: str = "9999-09-09"
+
+    @property
+    def output_root(self) -> Path:
+        """Computed output root path."""
+        return self.data_root / self.output_dir
+
+    @property
+    def tracker_root(self) -> Path:
+        """Tracker files root directory."""
+        return self.data_root
+
+
+# Global settings instance
+settings = Settings()
diff --git a/a4d-python/src/a4d/errors.py b/a4d-python/src/a4d/errors.py
new file mode 100644
index 0000000..11dc45b
--- /dev/null
+++ b/a4d-python/src/a4d/errors.py
@@ -0,0 +1,210 @@
+"""Data quality error tracking for pipeline processing.
+
+This module provides the ErrorCollector class for tracking conversion failures,
+validation errors, and other data quality issues. Errors are exported as
+parquet files and aggregated into the logs table for BigQuery analysis.
+
+This is separate from operational logging (see a4d.logging) which tracks
+pipeline execution and progress.
+"""
+
+from datetime import datetime
+from typing import Any, Literal
+
+import polars as pl
+from pydantic import BaseModel, Field
+
+# Error code types based on R pipeline
+ErrorCode = Literal[
+    "type_conversion",  # Failed to convert type (e.g., "abc" -> int)
+    "invalid_value",  # Value outside allowed range or not in allowed list
+    "missing_value",  # Required value is missing/NA
+    "missing_required_field",  # Critical field (patient_id, status) is missing, row excluded
+    "invalid_tracker",  # Tracker-level issues (missing columns, etc.)
+    "function_call",  # Generic function execution error
+    "critical_abort",  # Fatal error, tracker cannot be processed
+]
+
+
+class DataError(BaseModel):
+    """Single data quality error record.
+
+    Attributes:
+        file_name: Name of the tracker file where error occurred
+        patient_id: Patient ID (if applicable, else "unknown")
+        column: Column name where error occurred
+        original_value: Original value that caused the error
+        error_message: Human-readable error description
+        error_code: Error category for grouping/analysis
+        script: Script name where error occurred (e.g., "script2", "clean")
+        function_name: Function name where error occurred
+        timestamp: When the error was recorded
+    """
+
+    file_name: str
+    patient_id: str
+    column: str
+    original_value: str
+    error_message: str
+    error_code: ErrorCode
+    script: str = "clean"
+    function_name: str = ""
+    timestamp: datetime = Field(default_factory=datetime.now)
+
+
+class ErrorCollector:
+    """Collects data quality errors for export to parquet.
+
+    Errors are collected during processing and exported as a DataFrame
+    at the end. The DataFrame schema matches the logs table in BigQuery
+    for easy querying and dashboard visualization.
+
+    Example:
+        >>> collector = ErrorCollector()
+        >>> collector.add_error(
+        ...     file_name="clinic_001.xlsx",
+        ...     patient_id="XX_YY001",
+        ...     column="age",
+        ...     original_value="invalid",
+        ...     error_message="Could not convert 'invalid' to Int32",
+        ...     error_code="type_conversion",
+        ...     function_name="safe_convert_column"
+        ... )
+        >>> # Or batch add:
+        >>> errors = [
+        ...     DataError(file_name="clinic_001.xlsx", patient_id="XX_YY001", ...),
+        ...     DataError(file_name="clinic_001.xlsx", patient_id="XX_YY002", ...),
+        ... ]
+        >>> collector.add_errors(errors)
+        >>> df = collector.to_dataframe()
+        >>> df.write_parquet("output/clinic_001/errors.parquet")
+    """
+
+    def __init__(self):
+        """Initialize an empty error collector."""
+        self.errors: list[DataError] = []
+
+    def add_error(
+        self,
+        file_name: str,
+        patient_id: str,
+        column: str,
+        original_value: Any,
+        error_message: str,
+        error_code: ErrorCode,
+        script: str = "clean",
+        function_name: str = "",
+    ) -> None:
+        """Add a data quality error to the collector.
+
+        Args:
+            file_name: Name of the tracker file
+            patient_id: Patient ID (use "unknown" if not applicable)
+            column: Column name where error occurred
+            original_value: Original value that caused the error
+            error_message: Human-readable error description
+            error_code: Error category (type_conversion, invalid_value, etc.)
+            script: Script name (default: "clean")
+            function_name: Function name where error occurred
+        """
+        error = DataError(
+            file_name=file_name,
+            patient_id=patient_id,
+            column=column,
+            original_value=str(original_value),
+            error_message=error_message,
+            error_code=error_code,
+            script=script,
+            function_name=function_name,
+        )
+        self.errors.append(error)
+
+    def add_errors(self, errors: list[DataError]) -> None:
+        """Add multiple errors at once.
+
+        Args:
+            errors: List of DataError instances to add
+
+        Example:
+            >>> errors = [
+            ...     DataError(file_name="clinic_001.xlsx", patient_id="XX_YY001", ...),
+            ...     DataError(file_name="clinic_001.xlsx", patient_id="XX_YY002", ...),
+            ... ]
+            >>> collector.add_errors(errors)
+        """
+        self.errors.extend(errors)
+
+    def to_dataframe(self) -> pl.DataFrame:
+        """Export errors as a Polars DataFrame for parquet export.
+
+        Returns:
+            Polars DataFrame with all error records, or empty DataFrame if no errors
+
+        Schema:
+            - file_name: str
+            - patient_id: str
+            - column: str
+            - original_value: str
+            - error_message: str
+            - error_code: str (categorical)
+            - script: str (categorical)
+            - function_name: str (categorical)
+            - timestamp: datetime
+        """
+        if not self.errors:
+            # Return empty DataFrame with correct schema
+            return pl.DataFrame(
+                schema={
+                    "file_name": pl.Utf8,
+                    "patient_id": pl.Utf8,
+                    "column": pl.Utf8,
+                    "original_value": pl.Utf8,
+                    "error_message": pl.Utf8,
+                    "error_code": pl.Categorical,
+                    "script": pl.Categorical,
+                    "function_name": pl.Categorical,
+                    "timestamp": pl.Datetime,
+                }
+            )
+
+        # Convert Pydantic models to dict records
+        records = [error.model_dump() for error in self.errors]
+
+        # Create DataFrame and cast categorical columns for efficiency
+        df = pl.DataFrame(records)
+        df = df.with_columns(
+            [
+                pl.col("error_code").cast(pl.Categorical),
+                pl.col("script").cast(pl.Categorical),
+                pl.col("function_name").cast(pl.Categorical),
+            ]
+        )
+
+        return df
+
+    def __len__(self) -> int:
+        """Return number of errors collected."""
+        return len(self.errors)
+
+    def __bool__(self) -> bool:
+        """Return True if any errors have been collected."""
+        return len(self.errors) > 0
+
+    def clear(self) -> None:
+        """Clear all collected errors."""
+        self.errors.clear()
+
+    def get_error_summary(self) -> dict[str, int]:
+        """Get summary of errors by error_code.
+
+        Returns:
+            Dictionary mapping error_code to count
+
+        Example:
+            >>> collector.get_error_summary()
+            {'type_conversion': 10, 'invalid_value': 5}
+        """
+        summary: dict[str, int] = {}
+        for error in self.errors:
+            summary[error.error_code] = summary.get(error.error_code, 0) + 1
+        return summary
diff --git a/a4d-python/src/a4d/extract/__init__.py b/a4d-python/src/a4d/extract/__init__.py
new file mode 100644
index 0000000..e69de29
diff --git a/a4d-python/src/a4d/extract/patient.py b/a4d-python/src/a4d/extract/patient.py
new file mode 100644
index 0000000..8e65285
--- /dev/null
+++ b/a4d-python/src/a4d/extract/patient.py
@@ -0,0 +1,958 @@
+"""Patient data extraction from Excel tracker files.
+
+This module handles reading patient data from Excel trackers, which have
+evolved over the years with different formats and structures.
+"""
+
+import calendar
+import re
+import warnings
+from pathlib import Path
+
+import polars as pl
+from loguru import logger
+from openpyxl import load_workbook
+
+from a4d.errors import ErrorCollector
+from a4d.reference.synonyms import ColumnMapper, load_patient_mapper
+
+# Suppress openpyxl warnings about unsupported Excel features
+# We only read data, so these warnings are not actionable
+warnings.filterwarnings("ignore", category=UserWarning, module=r"openpyxl\..*")
+
+
+def get_tracker_year(tracker_file: Path, month_sheets: list[str]) -> int:
+    """Extract tracker year from month sheet names or filename.
+
+    Tries to parse year from month sheet names (e.g., "Jan24" -> 2024).
+    Falls back to extracting from filename if parsing fails.
+    Validates year is in reasonable range (2017-2030).
+
+    Args:
+        tracker_file: Path to the tracker Excel file
+        month_sheets: List of month sheet names
+
+    Returns:
+        Year of the tracker (e.g., 2024)
+
+    Raises:
+        ValueError: If year cannot be determined or is out of valid range
+
+    Example:
+        >>> get_tracker_year(Path("2024_Clinic.xlsx"), ["Jan24", "Feb24"])
+        2024
+    """
+    for sheet in month_sheets:
+        match = re.search(r"(\d{2})$", sheet)
+        if match:
+            year_suffix = int(match.group(1))
+            year = 2000 + year_suffix  # Assume 20xx until 2100
+            logger.debug(f"Parsed year {year} from sheet name '{sheet}'")
+
+            if not (2017 <= year <= 2030):  # Match R pipeline validation
+                raise ValueError(
+                    f"Year {year} is out of valid range (2017-2030). "
+                    f"Parsed from sheet name '{sheet}'"
+                )
+
+            return year
+
+    match = re.search(r"(\d{4})", tracker_file.name)
+    if match:
+        year = int(match.group(1))
+        logger.debug(f"Parsed year {year} from filename '{tracker_file.name}'")
+
+        if not (2017 <= year <= 2030):  # Match R pipeline validation
+            raise ValueError(
+                f"Year {year} is out of valid range (2017-2030). "
+                f"Parsed from filename '{tracker_file.name}'"
+            )
+
+        return year
+
+    raise ValueError(
+        f"Could not determine year from month sheets {month_sheets} or filename {tracker_file.name}"
+    )
+
+
+def find_month_sheets(workbook) -> list[str]:
+    """Find all month sheets in the tracker workbook.
+
+    Month sheets are identified by matching against month abbreviations
+    (Jan, Feb, Mar, etc.) and sorted by month number for consistent processing.
+
+    Args:
+        workbook: openpyxl Workbook object
+
+    Returns:
+        List of month sheet names found in the workbook, sorted by month number
+        (Jan=1, Feb=2, ..., Dec=12)
+
+    Example:
+        >>> wb = load_workbook("tracker.xlsx")
+        >>> find_month_sheets(wb)
+        ['Jan24', 'Feb24', 'Mar24', ...]
+    """
+    month_abbrs = list(calendar.month_abbr)[1:]  # ['Jan', 'Feb', ...]
+    month_sheets = []
+
+    for sheet_name in workbook.sheetnames:
+        if any(sheet_name.startswith(abbr) for abbr in month_abbrs):
+            month_sheets.append(sheet_name)
+
+    def get_month_number(sheet_name: str) -> int:
+        """Extract month number from sheet name (Jan=1, ..., Dec=12)."""
+        month_prefix = sheet_name[:3]
+        try:
+            return month_abbrs.index(month_prefix) + 1
+        except ValueError:
+            return 999  # Push unrecognized sheets to end
+
+    month_sheets.sort(key=get_month_number)
+
+    logger.info(f"Found {len(month_sheets)} month sheets (sorted by month): {month_sheets}")
+    return month_sheets
+
+
+def find_data_start_row(ws) -> int:
+    """Find the first row containing patient data.
+
+    Scans column A for the first numeric value (patient row numbers: 1, 2, 3...).
+    This skips any non-numeric values that may appear above the patient data
+    (e.g., spaces, text, product data).
+
+    Args:
+        ws: openpyxl worksheet object
+
+    Returns:
+        Row number (1-indexed) where patient data starts
+
+    Raises:
+        ValueError: If no numeric data is found in column A
+    """
+    max_row = ws.max_row or 1000
+    for row_idx in range(1, max_row + 1):
+        cell_value = ws.cell(row_idx, 1).value
+        if cell_value is not None and isinstance(cell_value, (int, float)):
+            return row_idx
+
+    raise ValueError("No patient data found in column A (looking for numeric row numbers)")
+
+
+def read_header_rows(ws, data_start_row: int, max_cols: int = 100) -> tuple[list, list]:
+    """Read and trim the two header rows above the data.
+
+    Headers are located in the two rows immediately before data_start_row.
+    Reads up to max_cols columns and trims to the last non-None column.
+
+    Args:
+        ws: openpyxl worksheet object
+        data_start_row: Row number where patient data starts
+        max_cols: Maximum number of columns to read (default: 100)
+
+    Returns:
+        Tuple of (header_1, header_2) lists, trimmed to actual width
+
+    Example:
+        >>> header_1, header_2 = read_header_rows(ws, 77)
+        >>> len(header_1)
+        31
+    """
+    header_row_1 = data_start_row - 1
+    header_row_2 = data_start_row - 2
+
+    # Read raw header rows
+    header_1_raw = list(
+        ws.iter_rows(
+            min_row=header_row_1,
+            max_row=header_row_1,
+            min_col=1,
+            max_col=max_cols,
+            values_only=True,
+        )
+    )[0]
+    header_2_raw = list(
+        ws.iter_rows(
+            min_row=header_row_2,
+            max_row=header_row_2,
+            min_col=1,
+            max_col=max_cols,
+            values_only=True,
+        )
+    )[0]
+
+    last_col = max_cols
+    for i in range(len(header_1_raw) - 1, -1, -1):
+        if header_1_raw[i] is not None or header_2_raw[i] is not None:
+            last_col = i + 1
+            break
+
+    header_1 = list(header_1_raw[:last_col])
+    header_2 = list(header_2_raw[:last_col])
+
+    return header_1, header_2
+
+
+def merge_headers(
+    header_1: list,
+    header_2: list,
+    mapper: ColumnMapper | None = None,
+) -> list[str | None]:
+    """Merge two header rows using heuristic forward-fill with synonym validation.
+
+    When h2=None but h1 exists:
+    1. Try forward-fill: combine prev_h2 + h1
+    2. If mapper validates this as known column, use it
+    3. Otherwise, treat h1 as standalone column
+
+    This replaces Excel merge metadata detection with synonym-based validation,
+    eliminating the need for slow read_only=False workbook loading.
+
+    Special case: If header_1 contains "Patient ID" (or known synonyms) and
+    header_2 appears to be a title row (mostly None), use only header_1.
+
+    Args:
+        header_1: First header row (closer to data), 0-indexed
+        header_2: Second header row (further from data), 0-indexed
+        mapper: Optional ColumnMapper for validating forward-filled headers
+
+    Returns:
+        List of merged header strings with whitespace normalized
+    """
+    patient_id_indicators = ["patient id", "patient.id"]
+    has_patient_id_in_h1 = any(
+        str(h1).strip().lower() in patient_id_indicators for h1 in header_1 if h1 is not None
+    )
+
+    non_none_count_h2 = sum(1 for h2 in header_2 if h2 is not None)
+
+    if has_patient_id_in_h1 and non_none_count_h2 <= 2:
+        logger.debug(
+            "Detected title row in header_2 with Patient ID in header_1, using header_1 only"
+        )
+        headers = [str(h1).strip() if h1 is not None else None for h1 in header_1]
+        headers = [re.sub(r"\s+", " ", h.replace("\n", " ")) if h else None for h in headers]
+        return headers
+
+    headers = []
+    prev_h2 = None
+
+    for h1, h2 in zip(header_1, header_2, strict=True):
+        if h1 and h2:
+            headers.append(f"{h2} {h1}".strip())
+            prev_h2 = str(h2).strip()
+        elif h2:
+            headers.append(str(h2).strip())
+            prev_h2 = str(h2).strip()
+        elif h1:
+            # Try forward-fill with validation
+            if prev_h2:
+                candidate = f"{prev_h2} {h1}".strip()
+                if mapper and mapper.is_known_column(candidate):
+                    headers.append(candidate)
+                else:
+                    # Forward-fill not valid, use h1 standalone
+                    headers.append(str(h1).strip())
+            else:
+                headers.append(str(h1).strip())
+        else:
+            headers.append(None)
+            prev_h2 = None  # Reset on gap
+
+    headers = [re.sub(r"\s+", " ", h.replace("\n", " ")) if h else None for h in headers]
+
+    return headers
+
+
+def read_patient_rows(ws, data_start_row: int, num_columns: int) -> list[tuple]:
+    """Read patient data rows from the worksheet.
+
+    Reads from data_start_row until either ws.max_row or the first completely
+    empty row. Skips rows where both the row number (column A) and patient_id
+    (column B) are None, but accepts rows where patient_id exists even if row
+    number is missing (handles data quality issues in Excel files).
+
+    Args:
+        ws: openpyxl worksheet object
+        data_start_row: Row number where patient data starts
+        num_columns: Number of columns to read
+
+    Returns:
+        List of tuples, each containing one row of patient data
+
+    Example:
+        >>> rows = read_patient_rows(ws, 77, 31)
+        >>> len(rows)
+        4
+    """
+    data = []
+    for row in ws.iter_rows(
+        min_row=data_start_row,
+        max_row=ws.max_row,
+        min_col=1,
+        max_col=num_columns,
+        values_only=True,
+    ):
+        if all(cell is None for cell in row):
+            break
+        # Skip rows where both row number (col A) AND patient_id (col B) are missing
+        # This handles cases where Excel has missing row numbers but valid patient data
+        if row[0] is None and (len(row) < 2 or row[1] is None):
+            continue
+        data.append(row)
+
+    return data
+
+
+def merge_duplicate_columns_data(
+    headers: list[str], data: list[list]
+) -> tuple[list[str], list[list]]:
+    """Merge data from duplicate column headers by concatenating with commas.
+
+    When Excel cells are merged both horizontally and vertically, the forward-fill
+    logic in merge_headers() can create duplicate column names. This function
+    merges the data from duplicate columns (like R's tidyr::unite()).
+
+    Args:
+        headers: List of header strings (may contain duplicates)
+        data: List of data rows (each row is a list)
+
+    Returns:
+        Tuple of (unique_headers, merged_data)
+
+    Example:
+        >>> headers = ["ID", "DM Complications", "DM Complications", "DM Complications", "Age"]
+        >>> data = [["1", "A", "B", "C", "25"], ["2", "X", "Y", "Z", "30"]]
+        >>> merge_duplicate_columns_data(headers, data)
+        (['ID', 'DM Complications', 'Age'], [['1', 'A,B,C', '25'], ['2', 'X,Y,Z', '30']])
+    """
+    if len(headers) == len(set(headers)):
+        return headers, data
+
+    from collections import defaultdict
+
+    header_positions: dict[str, list[int]] = defaultdict(list)
+    for idx, header in enumerate(headers):
+        header_positions[header].append(idx)
+
+    unique_headers = list(header_positions.keys())
+
+    duplicated = [h for h, positions in header_positions.items() if len(positions) > 1]
+    if duplicated:
+        logger.debug(f"Merging {len(duplicated)} duplicate column groups: {duplicated}")
+
+    merged_data = []
+    for row in data:
+        merged_row = []
+        for header in unique_headers:
+            positions = header_positions[header]
+            if len(positions) == 1:
+                merged_row.append(row[positions[0]])
+            else:
+                values = [str(row[pos]) if row[pos] is not None else "" for pos in positions]
+                values = [v for v in values if v]
+                merged_value = ",".join(values) if values else None
+                merged_row.append(merged_value)
+        merged_data.append(merged_row)
+
+    return unique_headers, merged_data
+
+
+def filter_valid_columns(
+    headers: list[str | None], data: list[tuple]
+) -> tuple[list[str], list[list]]:
+    """Filter out columns with None headers and their corresponding data.
+
+    Args:
+        headers: List of header strings (may contain None)
+        data: List of data rows
+
+    Returns:
+        Tuple of (valid_headers, filtered_data)
+
+    Example:
+        >>> headers = ["ID", None, "Name", None, "Age"]
+        >>> data = [("1", "x", "Alice", "y", "30")]
+        >>> filter_valid_columns(headers, data)
+        (['ID', 'Name', 'Age'], [['1', 'Alice', '30']])
+    """
+    valid_cols = [(i, h) for i, h in enumerate(headers) if h]
+
+    if not valid_cols:
+        return [], []
+
+    valid_indices = [i for i, _ in valid_cols]
+    valid_headers = [h for _, h in valid_cols]
+
+    filtered_data = [[row[i] for i in valid_indices] for row in data]
+
+    return valid_headers, filtered_data
+
+
+def clean_excel_errors(df: pl.DataFrame) -> pl.DataFrame:
+    """Convert Excel error strings to NULL values.
+
+    Excel error codes like #DIV/0!, #VALUE!, etc. are not usable values
+    and should be treated as missing data.
+
+    Args:
+        df: DataFrame with potential Excel error strings
+
+    Returns:
+        DataFrame with Excel errors converted to NULL
+
+    Example:
+        >>> df = pl.DataFrame({"bmi": ["17.5", "#DIV/0!", "18.2"]})
+        >>> clean_df = clean_excel_errors(df)
+        >>> clean_df["bmi"].to_list()
+        ['17.5', None, '18.2']
+    """
+    excel_errors = [
+        "#DIV/0!",
+        "#VALUE!",
+        "#REF!",
+        "#NAME?",
+        "#NUM!",
+        "#N/A",
+        "#NULL!",
+    ]
+
+    metadata_cols = {
+        "tracker_year",
+        "tracker_month",
+        "clinic_id",
+        "patient_id",
+        "sheet_name",
+        "file_name",
+    }
+    data_cols = [col for col in df.columns if col not in metadata_cols]
+
+    if not data_cols:
+        return df
+
+    df = df.with_columns(
+        [
+            pl.when(pl.col(col).is_in(excel_errors)).then(None).otherwise(pl.col(col)).alias(col)
+            for col in data_cols
+        ]
+    )
+
+    for error in excel_errors:
+        for col in data_cols:
+            count = (df[col] == error).sum()
+            if count > 0:
+                logger.debug(f"Converted {count} '{error}' values to NULL in column '{col}'")
+
+    return df
+
+
+def extract_patient_data(
+    tracker_file: Path,
+    sheet_name: str,
+    year: int,
+    mapper: ColumnMapper | None = None,
+    workbook=None,
+) -> pl.DataFrame:
+    """Extract patient data from a single sheet.
+
+    Uses single read_only=True load with synonym-validated header merging.
+
+    Args:
+        tracker_file: Path to the tracker Excel file
+        sheet_name: Name of the sheet to extract
+        year: Year of the tracker (currently unused, reserved for future use)
+        mapper: Optional ColumnMapper for validating forward-filled headers
+        workbook: Optional pre-loaded workbook for caching across sheets
+
+    Returns:
+        Polars DataFrame with patient data (all columns as strings)
+
+    Example:
+        >>> df = extract_patient_data(
+        ...     Path("2024_Clinic.xlsx"),
+        ...     "Jan24",
+        ...     2024
+        ... )
+        >>> len(df)
+        4
+        >>> "Patient ID*" in df.columns
+        True
+    """
+    if mapper is None:
+        mapper = load_patient_mapper()
+
+    # Use cached workbook or load new one
+    close_wb = workbook is None
+    if workbook is None:
+        workbook = load_workbook(
+            tracker_file,
+            read_only=True,
+            data_only=True,
+            keep_vba=False,
+            keep_links=False,
+        )
+
+    ws = workbook[sheet_name]
+
+    data_start_row = find_data_start_row(ws)
+    logger.debug(
+        f"Sheet '{sheet_name}': Patient data found in rows {data_start_row} to {ws.max_row}"
+    )
+
+    logger.info("Processing headers...")
+    header_1, header_2 = read_header_rows(ws, data_start_row)
+
+    # Use synonym-validated forward-fill instead of Excel merge metadata
+    headers = merge_headers(header_1, header_2, mapper=mapper)
+
+    valid_cols = [(i, h) for i, h in enumerate(headers) if h]
+
+    if not valid_cols:
+        if close_wb:
+            workbook.close()
+        logger.warning(f"No valid headers found in sheet '{sheet_name}'")
+        return pl.DataFrame()
+
+    data = read_patient_rows(ws, data_start_row, len(headers))
+
+    if close_wb:
+        workbook.close()
+
+    valid_headers, filtered_data = filter_valid_columns(headers, data)
+
+    valid_headers, filtered_data = merge_duplicate_columns_data(valid_headers, filtered_data)
+
+    # Create DataFrame with ALL columns explicitly as String type to ensure consistent schema
+    # across all files and avoid type inference issues (Null vs String dtype)
+    df = pl.DataFrame(
+        {
+            header: pl.Series(
+                [str(row[i]) if row[i] is not None else None for row in filtered_data],
+                dtype=pl.String,
+            )
+            for i, header in enumerate(valid_headers)
+        }
+    )
+
+    logger.info(f"Extracted {len(df)} rows x {len(df.columns)} cols from sheet '{sheet_name}'")
+
+    return df
+
+
+def harmonize_patient_data_columns(
+    df: pl.DataFrame,
+    mapper: ColumnMapper | None = None,
+    strict: bool = False,
+) -> pl.DataFrame:
+    """Harmonize patient data columns using synonym mappings.
+
+    Renames columns from their various synonyms (e.g., "Patient ID", "ID",
+    "Patient ID*") to standardized column names (e.g., "patient_id").
+
+    Args:
+        df: DataFrame with raw column names from tracker
+        mapper: ColumnMapper to use (if None, loads default patient mapper)
+        strict: If True, raise error if unmapped columns exist
+                If False, keep unmapped columns as-is (default)
+
+    Returns:
+        DataFrame with standardized column names
+
+    Raises:
+        ValueError: If strict=True and unmapped columns exist
+
+    Example:
+        >>> raw_df = pl.DataFrame({
+        ...     "Patient ID*": ["MY_SU001", "MY_SU002"],
+        ...     "Age": [25, 30],
+        ... })
+        >>> harmonized = harmonize_patient_data_columns(raw_df)
+        >>> harmonized.columns
+        ['patient_id', 'age']
+    """
+    if mapper is None:
+        mapper = load_patient_mapper()
+
+    renamed_df = mapper.rename_columns(df, strict=strict)
+
+    logger.info(
+        f"Harmonized columns: {len(df.columns)} -> {len(renamed_df.columns)} "
+        f"({len(df.columns) - len(renamed_df.columns)} columns removed)"
+        if len(df.columns) != len(renamed_df.columns)
+        else f"Harmonized {len(renamed_df.columns)} columns"
+    )
+
+    return renamed_df
+
+
+def extract_tracker_month(sheet_name: str) -> int:
+    """Extract month number (1-12) from sheet name.
+
+    Args:
+        sheet_name: Sheet name like "Jan24", "Feb24", etc.
+
+    Returns:
+        Month number (1 for January, 2 for February, etc.)
+
+    Raises:
+        ValueError: If month cannot be extracted or is out of valid range
+
+    Example:
+        >>> extract_tracker_month("Jan24")
+        1
+        >>> extract_tracker_month("Dec23")
+        12
+    """
+    month_abbrs = list(calendar.month_abbr)[1:]  # ['Jan', 'Feb', ...]
+
+    # Check first 3 characters
+    month_prefix = sheet_name[:3]
+
+    if month_prefix in month_abbrs:
+        month_num = month_abbrs.index(month_prefix) + 1  # +1 because index is 0-based
+
+        # Validate month is in valid range (1-12)
+        # This should always be true given the logic above, but check anyway for safety
+        if not (1 <= month_num <= 12):
+            raise ValueError(
+                f"Month number {month_num} is out of valid range (1-12). "
+                f"Parsed from sheet name '{sheet_name}'"
+            )
+
+        return month_num
+
+    raise ValueError(f"Could not extract month from sheet name '{sheet_name}'")
+
+
+def read_all_patient_sheets(
+    tracker_file: Path,
+    mapper: ColumnMapper | None = None,
+    error_collector: ErrorCollector | None = None,
+) -> pl.DataFrame:
+    """Read patient data from all month sheets in a tracker file.
+
+    Orchestrates the complete extraction process:
+    1. Find all month sheets
+    2. Extract tracker year
+    3. For each month sheet:
+        - Extract raw data
+        - Harmonize column names
+        - Merge duplicate columns
+        - Add metadata (sheet_name, tracker_month, tracker_year, file_name)
+    4. Combine all sheets
+    5. Filter invalid rows (no patient_id and no name)
+
+    Args:
+        tracker_file: Path to the tracker Excel file
+        mapper: ColumnMapper to use (if None, loads default patient mapper)
+        error_collector: ErrorCollector for tracking data quality issues (optional)
+
+    Returns:
+        Combined DataFrame with all patient data from all month sheets
+
+    Raises:
+        ValueError: If no month sheets found or year cannot be determined
+
+    Example:
+        >>> df = read_all_patient_sheets(Path("2024_Clinic.xlsx"))
+        >>> "patient_id" in df.columns
+        True
+        >>> "tracker_month" in df.columns
+        True
+        >>> "tracker_year" in df.columns
+        True
+    """
+    logger.info(f"Reading all patient sheets from {tracker_file.name}")
+
+    # Load mapper once for all sheets
+    if mapper is None:
+        mapper = load_patient_mapper()
+
+    # Load workbook once and reuse across all sheets
+    wb = load_workbook(
+        tracker_file, read_only=True, data_only=True, keep_vba=False, keep_links=False
+    )
+
+    month_sheets = find_month_sheets(wb)
+    if not month_sheets:
+        wb.close()
+        raise ValueError(f"No month sheets found in {tracker_file.name}")
+
+    year = get_tracker_year(tracker_file, month_sheets)
+    logger.info(f"Processing {len(month_sheets)} month sheets for year {year}")
+
+    all_sheets_data = []
+
+    for sheet_name in month_sheets:
+        logger.info(f"Processing sheet: {sheet_name}")
+
+        df_sheet = extract_patient_data(
+            tracker_file, sheet_name, year, mapper=mapper, workbook=wb
+        )
+
+        if df_sheet.is_empty():
+            logger.warning(f"Sheet '{sheet_name}' has no data, skipping")
+            continue
+
+        df_sheet = harmonize_patient_data_columns(df_sheet, mapper=mapper, strict=False)
+
+        if "patient_id" not in df_sheet.columns:
+            logger.warning(
+                f"Sheet '{sheet_name}' has no 'patient_id' column after harmonization, skipping"
+            )
+            continue
+
+        try:
+            month_num = extract_tracker_month(sheet_name)
+        except ValueError as e:
+            logger.warning(f"Could not extract month from '{sheet_name}': {e}, skipping")
+            continue
+
+        # Derived metadata (year, month) use Int64; text metadata (sheet_name, etc.) use String
+        clinic_id = tracker_file.parent.name
+        file_name = tracker_file.stem
+        df_sheet = df_sheet.with_columns(
+            [
+                pl.lit(sheet_name, dtype=pl.String).alias("sheet_name"),
+                pl.lit(month_num, dtype=pl.Int64).alias("tracker_month"),
+                pl.lit(year, dtype=pl.Int64).alias("tracker_year"),
+                pl.lit(file_name, dtype=pl.String).alias("file_name"),
+                pl.lit(clinic_id, dtype=pl.String).alias("clinic_id"),
+            ]
+        )
+
+        all_sheets_data.append(df_sheet)
+
+    if not all_sheets_data:
+        raise ValueError(f"No valid patient data found in any month sheets of {tracker_file.name}")
+
+    # Use diagonal_relaxed to handle type mismatches (e.g., Null vs String) like R's bind_rows
+    logger.info(f"Combining {len(all_sheets_data)} sheets...")
+    df_combined = pl.concat(all_sheets_data, how="diagonal_relaxed")
+
+    initial_rows = len(df_combined)
+
+    # Track rows with missing patient_id for error reporting
+    missing_patient_id_rows = df_combined.filter(pl.col("patient_id").is_null())
+    missing_count = len(missing_patient_id_rows)
+
+    if missing_count > 0:
+        logger.error(
+            f"Found {missing_count} rows with missing patient_id in {tracker_file.name} - "
+            f"these rows will be excluded from processing"
+        )
+
+        # Log to ErrorCollector if available
+        if error_collector is not None:
+            for row in missing_patient_id_rows.iter_rows(named=True):
+                sheet_name = row.get("sheet_name", "unknown")
+                name_value = row.get("name", "")
+                error_collector.add_error(
+                    file_name=tracker_file.stem,
+                    patient_id="MISSING",
+                    column="patient_id",
+                    original_value=None,
+                    error_message=(
+                        f"Row in sheet '{sheet_name}' has missing "
+                        f"patient_id (name: {name_value})"
+                    ),
+                    error_code="missing_required_field",
+                    script="extract",
+                    function_name="read_all_patient_sheets",
+                )
+
+    # Filter out ALL rows with missing patient_id
+    df_combined = df_combined.filter(pl.col("patient_id").is_not_null())
+
+    # Filter out empty rows (both patient_id and name are null/empty)
+    # This is redundant now but kept for clarity
+    if "name" in df_combined.columns:
+        df_combined = df_combined.filter(
+            ~(
+                (pl.col("patient_id").str.strip_chars() == "")
+                & (pl.col("name").is_null() | (pl.col("name").str.strip_chars() == ""))
+            )
+        )
+
+    # Filter out rows where both patient_id and name are numeric zeros (0, 0.0, "0", "0.0", etc.)
+    if "name" in df_combined.columns:
+        df_combined = df_combined.filter(
+            ~(
+                pl.col("patient_id").str.strip_chars().is_in(["0", "0.0"])
+                & pl.col("name").str.strip_chars().is_in(["0", "0.0"])
+            )
+        )
+
+    # Filter out rows with patient_id starting with "#" (Excel errors like #REF!)
+    df_combined = df_combined.filter(~pl.col("patient_id").str.starts_with("#"))
+
+    filtered_rows = initial_rows - len(df_combined)
+    if filtered_rows > 0:
+        logger.info(f"Filtered out {filtered_rows} invalid rows total")
+
+    df_combined = clean_excel_errors(df_combined)
+
+    # Use already-loaded workbook for sheet checking
+    all_sheets = wb.sheetnames
+
+    # Process Patient List sheet if it exists (R: lines 103-130)
+    if "Patient List" in all_sheets:
+        logger.info("Processing 'Patient List' sheet...")
+        try:
+            patient_list = extract_patient_data(
+                tracker_file, "Patient List", year, mapper=mapper, workbook=wb
+            )
+            if not patient_list.is_empty():
+                patient_list = clean_excel_errors(patient_list)
+                patient_list = harmonize_patient_data_columns(
+                    patient_list, mapper=mapper, strict=False
+                )
+
+                if "patient_id" in patient_list.columns:
+                    # Filter out rows with missing patient_id
+                    patient_list = patient_list.filter(pl.col("patient_id").is_not_null())
+
+                    # Filter out numeric zeros and Excel errors
+                    if "name" in patient_list.columns:
+                        patient_list = patient_list.filter(
+                            ~(
+                                pl.col("patient_id").str.strip_chars().is_in(["0", "0.0"])
+                                & pl.col("name").str.strip_chars().is_in(["0", "0.0"])
+                            )
+                        )
+
+                    patient_list = patient_list.filter(~pl.col("patient_id").str.starts_with("#"))
+
+                    # R: select(-any_of(c("hba1c_baseline"))) and select(-any_of(c("name")))
+                    df_monthly = (
+                        df_combined.drop("hba1c_baseline")
+                        if "hba1c_baseline" in df_combined.columns
+                        else df_combined
+                    )
+                    patient_list_join = (
+                        patient_list.drop("name")
+                        if "name" in patient_list.columns
+                        else patient_list
+                    )
+
+                    df_combined = df_monthly.join(
+                        patient_list_join, on="patient_id", how="left", suffix=".static"
+                    )
+                    logger.info(f"Joined {len(patient_list)} Patient List records")
+                else:
+                    logger.warning(
+                        "Patient List sheet has no 'patient_id' column after harmonization"
+                    )
+            else:
+                logger.warning("Patient List sheet is empty")
+        except Exception as e:
+            logger.warning(f"Could not process Patient List sheet: {e}")
+
+    # Process Annual sheet if it exists (R: lines 132-160)
+    if "Annual" in all_sheets:
+        logger.info("Processing 'Annual' sheet...")
+        try:
+            annual_data = extract_patient_data(
+                tracker_file, "Annual", year, mapper=mapper, workbook=wb
+            )
+            if not annual_data.is_empty():
+                annual_data = clean_excel_errors(annual_data)
+                annual_data = harmonize_patient_data_columns(
+                    annual_data, mapper=mapper, strict=False
+                )
+
+                if "patient_id" in annual_data.columns:
+                    # Filter out rows with missing patient_id
+                    annual_data = annual_data.filter(pl.col("patient_id").is_not_null())
+
+                    # Filter out numeric zeros and Excel errors
+                    if "name" in annual_data.columns:
+                        annual_data = annual_data.filter(
+                            ~(
+                                pl.col("patient_id").str.strip_chars().is_in(["0", "0.0"])
+                                & pl.col("name").str.strip_chars().is_in(["0", "0.0"])
+                            )
+                        )
+
+                    annual_data = annual_data.filter(~pl.col("patient_id").str.starts_with("#"))
+
+                    # R: select(-any_of(c("status", "name")))
+                    cols_to_drop = [col for col in ["status", "name"] if col in annual_data.columns]
+                    annual_data_join = (
+                        annual_data.drop(cols_to_drop) if cols_to_drop else annual_data
+                    )
+
+                    df_combined = df_combined.join(
+                        annual_data_join, on="patient_id", how="left", suffix=".annual"
+                    )
+                    logger.info(f"Joined {len(annual_data)} Annual records")
+                else:
+                    logger.warning("Annual sheet has no 'patient_id' column after harmonization")
+            else:
+                logger.warning("Annual sheet is empty")
+        except Exception as e:
+            logger.warning(f"Could not process Annual sheet: {e}")
+
+    # Close workbook after all processing
+    wb.close()
+
+    logger.info(
+        f"Successfully extracted {len(df_combined)} total rows "
+        f"from {len(all_sheets_data)} month sheets"
+    )
+
+    # Reorder: metadata first, then patient data
+    # (tracker_year, tracker_month, clinic_id, patient_id)
+    priority_cols = ["tracker_year", "tracker_month", "clinic_id", "patient_id"]
+    existing_priority = [c for c in priority_cols if c in df_combined.columns]
+    other_cols = [c for c in df_combined.columns if c not in priority_cols]
+    df_combined = df_combined.select(existing_priority + other_cols)
+
+    return df_combined
+
+
+def export_patient_raw(
+    df: pl.DataFrame,
+    tracker_file: Path,
+    output_dir: Path,
+) -> Path:
+    """Export raw patient data to parquet file.
+
+    Matches R pipeline behavior:
+    - Filename: {tracker_name}_patient_raw.parquet
+    - Location: output_dir/{tracker_name}_patient_raw.parquet
+
+    Args:
+        df: Patient DataFrame to export
+        tracker_file: Path to original tracker file (used to extract tracker_name)
+        output_dir: Directory to write parquet file (e.g., data_root/output/patient_data_raw)
+
+    Returns:
+        Path to the written parquet file
+
+    Example:
+        >>> df = read_all_patient_sheets(Path("2024_Clinic.xlsx"))
+        >>> output_path = export_patient_raw(
+        ...     df,
+        ...     Path("2024_Clinic.xlsx"),
+        ...     Path("output/patient_data_raw")
+        ... )
+        >>> output_path.name
+        '2024_Clinic_patient_raw.parquet'
+    """
+    # Extract tracker name (filename without extension)
+    tracker_name = tracker_file.stem
+
+    # Create output filename: {tracker_name}_patient_raw.parquet
+    output_filename = f"{tracker_name}_patient_raw.parquet"
+    output_path = output_dir / output_filename
+
+    # Ensure output directory exists
+    output_dir.mkdir(parents=True, exist_ok=True)
+
+    # Write parquet file
+    logger.info(f"Writing {len(df)} rows to {output_path}")
+    df.write_parquet(output_path)
+
+    logger.info(f"Successfully exported to {output_path}")
+    return output_path
diff --git a/a4d-python/src/a4d/gcp/__init__.py b/a4d-python/src/a4d/gcp/__init__.py
new file mode 100644
index 0000000..89b75e0
--- /dev/null
+++ b/a4d-python/src/a4d/gcp/__init__.py
@@ -0,0 +1,21 @@
+from a4d.gcp.bigquery import (
+    TABLE_CONFIGS,
+    get_bigquery_client,
+    load_pipeline_tables,
+    load_table,
+)
+from a4d.gcp.storage import (
+    download_tracker_files,
+    get_storage_client,
+    upload_output,
+)
+
+__all__ = [
+    "TABLE_CONFIGS",
+    "download_tracker_files",
+    "get_bigquery_client",
+    "get_storage_client",
+    "load_pipeline_tables",
+    "load_table",
+    "upload_output",
+]
diff --git a/a4d-python/src/a4d/gcp/bigquery.py b/a4d-python/src/a4d/gcp/bigquery.py
new file mode 100644
index 0000000..ad3d24d
--- /dev/null
+++ b/a4d-python/src/a4d/gcp/bigquery.py
@@ -0,0 +1,187 @@
+"""BigQuery table loading from parquet files.
+
+Replaces the R pipeline's `ingest_data()` function which used the `bq` CLI tool.
+Uses the google-cloud-bigquery Python client for loading parquet files with
+clustering configuration matching the R pipeline.
+"""
+
+from pathlib import Path
+
+from google.cloud import bigquery
+from loguru import logger
+
+from a4d.config import settings
+
+# Table configurations matching the R pipeline's clustering fields.
+# Each table maps to the clustering fields used for optimal query performance.
+TABLE_CONFIGS: dict[str, list[str]] = {
+    "patient_data_monthly": ["clinic_id", "patient_id", "tracker_date"],
+    "patient_data_annual": ["patient_id", "tracker_date"],
+    "patient_data_static": ["clinic_id", "patient_id", "tracker_date"],
+    "patient_data_hba1c": ["clinic_id", "patient_id", "tracker_date"],
+    "product_data": [
+        "clinic_id",
+        "product_released_to",
+        "product_table_year",
+        "product_table_month",
+    ],
+    "clinic_data_static": ["clinic_id"],
+    "logs": ["level", "log_file", "file_name"],
+    "tracker_metadata": ["file_name", "clinic_code"],
+}
+
+# Maps the pipeline output file names to BigQuery table names.
+# Note: table_logs.parquet uses this name from create_table_logs() in tables/logs.py.
+PARQUET_TO_TABLE: dict[str, str] = {
+    "patient_data_static.parquet": "patient_data_static",
+    "patient_data_monthly.parquet": "patient_data_monthly",
+    "patient_data_annual.parquet": "patient_data_annual",
+    "table_logs.parquet": "logs",
+}
+
+
+def get_bigquery_client(project_id: str | None = None) -> bigquery.Client:
+    """Create a BigQuery client.
+
+    Authentication uses Application Default Credentials (ADC):
+    - In Cloud Run / GCE: automatic via metadata server
+    - Locally: via `gcloud auth application-default login`
+    - In CI: via GOOGLE_APPLICATION_CREDENTIALS environment variable
+
+    Args:
+        project_id: GCP project ID (defaults to settings.project_id)
+
+    Returns:
+        Configured BigQuery client
+    """
+    return bigquery.Client(project=project_id or settings.project_id)
+
+
+def load_table(
+    parquet_path: Path,
+    table_name: str,
+    client: bigquery.Client | None = None,
+    dataset: str | None = None,
+    project_id: str | None = None,
+    replace: bool = True,
+) -> bigquery.LoadJob:
+    """Load a parquet file into a BigQuery table.
+
+    Replicates the R pipeline's `ingest_data()` function:
+    1. Optionally deletes the existing table (replace=True, matching R's delete=T default)
+    2. Loads the parquet file with clustering fields
+
+    Args:
+        parquet_path: Path to the parquet file to load
+        table_name: BigQuery table name (e.g., "patient_data_monthly")
+        client: BigQuery client (created if not provided)
+        dataset: Dataset name (defaults to settings.dataset)
+        project_id: GCP project ID (defaults to settings.project_id)
+        replace: If True, replaces the existing table (default matches R pipeline)
+
+    Returns:
+        Completed LoadJob
+
+    Raises:
+        FileNotFoundError: If parquet file doesn't exist
+        ValueError: If table_name is not in TABLE_CONFIGS
+        google.api_core.exceptions.GoogleAPIError: On BigQuery API errors
+    """
+    if not parquet_path.exists():
+        raise FileNotFoundError(f"Parquet file not found: {parquet_path}")
+
+    dataset = dataset or settings.dataset
+    project_id = project_id or settings.project_id
+
+    if client is None:
+        client = get_bigquery_client(project_id)
+
+    table_ref = f"{project_id}.{dataset}.{table_name}"
+    logger.info(f"Loading {parquet_path.name} → {table_ref}")
+
+    # Configure the load job
+    job_config = bigquery.LoadJobConfig(
+        source_format=bigquery.SourceFormat.PARQUET,
+        write_disposition=(
+            bigquery.WriteDisposition.WRITE_TRUNCATE
+            if replace
+            else bigquery.WriteDisposition.WRITE_APPEND
+        ),
+    )
+
+    # Add clustering if configured for this table
+    clustering_fields = TABLE_CONFIGS.get(table_name)
+    if clustering_fields:
+        job_config.clustering_fields = clustering_fields
+        logger.info(f"Clustering fields: {clustering_fields}")
+
+    # Load the parquet file
+    with open(parquet_path, "rb") as f:
+        load_job = client.load_table_from_file(f, table_ref, job_config=job_config)
+
+    # Wait for completion
+    load_job.result()
+
+    logger.info(
+        f"Loaded {load_job.output_rows} rows into {table_ref} "
+        f"({parquet_path.stat().st_size / 1024 / 1024:.2f} MB)"
+    )
+    return load_job
+
+
+def load_pipeline_tables(
+    tables_dir: Path,
+    client: bigquery.Client | None = None,
+    dataset: str | None = None,
+    project_id: str | None = None,
+    replace: bool = True,
+) -> dict[str, bigquery.LoadJob]:
+    """Load all pipeline output tables into BigQuery.
+
+    Scans the tables directory for known parquet files and loads each one
+    into the corresponding BigQuery table.
+
+    Args:
+        tables_dir: Directory containing parquet table files (e.g., output/tables/)
+        client: BigQuery client (created if not provided)
+        dataset: Dataset name (defaults to settings.dataset)
+        project_id: GCP project ID (defaults to settings.project_id)
+        replace: If True, replaces existing tables
+
+    Returns:
+        Dictionary mapping table name to completed LoadJob
+
+    Raises:
+        FileNotFoundError: If tables_dir doesn't exist
+    """
+    if not tables_dir.exists():
+        raise FileNotFoundError(f"Tables directory not found: {tables_dir}")
+
+    if client is None:
+        project_id = project_id or settings.project_id
+        client = get_bigquery_client(project_id)
+
+    logger.info(f"Loading pipeline tables from: {tables_dir}")
+
+    results: dict[str, bigquery.LoadJob] = {}
+
+    for parquet_name, table_name in PARQUET_TO_TABLE.items():
+        parquet_path = tables_dir / parquet_name
+        if parquet_path.exists():
+            try:
+                job = load_table(
+                    parquet_path=parquet_path,
+                    table_name=table_name,
+                    client=client,
+                    dataset=dataset,
+                    project_id=project_id,
+                    replace=replace,
+                )
+                results[table_name] = job
+            except Exception:
+                logger.exception(f"Failed to load table: {table_name}")
+        else:
+            logger.warning(f"Table file not found, skipping: {parquet_name}")
+
+    logger.info(f"Successfully loaded {len(results)}/{len(PARQUET_TO_TABLE)} tables")
+    return results
diff --git a/a4d-python/src/a4d/gcp/storage.py b/a4d-python/src/a4d/gcp/storage.py
new file mode 100644
index 0000000..93adda1
--- /dev/null
+++ b/a4d-python/src/a4d/gcp/storage.py
@@ -0,0 +1,129 @@
+"""Google Cloud Storage operations for tracker file download and output upload.
+
+Replaces the R pipeline's `gsutil` CLI calls with the google-cloud-storage
+Python client library.
+"""
+
+from pathlib import Path
+
+from google.cloud import storage
+from loguru import logger
+
+from a4d.config import settings
+
+
+def get_storage_client(project_id: str | None = None) -> storage.Client:
+    """Create a GCS client.
+
+    Authentication uses Application Default Credentials (ADC):
+    - In Cloud Run / GCE: automatic via metadata server
+    - Locally: via `gcloud auth application-default login`
+    - In CI: via GOOGLE_APPLICATION_CREDENTIALS environment variable
+
+    Args:
+        project_id: GCP project ID (defaults to settings.project_id)
+
+    Returns:
+        Configured storage client
+    """
+    return storage.Client(project=project_id or settings.project_id)
+
+
+def download_tracker_files(
+    destination: Path,
+    bucket_name: str | None = None,
+    client: storage.Client | None = None,
+) -> list[Path]:
+    """Download tracker files from GCS bucket.
+
+    Replaces R pipeline's `download_data()` function which used `gsutil -m cp -r`.
+    Downloads all .xlsx files from the bucket, preserving directory structure.
+
+    Args:
+        destination: Local directory to download files to
+        bucket_name: GCS bucket name (defaults to settings.download_bucket)
+        client: Storage client (created if not provided)
+
+    Returns:
+        List of downloaded file paths
+    """
+    bucket_name = bucket_name or settings.download_bucket
+
+    if client is None:
+        client = get_storage_client()
+
+    bucket = client.bucket(bucket_name)
+    destination.mkdir(parents=True, exist_ok=True)
+
+    logger.info(f"Downloading tracker files from gs://{bucket_name} to {destination}")
+
+    downloaded: list[Path] = []
+    blobs = list(bucket.list_blobs())
+    logger.info(f"Found {len(blobs)} objects in bucket")
+
+    for blob in blobs:
+        # Skip directory markers
+        if blob.name.endswith("/"):
+            continue
+
+        local_path = destination / blob.name
+        local_path.parent.mkdir(parents=True, exist_ok=True)
+
+        logger.debug(f"Downloading: {blob.name}")
+        blob.download_to_filename(str(local_path))
+        downloaded.append(local_path)
+
+    logger.info(f"Downloaded {len(downloaded)} files")
+    return downloaded
+
+
+def upload_output(
+    source_dir: Path,
+    bucket_name: str | None = None,
+    prefix: str = "",
+    client: storage.Client | None = None,
+) -> list[str]:
+    """Upload output directory to GCS bucket.
+
+    Replaces R pipeline's `upload_data()` function which used `gsutil -m cp -r`.
+    Uploads all files from the source directory, preserving directory structure.
+
+    Args:
+        source_dir: Local directory to upload
+        bucket_name: GCS bucket name (defaults to settings.upload_bucket)
+        prefix: Optional prefix for uploaded blob names
+        client: Storage client (created if not provided)
+
+    Returns:
+        List of uploaded blob names
+
+    Raises:
+        FileNotFoundError: If source directory doesn't exist
+    """
+    if not source_dir.exists():
+        raise FileNotFoundError(f"Source directory not found: {source_dir}")
+
+    bucket_name = bucket_name or settings.upload_bucket
+
+    if client is None:
+        client = get_storage_client()
+
+    bucket = client.bucket(bucket_name)
+
+    logger.info(f"Uploading {source_dir} to gs://{bucket_name}/{prefix}")
+
+    uploaded: list[str] = []
+    files = [f for f in source_dir.rglob("*") if f.is_file()]
+
+    for file_path in files:
+        relative_path = file_path.relative_to(source_dir)
+        blob_name = f"{prefix}/{relative_path}" if prefix else str(relative_path)
+        blob_name = blob_name.replace("\\", "/")  # Windows compatibility
+
+        logger.debug(f"Uploading: {blob_name}")
+        blob = bucket.blob(blob_name)
+        blob.upload_from_filename(str(file_path))
+        uploaded.append(blob_name)
+
+    logger.info(f"Uploaded {len(uploaded)} files to gs://{bucket_name}")
+    return uploaded
diff --git a/a4d-python/src/a4d/logging.py b/a4d-python/src/a4d/logging.py
new file mode 100644
index 0000000..d9ca150
--- /dev/null
+++ b/a4d-python/src/a4d/logging.py
@@ -0,0 +1,159 @@
+"""Operational logging configuration using loguru.
+
+This module provides logging infrastructure for monitoring and debugging
+the pipeline execution. Logs are exported to BigQuery for dashboard analysis
+(success rates, error counts, processing times, etc.).
+
+For data quality errors (conversion failures, validation errors),
+use the ErrorCollector class from a4d.errors instead.
+
+Usage:
+    The loguru logger is a singleton. Once configured with setup_logging(),
+    all imports of 'from loguru import logger' will use the same configuration.
+
+    >>> from a4d.logging import setup_logging, file_logger
+    >>> setup_logging(output_root=Path("output"), log_name="script1")
+    >>>
+    >>> # In processing code:
+    >>> from loguru import logger
+    >>> with file_logger("clinic_001_patient", output_root, tracker_year=2024, tracker_month=10):
+    ...     logger.info("Processing started", rows=150)
+    ...     logger.warning("Missing column", column="hba1c_updated_date")
+"""
+
+import sys
+from collections.abc import Generator
+from contextlib import contextmanager
+from pathlib import Path
+
+from loguru import logger
+
+
+def setup_logging(
+    output_root: Path,
+    log_name: str,
+    level: str = "INFO",
+    console: bool = True,
+    console_level: str | None = None,
+) -> None:
+    """Configure loguru for pipeline-wide operational logging.
+
+    Creates both console (colored, human-readable) and file (JSON for BigQuery)
+    handlers. All logs in the JSON file include context variables from
+    contextualize() for analysis in Looker Studio.
+
+    Args:
+        output_root: Root output directory (logs will be in output_root/logs/)
+        log_name: Base name for the log file (e.g., "script1_extract")
+        level: Minimum file log level (DEBUG, INFO, WARNING, ERROR)
+        console: Whether to add console handler (set False for CLI with progress bars)
+        console_level: Console log level (None = use level, or set to ERROR for quiet mode)
+
+    Example:
+        >>> setup_logging(Path("output"), "script1_extract")
+        >>> logger.info("Processing started", total_trackers=10)
+
+        >>> # Quiet mode for CLI with progress bars
+        >>> setup_logging(Path("output"), "pipeline", console_level="ERROR")
+    """
+    log_dir = output_root / "logs"
+    log_dir.mkdir(parents=True, exist_ok=True)
+    log_file = log_dir / f"main_{log_name}.log"
+
+    # Remove default handler
+    logger.remove()
+
+    # Console handler: pretty, colored output for monitoring
+    if console:
+        console_log_level = console_level if console_level is not None else level
+        logger.add(
+            sys.stdout,
+            level=console_log_level,
+            colorize=True,
+            format=(
+                "<green>{time:HH:mm:ss}</green> | "
+                "<level>{level: <8}</level> | "
+                "<level>{message}</level>"
+            ),
+        )
+
+    # File handler: JSON output for BigQuery upload
+    # serialize=True means all context from contextualize() is included
+    logger.add(
+        log_file,
+        level="DEBUG",  # Capture all levels in file
+        serialize=True,  # JSON format with all fields
+        rotation="100 MB",
+        retention="30 days",
+        compression="zip",
+    )
+
+    if console:
+        logger.info("Logging initialized", log_file=str(log_file), level=level)
+
+
+@contextmanager
+def file_logger(
+    file_name: str,
+    output_root: Path,
+    tracker_year: int | None = None,
+    tracker_month: int | None = None,
+    level: str = "DEBUG",
+) -> Generator:
+    """Context manager for per-tracker file logging with context.
+
+    Creates a separate log file for a specific tracker and sets context
+    variables (file_name, tracker_year, tracker_month) that are automatically
+    included in all log records within this context.
+
+    All logs are JSON formatted and will be aggregated for BigQuery upload.
+
+    Args:
+        file_name: Name of the tracker file (e.g., "clinic_001_patient")
+        output_root: Root output directory (logs will be in output_root/logs/)
+        tracker_year: Year from the tracker (for dashboard filtering)
+        tracker_month: Month from the tracker (for dashboard filtering)
+        level: Minimum log level for this file handler
+
+    Yields:
+        None (use logger directly within context)
+
+    Example:
+        >>> with file_logger("clinic_001_patient", output_root, 2024, 10):
+        ...     logger.info("Processing patient data", rows=150)
+        ...     logger.warning("Missing column", column="hba1c_updated_date")
+        ...     # All logs include file_name, tracker_year, tracker_month
+    """
+    log_dir = output_root / "logs"
+    log_dir.mkdir(parents=True, exist_ok=True)
+    log_file = log_dir / f"{file_name}.log"
+
+    # Remove old log file if exists
+    if log_file.exists():
+        log_file.unlink()
+
+    # Add file-specific handler (JSON only, no console)
+    handler_id = logger.add(
+        log_file,
+        level=level,
+        serialize=True,  # JSON format
+    )
+
+    # Build context dict (only include non-None values)
+    context = {"file_name": file_name}
+    if tracker_year is not None:
+        context["tracker_year"] = tracker_year
+    if tracker_month is not None:
+        context["tracker_month"] = tracker_month
+
+    # Use contextualize to add file_name, tracker_year, tracker_month to all logs
+    with logger.contextualize(**context):
+        try:
+            yield
+        except Exception:
+            # Log exception with full traceback
+            logger.exception("Processing failed", error_code="critical_abort")
+            raise
+        finally:
+            # Remove the handler
+            logger.remove(handler_id)
diff --git a/a4d-python/src/a4d/pipeline/__init__.py b/a4d-python/src/a4d/pipeline/__init__.py
new file mode 100644
index 0000000..d256ed8
--- /dev/null
+++ b/a4d-python/src/a4d/pipeline/__init__.py
@@ -0,0 +1,18 @@
+"""Pipeline orchestration for A4D data processing."""
+
+from a4d.pipeline.models import PipelineResult, TrackerResult
+from a4d.pipeline.patient import (
+    discover_tracker_files,
+    process_patient_tables,
+    run_patient_pipeline,
+)
+from a4d.pipeline.tracker import process_tracker_patient
+
+__all__ = [
+    "PipelineResult",
+    "TrackerResult",
+    "discover_tracker_files",
+    "process_patient_tables",
+    "process_tracker_patient",
+    "run_patient_pipeline",
+]
diff --git a/a4d-python/src/a4d/pipeline/models.py b/a4d-python/src/a4d/pipeline/models.py
new file mode 100644
index 0000000..191ff31
--- /dev/null
+++ b/a4d-python/src/a4d/pipeline/models.py
@@ -0,0 +1,78 @@
+"""Pipeline result models for tracking processing outputs."""
+
+from dataclasses import dataclass
+from pathlib import Path
+
+
+@dataclass
+class TrackerResult:
+    """Result from processing a single tracker file.
+
+    Attributes:
+        tracker_file: Original tracker file path
+        tracker_name: Base name without extension
+        raw_output: Path to raw parquet file (None if extraction failed)
+        cleaned_output: Path to cleaned parquet file (None if cleaning failed)
+        success: Whether processing completed successfully
+        error: Error message if processing failed
+        cleaning_errors: Number of data quality errors during cleaning (type conversion,
+                        validation failures, etc.). These are non-fatal - data is cleaned
+                        with error values (999999, "Undefined", etc.)
+        error_breakdown: Breakdown of errors by type (error_code → count).
+                        Example: {"type_conversion": 10, "invalid_value": 5}
+    """
+
+    tracker_file: Path
+    tracker_name: str
+    raw_output: Path | None = None
+    cleaned_output: Path | None = None
+    success: bool = True
+    error: str | None = None
+    cleaning_errors: int = 0
+    error_breakdown: dict[str, int] | None = None
+
+
+@dataclass
+class PipelineResult:
+    """Result from running the complete patient pipeline.
+
+    Attributes:
+        tracker_results: Results from processing individual trackers
+        tables: Dictionary mapping table name to output path
+        total_trackers: Total number of trackers processed
+        successful_trackers: Number of successfully processed trackers
+        failed_trackers: Number of failed trackers
+        success: Whether entire pipeline completed successfully
+    """
+
+    tracker_results: list[TrackerResult]
+    tables: dict[str, Path]
+    total_trackers: int
+    successful_trackers: int
+    failed_trackers: int
+    success: bool
+
+    @classmethod
+    def from_tracker_results(
+        cls, tracker_results: list[TrackerResult], tables: dict[str, Path] | None = None
+    ) -> "PipelineResult":
+        """Create PipelineResult from tracker results.
+
+        Args:
+            tracker_results: List of tracker processing results
+            tables: Dictionary of created tables (empty if table creation skipped)
+
+        Returns:
+            PipelineResult with computed statistics
+        """
+        successful = sum(1 for r in tracker_results if r.success)
+        failed = len(tracker_results) - successful
+
+        return cls(
+            tracker_results=tracker_results,
+            tables=tables or {},
+            total_trackers=len(tracker_results),
+            successful_trackers=successful,
+            failed_trackers=failed,
+            success=failed == 0,
+        )
diff --git a/a4d-python/src/a4d/pipeline/patient.py b/a4d-python/src/a4d/pipeline/patient.py
new file mode 100644
index 0000000..b320c59
--- /dev/null
+++ b/a4d-python/src/a4d/pipeline/patient.py
@@ -0,0 +1,329 @@
+"""Main patient pipeline orchestration."""
+
+import os
+from collections.abc import Callable
+from concurrent.futures import ProcessPoolExecutor, as_completed
+from datetime import datetime
+from pathlib import Path
+
+from loguru import logger
+from tqdm import tqdm
+
+from a4d.config import settings
+from a4d.logging import setup_logging
+from a4d.pipeline.models import PipelineResult, TrackerResult
+from a4d.pipeline.tracker import process_tracker_patient
+from a4d.tables.logs import create_table_logs
+from a4d.tables.patient import (
+    create_table_patient_data_annual,
+    create_table_patient_data_monthly,
+    create_table_patient_data_static,
+)
+
+
+def _init_worker_logging(output_root: Path):
+    """Initialize logging for worker processes.
+
+    This is called once when each worker process starts in ProcessPoolExecutor.
+    Sets up quiet logging (only file output, no console spam).
+
+    Args:
+        output_root: Output directory for logs
+    """
+    timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
+    pid = os.getpid()
+    setup_logging(
+        output_root=output_root,
+        log_name=f"worker_{timestamp}_pid{pid}",
+        console_level="ERROR",  # Quiet console
+    )
+
+
+def discover_tracker_files(data_root: Path) -> list[Path]:
+    """Discover all Excel tracker files in data_root.
+
+    Searches recursively for .xlsx files, excluding temp files (~$*).
+
+    Args:
+        data_root: Root directory to search
+
+    Returns:
+        List of tracker file paths
+
+    Example:
+        >>> tracker_files = discover_tracker_files(Path("/data"))
+        >>> len(tracker_files)
+        42
+    """
+    tracker_files = []
+    for file in data_root.rglob("*.xlsx"):
+        if not file.name.startswith("~$"):
+            tracker_files.append(file)
+
+    return sorted(tracker_files)
+
+
+def process_patient_tables(cleaned_dir: Path, output_dir: Path) -> dict[str, Path]:
+    """Create final patient tables from cleaned parquets.
+
+    Creates three main tables:
+    - patient_data_static: Latest data per patient
+    - patient_data_monthly: All monthly records
+    - patient_data_annual: Latest data per patient per year (2024+)
+
+    Args:
+        cleaned_dir: Directory containing cleaned parquet files
+        output_dir: Directory to write final tables
+
+    Returns:
+        Dictionary mapping table name to output path
+
+    Example:
+        >>> tables = process_patient_tables(
+        ...     Path("output/patient_data_cleaned"),
+        ...     Path("output/tables")
+        ... )
+        >>> tables.keys()
+        dict_keys(['static', 'monthly', 'annual'])
+    """
+    logger.info("Creating final patient tables from cleaned data")
+
+    cleaned_files = list(cleaned_dir.glob("*_patient_cleaned.parquet"))
+    logger.info(f"Found {len(cleaned_files)} cleaned parquet files")
+
+    if not cleaned_files:
+        logger.warning("No cleaned files found, skipping table creation")
+        return {}
+
+    tables = {}
+
+    logger.info("Creating static patient table")
+    static_path = create_table_patient_data_static(cleaned_files, output_dir)
+    tables["static"] = static_path
+
+    logger.info("Creating monthly patient table")
+    monthly_path = create_table_patient_data_monthly(cleaned_files, output_dir)
+    tables["monthly"] = monthly_path
+
+    logger.info("Creating annual patient table")
+    annual_path = create_table_patient_data_annual(cleaned_files, output_dir)
+    tables["annual"] = annual_path
+
+    logger.info(f"Created {len(tables)} patient tables")
+    return tables
+
+
+def run_patient_pipeline(
+    tracker_files: list[Path] | None = None,
+    max_workers: int = 1,
+    output_root: Path | None = None,
+    skip_tables: bool = False,
+    force: bool = False,
+    progress_callback: Callable[[str, bool], None] | None = None,
+    show_progress: bool = False,
+    console_log_level: str | None = None,
+) -> PipelineResult:
+    """Run complete patient data pipeline.
+
+    Processing modes:
+    - Batch mode: If tracker_files is None, discovers all .xlsx in data_root
+    - Single file mode: If tracker_files provided, processes only those files
+
+    Pipeline steps:
+    1. For each tracker (optionally parallel):
+       - Extract patient data from Excel → raw parquet
+       - Clean raw data → cleaned parquet
+    2. Create final tables from all cleaned parquets (if not skipped)
+
+    Args:
+        tracker_files: Specific files to process (None = discover all)
+        max_workers: Number of parallel workers (1 = sequential)
+        output_root: Output directory (None = use settings.output_root)
+        skip_tables: If True, only extract + clean, skip table creation
+        force: If True, reprocess even if outputs exist
+        progress_callback: Optional callback(tracker_name, success) called after each tracker
+        show_progress: If True, show tqdm progress bar
+        console_log_level: Console log level (None=INFO, ERROR=quiet, etc)
+
+    Returns:
+        PipelineResult with tracker results and table paths
+
+    Example:
+        >>> # Process all trackers
+        >>> result = run_patient_pipeline()
+        >>> result.success
+        True
+        >>> result.successful_trackers
+        42
+
+        >>> # Process single file
+        >>> result = run_patient_pipeline(
+        ...     tracker_files=[Path("/data/2024_Sibu.xlsx")]
+        ... )
+
+        >>> # Parallel processing with progress bar (CLI mode)
+        >>> result = run_patient_pipeline(
+        ...     max_workers=8,
+        ...     show_progress=True,
+        ...     console_log_level="ERROR"
+        ... )
+    """
+    # Use settings defaults if not provided
+    if output_root is None:
+        output_root = settings.output_root
+
+    # Setup main pipeline logging
+    setup_logging(
+        output_root,
+        "pipeline_patient",
+        console_level=console_log_level if console_log_level else "INFO",
+    )
+    logger.info("Starting patient pipeline")
+    logger.info(f"Output directory: {output_root}")
+    logger.info(f"Max workers: {max_workers}")
+
+    # Discover or use provided tracker files
+    if tracker_files is None:
+        logger.info(f"Discovering tracker files in: {settings.data_root}")
+        tracker_files = discover_tracker_files(settings.data_root)
+    else:
+        tracker_files = [Path(f) for f in tracker_files]
+
+    logger.info(f"Found {len(tracker_files)} tracker files to process")
+
+    if not tracker_files:
+        logger.warning("No tracker files found")
+        return PipelineResult.from_tracker_results([], {})
+
+    # Process trackers
+    tracker_results: list[TrackerResult] = []
+
+    if max_workers == 1:
+        # Sequential processing (easier for debugging)
+        logger.info("Processing trackers sequentially")
+
+        # Use tqdm if requested
+        iterator = (
+            tqdm(tracker_files, desc="Processing trackers", unit="file")
+            if show_progress
+            else tracker_files
+        )
+
+        for tracker_file in iterator:
+            if show_progress:
+                iterator.set_description(f"Processing {tracker_file.name}")
+
+            result = process_tracker_patient(
+                tracker_file=tracker_file,
+                output_root=output_root,
+                mapper=None,  # Each tracker loads mapper if needed
+            )
+            tracker_results.append(result)
+
+            # Call progress callback if provided
+            if progress_callback:
+                progress_callback(tracker_file.name, result.success)
+
+            if result.success:
+                logger.info(f"✓ Successfully processed: {tracker_file.name}")
+                if show_progress:
+                    tqdm.write(f"✓ {tracker_file.name}")
+            else:
+                logger.error(f"✗ Failed to process: {tracker_file.name} - {result.error}")
+                if show_progress:
+                    tqdm.write(f"✗ {tracker_file.name}: {result.error}")
+
+    else:
+        # Parallel processing
+        logger.info(f"Processing trackers in parallel ({max_workers} workers)")
+        with ProcessPoolExecutor(
+            max_workers=max_workers, initializer=_init_worker_logging, initargs=(output_root,)
+        ) as executor:
+            # Submit all jobs
+            futures = {
+                executor.submit(
+                    process_tracker_patient,
+                    tracker_file,
+                    output_root,
+                    None,  # Each worker loads synonyms independently
+                ): tracker_file
+                for tracker_file in tracker_files
+            }
+
+            # Collect results as they complete
+            futures_iterator = as_completed(futures)
+            if show_progress:
+                futures_iterator = tqdm(
+                    futures_iterator, total=len(futures), desc="Processing trackers", unit="file"
+                )
+
+            for future in futures_iterator:
+                tracker_file = futures[future]
+                try:
+                    result = future.result()
+                    tracker_results.append(result)
+
+                    # Call progress callback if provided
+                    if progress_callback:
+                        progress_callback(tracker_file.name, result.success)
+
+                    if result.success:
+                        logger.info(f"✓ Completed: {tracker_file.name}")
+                        if show_progress:
+                            tqdm.write(f"✓ {tracker_file.name}")
+                    else:
+                        logger.error(f"✗ Failed: {tracker_file.name} - {result.error}")
+                        if show_progress:
+                            tqdm.write(f"✗ {tracker_file.name}: {result.error}")
+                except Exception as e:
+                    logger.exception(f"Exception processing {tracker_file.name}")
+                    if show_progress:
+                        tqdm.write(f"✗ {tracker_file.name}: Exception - {str(e)}")
+                    tracker_results.append(
+                        TrackerResult(
+                            tracker_file=tracker_file,
+                            tracker_name=tracker_file.stem,
+                            success=False,
+                            error=str(e),
+                        )
+                    )
+
+    # Summary
+    successful = sum(1 for r in tracker_results if r.success)
+    failed = len(tracker_results) - successful
+    logger.info(f"Tracker processing complete: {successful} successful, {failed} failed")
+
+    # Create tables
+    tables: dict[str, Path] = {}
+    if not skip_tables:
+        try:
+            cleaned_dir = output_root / "patient_data_cleaned"
+            tables_dir = output_root / "tables"
+
+            # Create patient tables
+            tables = process_patient_tables(cleaned_dir, tables_dir)
+
+            # Create logs table separately (operational data, not patient data)
+            logs_dir = output_root / "logs"
+            if logs_dir.exists():
+                logger.info("Creating logs table from pipeline execution logs")
+                logs_table_path = create_table_logs(logs_dir, tables_dir)
+                tables["logs"] = logs_table_path
+                logger.info(f"Logs table created: {logs_table_path}")
+
+            logger.info(f"Created {len(tables)} tables total")
+        except Exception:
+            logger.exception("Failed to create tables")
+            # Don't fail entire pipeline if table creation fails
+    else:
+        logger.info("Skipping table creation (skip_tables=True)")
+
+    # Build result
+    result = PipelineResult.from_tracker_results(tracker_results, tables)
+
+    if result.success:
+        logger.info("✓ Pipeline completed successfully")
+    else:
+        logger.warning(f"✗ Pipeline completed with {failed} failures")
+
+    return result
diff --git a/a4d-python/src/a4d/pipeline/tracker.py b/a4d-python/src/a4d/pipeline/tracker.py
new file mode 100644
index 0000000..38ede3a
--- /dev/null
+++ b/a4d-python/src/a4d/pipeline/tracker.py
@@ -0,0 +1,113 @@
+"""Single tracker processing: extract + clean."""
+
+from pathlib import Path
+
+from loguru import logger
+
+from a4d.clean.patient import clean_patient_file
+from a4d.errors import ErrorCollector
+from a4d.extract.patient import export_patient_raw, read_all_patient_sheets
+from a4d.logging import file_logger
+from a4d.pipeline.models import TrackerResult
+from a4d.reference.synonyms import ColumnMapper
+
+
+def process_tracker_patient(
+    tracker_file: Path, output_root: Path, mapper: ColumnMapper | None = None
+) -> TrackerResult:
+    """Process single tracker file: extract + clean patient data.
+
+    This function processes one tracker file end-to-end:
+    1. Extract patient data from Excel
+    2. Export to raw parquet
+    3. Clean the raw data
+    4. Export to cleaned parquet
+
+    Each step creates a separate log file for debugging.
+
+    Args:
+        tracker_file: Path to tracker Excel file
+        output_root: Root output directory (will create subdirs for raw/cleaned)
+        mapper: ColumnMapper for synonym mapping (loaded if not provided)
+
+    Returns:
+        TrackerResult with paths to outputs and success status
+
+    Example:
+        >>> tracker_file = Path("/data/2024_Sibu.xlsx")
+        >>> output_root = Path("output")
+        >>> result = process_tracker_patient(tracker_file, output_root)
+        >>> result.success
+        True
+        >>> result.raw_output
+        Path('output/patient_data_raw/2024_Sibu_patient_raw.parquet')
+    """
+    tracker_name = tracker_file.stem
+
+    try:
+        # Setup directories
+        raw_dir = output_root / "patient_data_raw"
+        cleaned_dir = output_root / "patient_data_cleaned"
+        raw_dir.mkdir(parents=True, exist_ok=True)
+        cleaned_dir.mkdir(parents=True, exist_ok=True)
+
+        # Expected output paths
+        raw_output = raw_dir / f"{tracker_name}_patient_raw.parquet"
+        cleaned_output = cleaned_dir / f"{tracker_name}_patient_cleaned.parquet"
+
+        # Log context for this tracker
+        with file_logger(f"{tracker_name}_patient", output_root):
+            logger.info(f"Processing tracker: {tracker_file.name}")
+
+            # STEP 1: Extract
+            logger.info("Step 1: Extracting patient data from Excel")
+            error_collector = ErrorCollector()
+
+            df_raw = read_all_patient_sheets(
+                tracker_file=tracker_file, mapper=mapper, error_collector=error_collector
+            )
+            logger.info(f"Extracted {len(df_raw)} rows")
+
+            # Export raw parquet
+            raw_output = export_patient_raw(
+                df=df_raw, tracker_file=tracker_file, output_dir=raw_dir
+            )
+            logger.info(f"Raw parquet saved: {raw_output}")
+
+            # STEP 2: Clean
+            logger.info("Step 2: Cleaning patient data")
+
+            clean_patient_file(
+                raw_parquet_path=raw_output,
+                output_parquet_path=cleaned_output,
+                error_collector=error_collector,
+            )
+
+            error_count = len(error_collector)
+            error_breakdown = error_collector.get_error_summary()
+            logger.info(f"Cleaned parquet saved: {cleaned_output}")
+            logger.info(f"Total data quality errors: {error_count}")
+            if error_breakdown:
+                logger.info(f"Error breakdown: {error_breakdown}")
+
+        return TrackerResult(
+            tracker_file=tracker_file,
+            tracker_name=tracker_name,
+            raw_output=raw_output,
+            cleaned_output=cleaned_output,
+            success=True,
+            error=None,
+            cleaning_errors=error_count,
+            error_breakdown=error_breakdown if error_breakdown else None,
+        )
+
+    except Exception as e:
+        logger.exception(f"Failed to process tracker: {tracker_file.name}")
+        return TrackerResult(
+            tracker_file=tracker_file,
+            tracker_name=tracker_name,
+            raw_output=None,
+            cleaned_output=None,
+            success=False,
+            error=str(e),
+        )
diff --git a/a4d-python/src/a4d/reference/__init__.py b/a4d-python/src/a4d/reference/__init__.py
new file mode 100644
index 0000000..7662305
--- /dev/null
+++ b/a4d-python/src/a4d/reference/__init__.py
@@ -0,0 +1,43 @@
+"""Reference data loaders and validators.
+
+This package contains modules for loading and working with reference data
+from the shared reference_data/ directory.
+"""
+
+# Loaders (internal utilities)
+from a4d.reference.loaders import (
+    find_reference_data_dir,
+    get_reference_data_path,
+    load_yaml,
+)
+
+# Provinces (validation)
+from a4d.reference.provinces import (
+    get_country_for_province,
+    is_valid_province,
+    load_allowed_provinces,
+    load_provinces_by_country,
+)
+
+# Synonyms (column mapping)
+from a4d.reference.synonyms import (
+    ColumnMapper,
+    load_patient_mapper,
+    load_product_mapper,
+)
+
+__all__ = [
+    # Loaders
+    "find_reference_data_dir",
+    "get_reference_data_path",
+    "load_yaml",
+    # Synonyms
+    "ColumnMapper",
+    "load_patient_mapper",
+    "load_product_mapper",
+    # Provinces
+    "get_country_for_province",
+    "is_valid_province",
+    "load_allowed_provinces",
+    "load_provinces_by_country",
+]
diff --git a/a4d-python/src/a4d/reference/loaders.py b/a4d-python/src/a4d/reference/loaders.py
new file mode 100644
index 0000000..aaae370
--- /dev/null
+++ b/a4d-python/src/a4d/reference/loaders.py
@@ -0,0 +1,83 @@
+"""Utilities for loading reference data files.
+
+This module provides common utilities for loading YAML and other reference
+data files shared between the R and Python pipelines.
+"""
+
+from pathlib import Path
+from typing import Any
+
+import yaml
+from loguru import logger
+
+
+def find_reference_data_dir() -> Path:
+    """Find reference_data directory relative to the a4d package.
+
+    The reference_data directory is at the repository root, shared between
+    R and Python pipelines. From src/a4d/utils/reference_data.py we navigate
+    up to the repo root.
+
+    Returns:
+        Path to reference_data directory
+
+    Raises:
+        FileNotFoundError: If reference_data directory not found
+    """
+    # Navigate from src/a4d/utils/reference_data.py to repo root
+    # reference_data.py -> utils -> a4d -> src -> a4d-python -> repo root
+    repo_root = Path(__file__).parents[4]
+    reference_data_dir = repo_root / "reference_data"
+
+    if not reference_data_dir.exists():
+        raise FileNotFoundError(f"reference_data directory not found at {reference_data_dir}")
+
+    return reference_data_dir
+
+
+def load_yaml(
+    yaml_path: Path,
+    relative_to_reference_data: bool = False,
+) -> Any:
+    """Load and parse a YAML file.
+
+    Args:
+        yaml_path: Path to the YAML file
+        relative_to_reference_data: If True, yaml_path is relative to
+                                    reference_data directory
+
+    Returns:
+        Parsed YAML content
+
+    Raises:
+        FileNotFoundError: If the YAML file doesn't exist
+        yaml.YAMLError: If the YAML file is malformed
+    """
+    if relative_to_reference_data:
+        reference_data_dir = find_reference_data_dir()
+        yaml_path = reference_data_dir / yaml_path
+
+    if not yaml_path.exists():
+        raise FileNotFoundError(f"YAML file not found: {yaml_path}")
+
+    logger.debug(f"Loading YAML file: {yaml_path}")
+
+    with open(yaml_path) as f:
+        return yaml.safe_load(f)
+
+
+def get_reference_data_path(*parts: str) -> Path:
+    """Get path to a file in reference_data directory.
+
+    Args:
+        *parts: Path components relative to reference_data directory
+
+    Returns:
+        Absolute path to the file
+
+    Example:
+        >>> path = get_reference_data_path("synonyms", "synonyms_patient.yaml")
+        >>> # Returns: /path/to/repo/reference_data/synonyms/synonyms_patient.yaml
+    """
+    reference_data_dir = find_reference_data_dir()
+    return reference_data_dir.joinpath(*parts)
diff --git a/a4d-python/src/a4d/reference/provinces.py b/a4d-python/src/a4d/reference/provinces.py
new file mode 100644
index 0000000..2fa1694
--- /dev/null
+++ b/a4d-python/src/a4d/reference/provinces.py
@@ -0,0 +1,166 @@
+"""Province validation for patient data.
+
+This module loads allowed provinces from the reference_data YAML file
+and provides utilities for validation.
+"""
+
+from functools import lru_cache
+
+from loguru import logger
+
+from a4d.reference.loaders import get_reference_data_path, load_yaml
+
+
+@lru_cache
+def load_allowed_provinces() -> list[str]:
+    """Load all allowed provinces from YAML file (lowercased for case-insensitive matching).
+
+    Provinces are organized by country in the YAML file. This function
+    flattens them into a single list and lowercases them for validation.
+
+    The result is cached for performance since provinces don't change
+    during runtime.
+
+    Returns:
+        List of all allowed province names (lowercased) across all countries
+
+    Example:
+        >>> provinces = load_allowed_provinces()
+        >>> "bangkok" in provinces
+        True
+        >>> "BANGKOK" in provinces
+        False  # List is lowercased, use is_valid_province() for validation
+    """
+    path = get_reference_data_path("provinces", "allowed_provinces.yaml")
+    provinces_by_country: dict[str, list[str]] = load_yaml(path)
+
+    # Flatten all provinces into single list and lowercase for matching
+    all_provinces = []
+    for _, provinces in provinces_by_country.items():
+        all_provinces.extend(p.lower() for p in provinces)
+
+    logger.info(f"Loaded {len(all_provinces)} provinces from {len(provinces_by_country)} countries")
+
+    return all_provinces
+
+
+@lru_cache
+def load_provinces_by_country() -> dict[str, list[str]]:
+    """Load provinces organized by country (lowercased for case-insensitive matching).
+
+    Returns:
+        Dict mapping country names to lists of their provinces (lowercased)
+
+    Example:
+        >>> provinces = load_provinces_by_country()
+        >>> "bangkok" in provinces["THAILAND"]
+        True
+        >>> len(provinces["VIETNAM"])
+        63
+    """
+    path = get_reference_data_path("provinces", "allowed_provinces.yaml")
+    provinces_by_country_raw: dict[str, list[str]] = load_yaml(path)
+
+    # Lowercase all province names for case-insensitive matching
+    provinces_by_country = {
+        country: [p.lower() for p in provinces]
+        for country, provinces in provinces_by_country_raw.items()
+    }
+
+    logger.info(f"Loaded provinces for {len(provinces_by_country)} countries")
+
+    return provinces_by_country
+
+
+@lru_cache
+def load_canonical_provinces() -> list[str]:
+    """Load all allowed provinces with canonical casing (for validation).
+
+    Unlike load_allowed_provinces() which lowercases for matching,
+    this returns the original province names from the YAML with proper
+    casing and accents to use as canonical values in validation.
+
+    Returns:
+        List of all allowed province names (original casing) across all countries
+
+    Example:
+        >>> provinces = load_canonical_provinces()
+        >>> "Takéo" in provinces
+        True
+        >>> "Bangkok" in provinces
+        True
+    """
+    path = get_reference_data_path("provinces", "allowed_provinces.yaml")
+    provinces_by_country: dict[str, list[str]] = load_yaml(path)
+
+    # Flatten all provinces into single list WITHOUT lowercasing
+    all_provinces = []
+    for _, provinces in provinces_by_country.items():
+        all_provinces.extend(provinces)
+
+    logger.info(
+        f"Loaded {len(all_provinces)} canonical province names "
+        f"from {len(provinces_by_country)} countries"
+    )
+
+    return all_provinces
+
+
+def is_valid_province(province: str | None) -> bool:
+    """Check if a province name is valid (case-insensitive).
+
+    Args:
+        province: Province name to validate (case-insensitive, None allowed)
+
+    Returns:
+        True if province is None or in the allowed list, False otherwise
+
+    Example:
+        >>> is_valid_province("Bangkok")
+        True
+        >>> is_valid_province("BANGKOK")
+        True
+        >>> is_valid_province("bangkok")
+        True
+        >>> is_valid_province(None)
+        True
+        >>> is_valid_province("Invalid Province")
+        False
+    """
+    if province is None:
+        return True
+
+    allowed = load_allowed_provinces()
+    return province.lower() in allowed
+
+
+def get_country_for_province(province: str) -> str | None:
+    """Get the country for a given province (case-insensitive).
+
+    Args:
+        province: Province name (case-insensitive)
+
+    Returns:
+        Country name if province is found, None otherwise
+
+    Example:
+        >>> get_country_for_province("Bangkok")
+        'THAILAND'
+        >>> get_country_for_province("bangkok")
+        'THAILAND'
+        >>> get_country_for_province("BANGKOK")
+        'THAILAND'
+    """
+    provinces_by_country = load_provinces_by_country()
+    province_lower = province.lower()
+
+    for country, provinces in provinces_by_country.items():
+        if province_lower in provinces:
+            return country
+
+    return None
+
+
+if __name__ == "__main__":
+    for c, p in load_provinces_by_country().items():
+        print(f"{c}: {p}")
diff --git a/a4d-python/src/a4d/reference/synonyms.py b/a4d-python/src/a4d/reference/synonyms.py
new file mode 100644
index 0000000..6d1c778
--- /dev/null
+++ b/a4d-python/src/a4d/reference/synonyms.py
@@ -0,0 +1,343 @@
+"""Column name mapper for standardizing tracker file columns.
+
+This module handles the mapping of various column name variants (synonyms)
+to standardized column names used throughout the pipeline.
+"""
+
+import re
+from pathlib import Path
+
+import polars as pl
+from loguru import logger
+
+from a4d.reference.loaders import get_reference_data_path, load_yaml
+
+
+def sanitize_str(text: str) -> str:
+    """Sanitize a string for column name matching.
+
+    Converts to lowercase, removes all spaces and special characters,
+    keeping only alphanumeric characters. This matches the R implementation.
+
+    Args:
+        text: String to sanitize
+
+    Returns:
+        Sanitized string with only lowercase alphanumeric characters
+
+    Examples:
+        >>> sanitize_str("Patient ID*")
+        'patientid'
+        >>> sanitize_str("Age* On Reporting")
+        'ageonreporting'
+        >>> sanitize_str("Date 2022")
+        'date2022'
+        >>> sanitize_str("My Awesome 1st Column!!")
+        'myawesome1stcolumn'
+    """
+    # Convert to lowercase
+    text = text.lower()
+    # Remove spaces
+    text = text.replace(" ", "")
+    # Remove all non-alphanumeric characters
+    text = re.sub(r"[^a-z0-9]", "", text)
+    return text
+
+
+class ColumnMapper:
+    """Maps synonym column names to standardized names.
+
+    Loads column synonyms from YAML files and provides methods to rename
+    DataFrame columns to their standardized names.
+
+    Example YAML structure:
+        age:
+            - Age
+            - Age*
+            - age on reporting
+            - Age (Years)
+        patient_id:
+            - ID
+            - Patient ID
+            - Patient ID*
+
+    Attributes:
+        yaml_path: Path to the synonym YAML file
+        synonyms: Dict mapping standard names to lists of synonyms
+        _lookup: Reverse lookup dict mapping SANITIZED synonyms to standard names
+
+    Note:
+        Synonym matching is case-insensitive and ignores special characters.
+        This matches the R implementation which uses sanitize_str() for both
+        column names and synonym keys before matching.
+    """
+
+    def __init__(self, yaml_path: Path):
+        """Initialize the mapper by loading synonyms from YAML.
+
+        Args:
+            yaml_path: Path to the synonym YAML file
+
+        Raises:
+            FileNotFoundError: If the YAML file doesn't exist
+            yaml.YAMLError: If the YAML file is malformed
+        """
+        self.yaml_path = yaml_path
+        self.synonyms: dict[str, list[str]] = load_yaml(yaml_path)
+
+        # Build reverse lookup: sanitized_synonym -> standard_name
+        # This matches R's behavior: sanitize both column names and synonym keys
+        self._lookup: dict[str, str] = self._build_lookup()
+
+        logger.info(
+            f"Loaded {len(self.synonyms)} standard columns with "
+            f"{len(self._lookup)} total synonyms from {yaml_path.name}"
+        )
+
+    def _build_lookup(self) -> dict[str, str]:
+        """Build reverse lookup dictionary from SANITIZED synonyms to standard names.
+
+        Sanitizes all synonym keys before adding to lookup, matching R's behavior.
+
+        Returns:
+            Dict mapping each SANITIZED synonym to its standard column name
+
+        Example:
+            >>> # YAML has: patient_id: ["Patient ID", "Patient ID*", "ID"]
+            >>> # Lookup will have: {"patientid": "patient_id", "id": "patient_id"}
+        """
+        lookup = {}
+        for standard_name, synonym_list in self.synonyms.items():
+            # Handle empty lists (columns with no synonyms)
+            if not synonym_list:
+                continue
+
+            for synonym in synonym_list:
+                # Sanitize the synonym key before adding to lookup
+                sanitized_key = sanitize_str(synonym)
+
+                if sanitized_key in lookup:
+                    logger.warning(
+                        f"Duplicate sanitized synonym '{sanitized_key}' "
+                        f"(from '{synonym}') found for both "
+                        f"'{lookup[sanitized_key]}' and '{standard_name}'. "
+                        f"Using '{standard_name}'."
+                    )
+                lookup[sanitized_key] = standard_name
+
+        return lookup
+
+    def get_standard_name(self, column: str) -> str:
+        """Get the standard name for a column.
+
+        Sanitizes the input column name before lookup to match R behavior.
+
+        Args:
+            column: Column name (may be a synonym, with special characters/spaces)
+
+        Returns:
+            Standard column name, or original if no mapping exists
+
+        Example:
+            >>> mapper.get_standard_name("Patient ID*")
+            'patient_id'  # "Patient ID*" → "patientid" → "patient_id"
+            >>> mapper.get_standard_name("Age* On Reporting")
+            'age'  # "Age* On Reporting" → "ageonreporting" → "age"
+        """
+        # Sanitize input column name before lookup (matches R behavior)
+        sanitized_col = sanitize_str(column)
+        return self._lookup.get(sanitized_col, column)
+
+    def is_known_column(self, column: str) -> bool:
+        """Check if column name maps to a known standard name.
+
+        Used for validating forward-filled headers during Excel extraction.
+        Returns True if the column is either a known synonym or a standard name.
+
+        Args:
+            column: Column name to check
+
+        Returns:
+            True if column maps to a known standard name
+
+        Example:
+            >>> mapper.is_known_column("Current Patient Observations Category")
+            True  # Maps to observations_category
+            >>> mapper.is_known_column("Level of Support Status")
+            False  # No such column in synonyms
+        """
+        sanitized = sanitize_str(column)
+        return sanitized in self._lookup or column in self.synonyms
+
+    def rename_columns(
+        self,
+        df: pl.DataFrame,
+        strict: bool = False,
+    ) -> pl.DataFrame:
+        """Rename DataFrame columns using synonym mappings.
+
+        Args:
+            df: Input DataFrame with potentially non-standard column names
+            strict: If True, raise error if unmapped columns exist
+                If False, keep unmapped columns as-is
+
+        Returns:
+            DataFrame with standardized column names
+
+        Raises:
+            ValueError: If strict=True and unmapped columns exist
+        """
+        # Build rename mapping for columns that need renaming
+        rename_map = {}
+        unmapped_columns = []
+
+        for col in df.columns:
+            standard_name = self.get_standard_name(col)
+
+            if standard_name == col and col not in self.synonyms:
+                # Column is not in lookup and not a standard name
+                unmapped_columns.append(col)
+            elif standard_name != col:
+                # Column needs to be renamed
+                rename_map[col] = standard_name
+
+        # Log unmapped columns
+        if unmapped_columns:
+            if strict:
+                raise ValueError(
+                    f"Unmapped columns found: {unmapped_columns}. "
+                    "These columns do not appear in the synonym file."
+                )
+            else:
+                logger.warning(
+                    f"Keeping {len(unmapped_columns)} unmapped columns as-is: {unmapped_columns}"
+                )
+
+        # Handle duplicate mappings: multiple source columns mapping to same target
+        # Keep only first occurrence, drop the rest (edge case from discontinued 2023 format)
+        target_counts: dict[str, int] = {}
+        for target in rename_map.values():
+            target_counts[target] = target_counts.get(target, 0) + 1
+
+        if any(count > 1 for count in target_counts.values()):
+            duplicates = {t: c for t, c in target_counts.items() if c > 1}
+            logger.warning(
+                f"Multiple source columns map to same target name: {duplicates}. "
+                "Keeping first occurrence only. "
+                "This is an edge case from discontinued 2023 format."
+            )
+
+            # Keep only first occurrence of each target
+            seen_targets: set[str] = set()
+            columns_to_drop = []
+
+            for source_col, target_col in rename_map.items():
+                if target_col in duplicates:
+                    if target_col in seen_targets:
+                        # Duplicate - drop it
+                        columns_to_drop.append(source_col)
+                        logger.debug(
+                            f"Dropping duplicate source column '{source_col}' "
+                            f"(maps to '{target_col}')"
+                        )
+                    else:
+                        # First occurrence - keep it
+                        seen_targets.add(target_col)
+
+            # Drop duplicates before renaming
+            if columns_to_drop:
+                df = df.drop(columns_to_drop)
+                # Remove dropped columns from rename_map
+                for col in columns_to_drop:
+                    del rename_map[col]
+
+        # Log successful mappings
+        if rename_map:
+            logger.debug(f"Renaming {len(rename_map)} columns: {list(rename_map.items())}")
+
+        return df.rename(rename_map) if rename_map else df
+
+    def get_expected_columns(self) -> set[str]:
+        """Get set of all standard column names.
+
+        Returns:
+            Set of standard column names defined in the synonym file
+        """
+        return set(self.synonyms)
+
+    def get_missing_columns(self, df: pl.DataFrame) -> set[str]:
+        """Get standard columns that are missing from the DataFrame.
+
+        Args:
+            df: DataFrame to check
+
+        Returns:
+            Set of standard column names not present in the DataFrame
+        """
+        current_columns = set(df.columns)
+        expected_columns = self.get_expected_columns()
+        return expected_columns - current_columns
+
+    def validate_required_columns(
+        self,
+        df: pl.DataFrame,
+        required: list[str],
+    ) -> None:
+        """Validate that required columns are present after renaming.
+
+        Args:
+            df: DataFrame to validate
+            required: List of required standard column names
+
+        Raises:
+            ValueError: If any required columns are missing
+        """
+        missing = set(required) - set(df.columns)
+        if missing:
+            raise ValueError(f"Required columns missing after renaming: {missing}")
+
+
+def load_patient_mapper() -> ColumnMapper:
+    """Load the patient data column mapper.
+
+    Returns:
+        ColumnMapper for patient data
+
+    Example:
+        >>> mapper = load_patient_mapper()
+        >>> df = mapper.rename_columns(raw_df)
+    """
+    path = get_reference_data_path("synonyms", "synonyms_patient.yaml")
+    return ColumnMapper(path)
+
+
+def load_product_mapper() -> ColumnMapper:
+    """Load the product data column mapper.
+
+    Returns:
+        ColumnMapper for product data
+
+    Example:
+        >>> mapper = load_product_mapper()
+        >>> df = mapper.rename_columns(raw_df)
+    """
+    path = get_reference_data_path("synonyms", "synonyms_product.yaml")
+    return ColumnMapper(path)
+
+
+if __name__ == "__main__":
+    # Example usage
+    patient_mapper = load_patient_mapper()
+    product_mapper = load_product_mapper()
+
+    # Example DataFrame
+    df = pl.DataFrame(
+        {
+            "Age": [25, 30],
+            "Patient ID": [1, 2],
+            "Product Name": ["A", "B"],
+        }
+    )
+
+    renamed_df = patient_mapper.rename_columns(df)
+    print(renamed_df)
diff --git a/a4d-python/src/a4d/state/__init__.py b/a4d-python/src/a4d/state/__init__.py
new file mode 100644
index 0000000..e69de29
diff --git a/a4d-python/src/a4d/tables/__init__.py b/a4d-python/src/a4d/tables/__init__.py
new file mode 100644
index 0000000..434cbbb
--- /dev/null
+++ b/a4d-python/src/a4d/tables/__init__.py
@@ -0,0 +1,18 @@
+"""Table creation module for final output tables."""
+
+from a4d.tables.logs import create_table_logs, parse_log_file
+from a4d.tables.patient import (
+    create_table_patient_data_annual,
+    create_table_patient_data_monthly,
+    create_table_patient_data_static,
+    read_cleaned_patient_data,
+)
+
+__all__ = [
+    "create_table_patient_data_annual",
+    "create_table_patient_data_monthly",
+    "create_table_patient_data_static",
+    "read_cleaned_patient_data",
+    "create_table_logs",
+    "parse_log_file",
+]
diff --git a/a4d-python/src/a4d/tables/logs.py b/a4d-python/src/a4d/tables/logs.py
new file mode 100644
index 0000000..4c7428c
--- /dev/null
+++ b/a4d-python/src/a4d/tables/logs.py
@@ -0,0 +1,220 @@
+"""Create logs table from pipeline execution logs.
+
+This module reads all JSON-formatted log files created by the pipeline
+and creates a structured table for BigQuery upload and dashboard analysis.
+
+Log files are created by loguru with serialize=True, producing JSON lines format.
+Each line contains structured data about pipeline execution: timestamps, levels,
+messages, source locations, exceptions, and custom context fields.
+"""
+
+import json
+from pathlib import Path
+
+import polars as pl
+from loguru import logger
+
+
+def parse_log_file(log_file: Path) -> pl.DataFrame:
+    """Parse a single JSON lines log file into a DataFrame.
+
+    Args:
+        log_file: Path to .log file (JSON lines format from loguru)
+
+    Returns:
+        DataFrame with parsed log records, or empty DataFrame if file is invalid
+
+    Example:
+        >>> df = parse_log_file(Path("output/logs/2024_Penang_patient.log"))
+        >>> df.columns
+        ['timestamp', 'level', 'message', 'log_file', ...]
+    """
+    records = []
+
+    try:
+        with open(log_file, encoding="utf-8") as f:
+            for line_num, line in enumerate(f, 1):
+                line = line.strip()
+
+                try:
+                    log_entry = json.loads(line)
+                    record_data = log_entry.get("record", {})
+
+                    # Extract timestamp
+                    time_data = record_data.get("time", {})
+                    timestamp = time_data.get("timestamp")
+
+                    # Extract level
+                    level_data = record_data.get("level", {})
+                    level = level_data.get("name", "UNKNOWN")
+
+                    # Extract message
+                    message = record_data.get("message", "")
+
+                    # Extract source location
+                    file_data = record_data.get("file", {})
+                    source_file = file_data.get("name", "")
+                    source_path = file_data.get("path", "")
+
+                    function = record_data.get("function", "")
+                    line = record_data.get("line", 0)
+                    module = record_data.get("module", "")
+
+                    # Extract context fields (file_name, tracker_year, tracker_month)
+                    extra = record_data.get("extra", {})
+                    file_name = extra.get("file_name")
+                    tracker_year = extra.get("tracker_year")
+                    tracker_month = extra.get("tracker_month")
+
+                    # Extract process info (useful for debugging parallel processing)
+                    process_data = record_data.get("process", {})
+                    process_name = process_data.get("name", "")
+
+                    # Extract exception info if present
+                    exception = record_data.get("exception")
+                    has_exception = exception is not None
+                    exception_type = None
+                    exception_value = None
+
+                    if has_exception and exception:
+                        exception_type = exception.get("type")
+                        exception_value = exception.get("value")
+
+                    # Create record
+                    records.append(
+                        {
+                            "timestamp": timestamp,
+                            "level": level,
+                            "message": message,
+                            "log_file": log_file.name,
+                            "file_name": file_name,
+                            "tracker_year": tracker_year,
+                            "tracker_month": tracker_month,
+                            "source_file": source_file,
+                            "source_path": source_path,
+                            "function": function,
+                            "line": line,
+                            "module": module,
+                            "process_name": process_name,
+                            "has_exception": has_exception,
+                            "exception_type": exception_type,
+                            "exception_value": exception_value,
+                        }
+                    )
+
+                except json.JSONDecodeError as e:
+                    logger.warning(f"Failed to parse JSON in {log_file.name}:{line_num}: {e}")
+                    continue
+                except Exception as e:
+                    logger.warning(f"Error processing line {line_num} in {log_file.name}: {e}")
+                    continue
+
+    except Exception as e:
+        logger.error(f"Failed to read log file {log_file.name}: {e}")
+        return pl.DataFrame()
+
+    if not records:
+        return pl.DataFrame()
+
+    # Create DataFrame with proper types
+    df = pl.DataFrame(records)
+
+    # Cast categorical columns for efficiency
+    df = df.with_columns(
+        [
+            pl.col("level").cast(pl.Categorical),
+            pl.col("log_file").cast(pl.Categorical),
+            pl.col("source_file").cast(pl.Categorical),
+            pl.col("function").cast(pl.Categorical),
+            pl.col("module").cast(pl.Categorical),
+            pl.col("process_name").cast(pl.Categorical),
+        ]
+    )
+
+    return df
+
+
+def create_table_logs(logs_dir: Path, output_dir: Path) -> Path:
+    """Create logs table from all pipeline log files.
+
+    Reads all .log files from the logs directory, parses JSON lines,
+    and creates a structured table for BigQuery upload.
+
+    Args:
+        logs_dir: Directory containing .log files (e.g., output/logs/)
+        output_dir: Directory to write the logs table parquet
+
+    Returns:
+        Path to created logs table parquet file
+
+    Example:
+        >>> logs_path = create_table_logs(
+        ...     Path("output/logs"),
+        ...     Path("output/tables")
+        ... )
+        >>> logs_path
+        Path('output/tables/table_logs.parquet')
+    """
+    logger.info(f"Creating logs table from: {logs_dir}")
+
+    # Find all .log files (exclude .zip compressed files)
+    log_files = sorted(logs_dir.glob("*.log"))
+    logger.info(f"Found {len(log_files)} log files to process")
+
+    if not log_files:
+        logger.warning("No log files found, creating empty logs table")
+        # Create empty DataFrame with correct schema
+        empty_df = pl.DataFrame(
+            schema={
+                "timestamp": pl.Datetime,
+                "level": pl.Categorical,
+                "message": pl.Utf8,
+                "log_file": pl.Categorical,
+                "file_name": pl.Utf8,
+                "tracker_year": pl.Int32,
+                "tracker_month": pl.Int32,
+                "source_file": pl.Categorical,
+                "source_path": pl.Utf8,
+                "function": pl.Categorical,
+                "line": pl.Int32,
+                "module": pl.Categorical,
+                "process_name": pl.Categorical,
+                "has_exception": pl.Boolean,
+                "exception_type": pl.Utf8,
+                "exception_value": pl.Utf8,
+            }
+        )
+        output_dir.mkdir(parents=True, exist_ok=True)
+        output_file = output_dir / "table_logs.parquet"
+        empty_df.write_parquet(output_file)
+        return output_file
+
+    # Parse all log files
+    all_logs = []
+    for log_file in log_files:
+        logger.debug(f"Parsing: {log_file.name}")
+        df = parse_log_file(log_file)
+        if len(df) > 0:
+            all_logs.append(df)
+
+    logs_table = pl.concat(all_logs, how="vertical")
+
+    # Sort by timestamp for chronological analysis
+    logs_table = logs_table.sort("timestamp")
+
+    logger.info(f"Created logs table with {len(logs_table)} records")
+    logger.info(f"Date range: {logs_table['timestamp'].min()} to {logs_table['timestamp'].max()}")
+
+    # Log summary by level
+    level_counts = logs_table.group_by("level").agg(pl.count()).sort("level")
+    logger.info(f"Log level distribution: {level_counts.to_dict(as_series=False)}")
+
+    # Write to parquet
+    output_dir.mkdir(parents=True, exist_ok=True)
+    output_file = output_dir / "table_logs.parquet"
+    logs_table.write_parquet(output_file)
+
+    logger.info(f"Logs table saved: {output_file}")
+    logger.info(f"Table size: {output_file.stat().st_size / 1024 / 1024:.2f} MB")
+
+    return output_file
diff --git a/a4d-python/src/a4d/tables/patient.py b/a4d-python/src/a4d/tables/patient.py
new file mode 100644
index 0000000..1865a00
--- /dev/null
+++ b/a4d-python/src/a4d/tables/patient.py
@@ -0,0 +1,213 @@
+"""Create final patient data tables from cleaned data."""
+
+from pathlib import Path
+
+import polars as pl
+from loguru import logger
+
+
+def read_cleaned_patient_data(cleaned_files: list[Path]) -> pl.DataFrame:
+    """Read and combine all cleaned patient data files.
+
+    Args:
+        cleaned_files: List of paths to cleaned parquet files
+
+    Returns:
+        Combined DataFrame with all cleaned patient data
+    """
+    if not cleaned_files:
+        raise ValueError("No cleaned files provided")
+
+    dfs = [pl.read_parquet(file) for file in cleaned_files]
+    return pl.concat(dfs, how="vertical")
+
+
+def create_table_patient_data_static(cleaned_files: list[Path], output_dir: Path) -> Path:
+    """Create static patient data table.
+
+    Reads all cleaned patient data and creates a single table with static columns
+    (data that doesn't change monthly). Groups by patient_id and takes the latest
+    available data (latest year and month).
+
+    Args:
+        cleaned_files: List of paths to cleaned parquet files
+        output_dir: Directory to save output parquet file
+
+    Returns:
+        Path to created parquet file
+    """
+    static_columns = [
+        "clinic_id",
+        "dob",
+        "fbg_baseline_mg",
+        "fbg_baseline_mmol",
+        "file_name",
+        "hba1c_baseline",
+        "hba1c_baseline_exceeds",
+        "lost_date",
+        "name",
+        "patient_consent",
+        "patient_id",
+        "province",
+        "recruitment_date",
+        "sex",
+        "status_out",
+        "t1d_diagnosis_age",
+        "t1d_diagnosis_date",
+        "t1d_diagnosis_with_dka",
+        "tracker_date",
+        "tracker_month",
+        "tracker_year",
+    ]
+
+    patient_data = read_cleaned_patient_data(cleaned_files)
+
+    static_data = (
+        patient_data.select(static_columns)
+        .sort(["patient_id", "tracker_year", "tracker_month"])
+        .group_by("patient_id")
+        .last()
+        .sort(["tracker_year", "tracker_month", "patient_id"])
+    )
+
+    logger.info(f"Static patient data dimensions: {static_data.shape}")
+
+    output_file = output_dir / "patient_data_static.parquet"
+    output_dir.mkdir(parents=True, exist_ok=True)
+    static_data.write_parquet(output_file)
+
+    return output_file
+
+
+def create_table_patient_data_monthly(cleaned_files: list[Path], output_dir: Path) -> Path:
+    """Create monthly patient data table.
+
+    Reads all cleaned patient data and creates a single table with dynamic columns
+    (data that changes monthly). Keeps all monthly records.
+
+    Args:
+        cleaned_files: List of paths to cleaned parquet files
+        output_dir: Directory to save output parquet file
+
+    Returns:
+        Path to created parquet file
+    """
+    monthly_columns = [
+        "age",
+        "bmi",
+        "bmi_date",
+        "clinic_id",
+        "fbg_updated_date",
+        "fbg_updated_mg",
+        "fbg_updated_mmol",
+        "file_name",
+        "hba1c_updated",
+        "hba1c_updated_exceeds",
+        "hba1c_updated_date",
+        "height",
+        "hospitalisation_cause",
+        "hospitalisation_date",
+        "insulin_injections",
+        "insulin_regimen",
+        "insulin_total_units",
+        "insulin_type",
+        "insulin_subtype",
+        "last_clinic_visit_date",
+        "last_remote_followup_date",
+        "observations",
+        "observations_category",
+        "patient_id",
+        "sheet_name",
+        "status",
+        "support_level",
+        "testing_frequency",
+        "tracker_date",
+        "tracker_month",
+        "tracker_year",
+        "weight",
+    ]
+
+    patient_data = read_cleaned_patient_data(cleaned_files)
+
+    monthly_data = patient_data.select(monthly_columns).sort(
+        ["tracker_year", "tracker_month", "patient_id"]
+    )
+
+    logger.info(f"Monthly patient data dimensions: {monthly_data.shape}")
+
+    output_file = output_dir / "patient_data_monthly.parquet"
+    output_dir.mkdir(parents=True, exist_ok=True)
+    monthly_data.write_parquet(output_file)
+
+    return output_file
+
+
+def create_table_patient_data_annual(cleaned_files: list[Path], output_dir: Path) -> Path:
+    """Create annual patient data table.
+
+    Reads all cleaned patient data and creates a single table with annual columns
+    (data collected once per year). Groups by patient_id and tracker_year, taking
+    the latest month for each year. Only includes data from 2024 onwards.
+
+    Args:
+        cleaned_files: List of paths to cleaned parquet files
+        output_dir: Directory to save output parquet file
+
+    Returns:
+        Path to created parquet file
+    """
+    annual_columns = [
+        "patient_id",
+        "status",
+        "edu_occ",
+        "edu_occ_updated",
+        "blood_pressure_updated",
+        "blood_pressure_sys_mmhg",
+        "blood_pressure_dias_mmhg",
+        "complication_screening_kidney_test_date",
+        "complication_screening_kidney_test_value",
+        "complication_screening_eye_exam_date",
+        "complication_screening_eye_exam_value",
+        "complication_screening_foot_exam_date",
+        "complication_screening_foot_exam_value",
+        "complication_screening_lipid_profile_date",
+        "complication_screening_lipid_profile_triglycerides_value",
+        "complication_screening_lipid_profile_cholesterol_value",
+        "complication_screening_lipid_profile_ldl_mg_value",
+        "complication_screening_lipid_profile_ldl_mmol_value",
+        "complication_screening_lipid_profile_hdl_mg_value",
+        "complication_screening_lipid_profile_hdl_mmol_value",
+        "complication_screening_thyroid_test_date",
+        "complication_screening_thyroid_test_ft4_ng_value",
+        "complication_screening_thyroid_test_ft4_pmol_value",
+        "complication_screening_thyroid_test_tsh_value",
+        "complication_screening_remarks",
+        "dm_complication_eye",
+        "dm_complication_kidney",
+        "dm_complication_others",
+        "dm_complication_remarks",
+        "family_history",
+        "other_issues",
+        "tracker_date",
+        "tracker_month",
+        "tracker_year",
+    ]
+
+    patient_data = read_cleaned_patient_data(cleaned_files)
+
+    annual_data = (
+        patient_data.select(annual_columns)
+        .filter(pl.col("tracker_year") >= 2024)
+        .sort(["patient_id", "tracker_year", "tracker_month"])
+        .group_by(["patient_id", "tracker_year"])
+        .last()
+        .sort(["tracker_year", "tracker_month", "patient_id"])
+    )
+
+    logger.info(f"Annual patient data dimensions: {annual_data.shape}")
+
+    output_file = output_dir / "patient_data_annual.parquet"
+    output_dir.mkdir(parents=True, exist_ok=True)
+    annual_data.write_parquet(output_file)
+
+    return output_file
diff --git a/a4d-python/src/a4d/utils/__init__.py b/a4d-python/src/a4d/utils/__init__.py
new file mode 100644
index 0000000..12455b7
--- /dev/null
+++ b/a4d-python/src/a4d/utils/__init__.py
@@ -0,0 +1,3 @@
+"""Utility modules."""
+
+__all__ = []
diff --git a/a4d-python/tests/test_clean/__init__.py b/a4d-python/tests/test_clean/__init__.py
new file mode 100644
index 0000000..167c8d2
--- /dev/null
+++ b/a4d-python/tests/test_clean/__init__.py
@@ -0,0 +1 @@
+"""Tests for data cleaning modules."""
diff --git a/a4d-python/tests/test_clean/test_converters.py b/a4d-python/tests/test_clean/test_converters.py
new file mode 100644
index 0000000..ab48665
--- /dev/null
+++ b/a4d-python/tests/test_clean/test_converters.py
@@ -0,0 +1,337 @@
+"""Tests for type conversion with error tracking."""
+
+import polars as pl
+
+from a4d.clean.converters import (
+    correct_decimal_sign,
+    cut_numeric_value,
+    safe_convert_column,
+    safe_convert_multiple_columns,
+)
+from a4d.config import settings
+from a4d.errors import ErrorCollector
+
+
+def test_safe_convert_column_success():
+    """Test successful conversion without errors."""
+    df = pl.DataFrame(
+        {
+            "file_name": ["test.xlsx"] * 3,
+            "patient_id": ["XX_YY001", "XX_YY002", "XX_YY003"],
+            "age": ["25", "30", "18"],
+        }
+    )
+
+    collector = ErrorCollector()
+
+    result = safe_convert_column(
+        df=df,
+        column="age",
+        target_type=pl.Int32,
+        error_collector=collector,
+    )
+
+    assert result.schema["age"] == pl.Int32
+    assert result["age"].to_list() == [25, 30, 18]
+    assert len(collector) == 0  # No errors
+
+
+def test_safe_convert_column_with_failures():
+    """Test conversion with some failures."""
+    df = pl.DataFrame(
+        {
+            "file_name": ["test.xlsx"] * 4,
+            "patient_id": ["XX_YY001", "XX_YY002", "XX_YY003", "XX_YY004"],
+            "age": ["25", "invalid", "30", "abc"],
+        }
+    )
+
+    collector = ErrorCollector()
+
+    result = safe_convert_column(
+        df=df,
+        column="age",
+        target_type=pl.Int32,
+        error_collector=collector,
+    )
+
+    assert result.schema["age"] == pl.Int32
+    assert result["age"].to_list() == [
+        25,
+        int(settings.error_val_numeric),
+        30,
+        int(settings.error_val_numeric),
+    ]
+    assert len(collector) == 2  # Two failures
+
+    # Check error details
+    errors_df = collector.to_dataframe()
+    assert errors_df.filter(pl.col("patient_id") == "XX_YY002")["original_value"][0] == "invalid"
+    assert errors_df.filter(pl.col("patient_id") == "XX_YY004")["original_value"][0] == "abc"
+    assert all(errors_df["error_code"] == "type_conversion")
+
+
+def test_safe_convert_column_preserves_nulls():
+    """Test that existing nulls are preserved."""
+    df = pl.DataFrame(
+        {
+            "file_name": ["test.xlsx"] * 3,
+            "patient_id": ["XX_YY001", "XX_YY002", "XX_YY003"],
+            "age": ["25", None, "30"],
+        }
+    )
+
+    collector = ErrorCollector()
+
+    result = safe_convert_column(
+        df=df,
+        column="age",
+        target_type=pl.Int32,
+        error_collector=collector,
+    )
+
+    assert result["age"].to_list() == [25, None, 30]
+    assert len(collector) == 0  # Nulls are not errors
+
+
+def test_correct_decimal_sign():
+    """Test decimal sign correction."""
+    df = pl.DataFrame(
+        {
+            "weight": ["70,5", "80,2", "65.5"],
+        }
+    )
+
+    result = correct_decimal_sign(df, "weight")
+
+    assert result["weight"].to_list() == ["70.5", "80.2", "65.5"]
+
+
+def test_cut_numeric_value():
+    """Test cutting out-of-range values."""
+    df = pl.DataFrame(
+        {
+            "file_name": ["test.xlsx"] * 5,
+            "patient_id": ["XX_YY001", "XX_YY002", "XX_YY003", "XX_YY004", "XX_YY005"],
+            "age": [15, -5, 20, 30, 18],
+        }
+    )
+
+    collector = ErrorCollector()
+
+    result = cut_numeric_value(
+        df=df,
+        column="age",
+        min_val=0,
+        max_val=25,
+        error_collector=collector,
+    )
+
+    assert result["age"].to_list() == [
+        15,
+        settings.error_val_numeric,  # -5 replaced
+        20,
+        settings.error_val_numeric,  # 30 replaced
+        18,
+    ]
+    assert len(collector) == 2  # Two values out of range
+
+
+def test_safe_convert_multiple_columns():
+    """Test batch conversion of multiple columns."""
+    df = pl.DataFrame(
+        {
+            "file_name": ["test.xlsx"] * 2,
+            "patient_id": ["XX_YY001", "XX_YY002"],
+            "age": ["25", "30"],
+            "height": ["1.75", "1.80"],
+            "weight": ["70", "80"],
+        }
+    )
+
+    collector = ErrorCollector()
+
+    result = safe_convert_multiple_columns(
+        df=df,
+        columns=["age", "height", "weight"],
+        target_type=pl.Float64,
+        error_collector=collector,
+    )
+
+    assert result.schema["age"] == pl.Float64
+    assert result.schema["height"] == pl.Float64
+    assert result.schema["weight"] == pl.Float64
+    assert len(collector) == 0
+
+
+def test_safe_convert_column_missing_column():
+    """Test that missing columns are handled gracefully."""
+    df = pl.DataFrame(
+        {
+            "file_name": ["test.xlsx"],
+            "patient_id": ["XX_YY001"],
+        }
+    )
+
+    collector = ErrorCollector()
+
+    # Should not raise error
+    result = safe_convert_column(
+        df=df,
+        column="nonexistent",
+        target_type=pl.Int32,
+        error_collector=collector,
+    )
+
+    assert result.equals(df)
+    assert len(collector) == 0
+
+
+def test_safe_convert_column_float64():
+    """Test conversion to Float64 with decimal values."""
+    df = pl.DataFrame(
+        {
+            "file_name": ["test.xlsx"] * 3,
+            "patient_id": ["XX_YY001", "XX_YY002", "XX_YY003"],
+            "weight": ["70.5", "not_a_number", "85.2"],
+        }
+    )
+
+    collector = ErrorCollector()
+
+    result = safe_convert_column(
+        df=df,
+        column="weight",
+        target_type=pl.Float64,
+        error_collector=collector,
+    )
+
+    assert result.schema["weight"] == pl.Float64
+    assert result["weight"][0] == 70.5
+    assert result["weight"][1] == settings.error_val_numeric
+    assert result["weight"][2] == 85.2
+    assert len(collector) == 1
+
+
+def test_safe_convert_column_custom_error_value():
+    """Test using a custom error value."""
+    df = pl.DataFrame(
+        {
+            "file_name": ["test.xlsx"] * 2,
+            "patient_id": ["XX_YY001", "XX_YY002"],
+            "age": ["25", "invalid"],
+        }
+    )
+
+    collector = ErrorCollector()
+
+    result = safe_convert_column(
+        df=df,
+        column="age",
+        target_type=pl.Int32,
+        error_collector=collector,
+        error_value=-1,
+    )
+
+    assert result["age"].to_list() == [25, -1]
+    assert len(collector) == 1
+
+
+def test_safe_convert_column_string_type():
+    """Test conversion to string type (always succeeds)."""
+    df = pl.DataFrame(
+        {
+            "file_name": ["test.xlsx"] * 2,
+            "patient_id": ["XX_YY001", "XX_YY002"],
+            "value": [123, 456],
+        }
+    )
+
+    collector = ErrorCollector()
+
+    result = safe_convert_column(
+        df=df,
+        column="value",
+        target_type=pl.Utf8,
+        error_collector=collector,
+    )
+
+    assert result.schema["value"] == pl.Utf8
+    assert result["value"].to_list() == ["123", "456"]
+    assert len(collector) == 0
+
+
+def test_correct_decimal_sign_missing_column():
+    """Test decimal sign correction with missing column."""
+    df = pl.DataFrame({"other": ["value"]})
+
+    result = correct_decimal_sign(df, "nonexistent")
+
+    assert result.equals(df)
+
+
+def test_cut_numeric_value_missing_column():
+    """Test cutting with missing column."""
+    df = pl.DataFrame({"other": [1, 2, 3]})
+
+    collector = ErrorCollector()
+
+    result = cut_numeric_value(
+        df=df,
+        column="nonexistent",
+        min_val=0,
+        max_val=10,
+        error_collector=collector,
+    )
+
+    assert result.equals(df)
+    assert len(collector) == 0
+
+
+def test_cut_numeric_value_with_nulls():
+    """Test that nulls are preserved when cutting values."""
+    df = pl.DataFrame(
+        {
+            "file_name": ["test.xlsx"] * 4,
+            "patient_id": ["XX_YY001", "XX_YY002", "XX_YY003", "XX_YY004"],
+            "age": [15, None, 30, 20],
+        }
+    )
+
+    collector = ErrorCollector()
+
+    result = cut_numeric_value(
+        df=df,
+        column="age",
+        min_val=0,
+        max_val=25,
+        error_collector=collector,
+    )
+
+    assert result["age"].to_list() == [15, None, settings.error_val_numeric, 20]
+    assert len(collector) == 1  # Only 30 is out of range
+
+
+def test_cut_numeric_value_ignores_existing_errors():
+    """Test that existing error values are not re-logged."""
+    df = pl.DataFrame(
+        {
+            "file_name": ["test.xlsx"] * 3,
+            "patient_id": ["XX_YY001", "XX_YY002", "XX_YY003"],
+            "age": [15.0, settings.error_val_numeric, 30.0],
+        }
+    )
+
+    collector = ErrorCollector()
+
+    result = cut_numeric_value(
+        df=df,
+        column="age",
+        min_val=0,
+        max_val=25,
+        error_collector=collector,
+    )
+
+    # Only 30 should be logged, not the existing error value
+    assert result["age"].to_list() == [15, settings.error_val_numeric, settings.error_val_numeric]
+    assert len(collector) == 1
diff --git a/a4d-python/tests/test_clean/test_patient.py b/a4d-python/tests/test_clean/test_patient.py
new file mode 100644
index 0000000..65b603b
--- /dev/null
+++ b/a4d-python/tests/test_clean/test_patient.py
@@ -0,0 +1,418 @@
+"""Unit tests for patient cleaning functions."""
+
+from datetime import date
+
+import polars as pl
+
+from a4d.clean.patient import (
+    _apply_preprocessing,
+    _fix_age_from_dob,
+    _fix_t1d_diagnosis_age,
+)
+from a4d.config import settings
+from a4d.errors import ErrorCollector
+
+
+class TestPatientIdNormalization:
+    """Tests for patient_id normalization (transfer clinic suffix removal)."""
+
+    def test_normalize_transfer_patient_id(self):
+        """Should normalize patient_id by removing transfer clinic suffix."""
+        df = pl.DataFrame(
+            {
+                "patient_id": ["MY_SM003_SB", "TH_BK001_PT", "LA_VT002_VP"],
+                "name": ["Patient A", "Patient B", "Patient C"],
+            }
+        )
+
+        result = _apply_preprocessing(df)
+
+        assert result["patient_id"].to_list() == ["MY_SM003", "TH_BK001", "LA_VT002"]
+
+    def test_preserve_normal_patient_id(self):
+        """Should preserve patient_id without transfer suffix."""
+        df = pl.DataFrame(
+            {
+                "patient_id": ["MY_SB001", "TH_ST003", "LA_LFH042"],
+                "name": ["Patient A", "Patient B", "Patient C"],
+            }
+        )
+
+        result = _apply_preprocessing(df)
+
+        # Should remain unchanged
+        assert result["patient_id"].to_list() == ["MY_SB001", "TH_ST003", "LA_LFH042"]
+
+    def test_mixed_patient_ids(self):
+        """Should handle mix of normal and transfer patient IDs."""
+        df = pl.DataFrame(
+            {
+                "patient_id": [
+                    "MY_SB001",  # Normal
+                    "MY_SM003_SB",  # Transfer
+                    "TH_ST003",  # Normal
+                    "TH_BK001_PT",  # Transfer
+                ],
+                "name": ["A", "B", "C", "D"],
+            }
+        )
+
+        result = _apply_preprocessing(df)
+
+        assert result["patient_id"].to_list() == [
+            "MY_SB001",
+            "MY_SM003",  # Normalized
+            "TH_ST003",
+            "TH_BK001",  # Normalized
+        ]
+
+    def test_multiple_underscores_keeps_only_first_two_parts(self):
+        """Should keep only first two underscore-separated parts."""
+        df = pl.DataFrame(
+            {
+                "patient_id": ["MY_SM003_SB_EXTRA"],  # Three underscores
+                "name": ["Patient A"],
+            }
+        )
+
+        result = _apply_preprocessing(df)
+
+        # Should extract only MY_SM003
+        assert result["patient_id"][0] == "MY_SM003"
+
+    def test_patient_id_without_underscores(self):
+        """Should preserve patient_id without underscores."""
+        df = pl.DataFrame(
+            {
+                "patient_id": ["MYID001", "NOMATCH"],
+                "name": ["Patient A", "Patient B"],
+            }
+        )
+
+        result = _apply_preprocessing(df)
+
+        # Pattern won't match, should keep original
+        assert result["patient_id"].to_list() == ["MYID001", "NOMATCH"]
+
+    def test_null_patient_id_preserved(self):
+        """Should preserve null patient_ids."""
+        df = pl.DataFrame(
+            {
+                "patient_id": [None, "MY_SB001", None],
+                "name": ["A", "B", "C"],
+            }
+        )
+
+        result = _apply_preprocessing(df)
+
+        assert result["patient_id"][0] is None
+        assert result["patient_id"][1] == "MY_SB001"
+        assert result["patient_id"][2] is None
+
+
+class TestHbA1cPreprocessing:
+    """Tests for HbA1c exceeds marker handling."""
+
+    def test_hba1c_baseline_exceeds_marker(self):
+        """Should extract > or < markers and remove them from value."""
+        df = pl.DataFrame(
+            {
+                "patient_id": ["XX_YY001", "XX_YY002", "XX_YY003"],
+                "hba1c_baseline": [">14", "<5.5", "7.2"],
+            }
+        )
+
+        result = _apply_preprocessing(df)
+
+        assert result["hba1c_baseline_exceeds"].to_list() == [True, True, False]
+        assert result["hba1c_baseline"].to_list() == ["14", "5.5", "7.2"]
+
+    def test_hba1c_updated_exceeds_marker(self):
+        """Should extract > or < markers from updated HbA1c."""
+        df = pl.DataFrame(
+            {
+                "patient_id": ["XX_YY001"],
+                "hba1c_updated": [">12.5"],
+            }
+        )
+
+        result = _apply_preprocessing(df)
+
+        assert result["hba1c_updated_exceeds"][0] is True
+        assert result["hba1c_updated"][0] == "12.5"
+
+
+class TestFbgPreprocessing:
+    """Tests for FBG (fasting blood glucose) text value handling."""
+
+    def test_fbg_qualitative_to_numeric(self):
+        """Should convert qualitative FBG values to numeric."""
+        df = pl.DataFrame(
+            {
+                "patient_id": ["XX_YY001", "XX_YY002", "XX_YY003", "XX_YY004"],
+                "fbg_updated_mg": ["high", "medium", "low", "150"],
+            }
+        )
+
+        result = _apply_preprocessing(df)
+
+        # high→200, medium→170, low→140
+        assert result["fbg_updated_mg"].to_list() == ["200", "170", "140", "150"]
+
+    def test_fbg_removes_dka_marker(self):
+        """Should attempt to remove (DKA) marker from FBG values."""
+        df = pl.DataFrame(
+            {
+                "patient_id": ["XX_YY001"],
+                "fbg_updated_mg": ["350 (DKA)"],
+            }
+        )
+
+        result = _apply_preprocessing(df)
+
+        # Note: Current implementation lowercases first, then tries to remove literal "(DKA)"
+        # which doesn't match lowercase "(dka)", so it's not actually removed
+        # This is a known issue but matches current behavior
+        assert result["fbg_updated_mg"][0] == "350 (dka)"
+
+
+class TestYesNoHyphenReplacement:
+    """Tests for replacing '-' with 'N' in insulin-related Y/N columns."""
+
+    def test_replace_hyphen_in_insulin_columns(self):
+        """Should replace '-' with 'N' in analog insulin columns (2024+ trackers)."""
+        df = pl.DataFrame(
+            {
+                "patient_id": ["XX_YY001"],
+                "analog_insulin_long_acting": ["-"],
+                "analog_insulin_rapid_acting": ["-"],
+            }
+        )
+
+        result = _apply_preprocessing(df)
+
+        assert result["analog_insulin_long_acting"][0] == "N"
+        assert result["analog_insulin_rapid_acting"][0] == "N"
+
+    def test_preserve_hyphen_in_other_columns(self):
+        """Should NOT replace '-' in non-insulin Y/N columns."""
+        df = pl.DataFrame(
+            {
+                "patient_id": ["XX_YY001"],
+                "clinic_visit": ["-"],
+                "active": ["-"],
+            }
+        )
+
+        result = _apply_preprocessing(df)
+
+        # These columns are not in the insulin list, so '-' is preserved
+        assert result["clinic_visit"][0] == "-"
+        assert result["active"][0] == "-"
+
+
+class TestFixAgeFromDob:
+    """Tests for age calculation from DOB."""
+
+    def test_calculates_age_from_dob(self):
+        """Should calculate age from DOB and tracker date."""
+        df = pl.DataFrame(
+            {
+                "patient_id": ["P001"],
+                "age": [None],
+                "dob": [date(2010, 6, 15)],
+                "tracker_year": [2025],
+                "tracker_month": [1],
+            }
+        )
+        collector = ErrorCollector()
+
+        result = _fix_age_from_dob(df, collector)
+
+        # 2025 - 2010 = 15, but Jan < June so 15 - 1 = 14
+        assert result["age"][0] == 14
+
+    def test_birthday_already_passed(self):
+        """Should not subtract 1 if birthday already passed in tracker year."""
+        df = pl.DataFrame(
+            {
+                "patient_id": ["P001"],
+                "age": [None],
+                "dob": [date(2010, 3, 15)],
+                "tracker_year": [2025],
+                "tracker_month": [6],
+            }
+        )
+        collector = ErrorCollector()
+
+        result = _fix_age_from_dob(df, collector)
+
+        # 2025 - 2010 = 15, June > March so no adjustment
+        assert result["age"][0] == 15
+
+    def test_missing_dob_keeps_null(self):
+        """Should keep null age if DOB is missing."""
+        df = pl.DataFrame(
+            {
+                "patient_id": ["P001"],
+                "age": [None],
+                "dob": pl.Series([None], dtype=pl.Date),
+                "tracker_year": [2025],
+                "tracker_month": [1],
+            }
+        )
+        collector = ErrorCollector()
+
+        result = _fix_age_from_dob(df, collector)
+
+        assert result["age"][0] is None
+
+    def test_error_date_dob_keeps_null(self):
+        """Should keep null age if DOB is error date."""
+        error_date = date.fromisoformat(settings.error_val_date)
+        df = pl.DataFrame(
+            {
+                "patient_id": ["P001"],
+                "age": [None],
+                "dob": [error_date],
+                "tracker_year": [2025],
+                "tracker_month": [1],
+            }
+        )
+        collector = ErrorCollector()
+
+        result = _fix_age_from_dob(df, collector)
+
+        assert result["age"][0] is None
+
+    def test_corrects_wrong_excel_age(self):
+        """Should replace wrong Excel age with calculated age."""
+        df = pl.DataFrame(
+            {
+                "patient_id": ["P001"],
+                "age": [99.0],  # Wrong value from Excel
+                "dob": [date(2010, 6, 15)],
+                "tracker_year": [2025],
+                "tracker_month": [8],
+            }
+        )
+        collector = ErrorCollector()
+
+        result = _fix_age_from_dob(df, collector)
+
+        # Should be corrected to 15
+        assert result["age"][0] == 15
+
+
+class TestFixT1dDiagnosisAge:
+    """Tests for t1d_diagnosis_age calculation from DOB and diagnosis date."""
+
+    def test_calculates_diagnosis_age(self):
+        """Should calculate age at diagnosis from DOB and diagnosis date."""
+        df = pl.DataFrame(
+            {
+                "patient_id": ["P001"],
+                "dob": [date(2005, 8, 20)],
+                "t1d_diagnosis_date": [date(2020, 3, 15)],
+                "t1d_diagnosis_age": [None],
+            }
+        )
+
+        result = _fix_t1d_diagnosis_age(df)
+
+        # 2020 - 2005 = 15, but March < August so 15 - 1 = 14
+        assert result["t1d_diagnosis_age"][0] == 14
+
+    def test_birthday_passed_before_diagnosis(self):
+        """Should not subtract 1 if birthday passed before diagnosis."""
+        df = pl.DataFrame(
+            {
+                "patient_id": ["P001"],
+                "dob": [date(2005, 3, 20)],
+                "t1d_diagnosis_date": [date(2020, 8, 15)],
+                "t1d_diagnosis_age": [None],
+            }
+        )
+
+        result = _fix_t1d_diagnosis_age(df)
+
+        # 2020 - 2005 = 15, August > March so no adjustment
+        assert result["t1d_diagnosis_age"][0] == 15
+
+    def test_missing_dob_returns_null(self):
+        """Should return null if DOB is missing."""
+        df = pl.DataFrame(
+            {
+                "patient_id": ["P001"],
+                "dob": pl.Series([None], dtype=pl.Date),
+                "t1d_diagnosis_date": [date(2020, 3, 15)],
+                "t1d_diagnosis_age": [None],
+            }
+        )
+
+        result = _fix_t1d_diagnosis_age(df)
+
+        assert result["t1d_diagnosis_age"][0] is None
+
+    def test_missing_diagnosis_date_returns_null(self):
+        """Should return null if diagnosis date is missing."""
+        df = pl.DataFrame(
+            {
+                "patient_id": ["P001"],
+                "dob": [date(2005, 8, 20)],
+                "t1d_diagnosis_date": pl.Series([None], dtype=pl.Date),
+                "t1d_diagnosis_age": [None],
+            }
+        )
+
+        result = _fix_t1d_diagnosis_age(df)
+
+        assert result["t1d_diagnosis_age"][0] is None
+
+    def test_error_date_dob_returns_null(self):
+        """Should return null if DOB is error date."""
+        error_date = date.fromisoformat(settings.error_val_date)
+        df = pl.DataFrame(
+            {
+                "patient_id": ["P001"],
+                "dob": [error_date],
+                "t1d_diagnosis_date": [date(2020, 3, 15)],
+                "t1d_diagnosis_age": [None],
+            }
+        )
+
+        result = _fix_t1d_diagnosis_age(df)
+
+        assert result["t1d_diagnosis_age"][0] is None
+
+    def test_error_date_diagnosis_returns_null(self):
+        """Should return null if diagnosis date is error date."""
+        error_date = date.fromisoformat(settings.error_val_date)
+        df = pl.DataFrame(
+            {
+                "patient_id": ["P001"],
+                "dob": [date(2005, 8, 20)],
+                "t1d_diagnosis_date": [error_date],
+                "t1d_diagnosis_age": [None],
+            }
+        )
+
+        result = _fix_t1d_diagnosis_age(df)
+
+        assert result["t1d_diagnosis_age"][0] is None
+
+    def test_replaces_excel_error_value(self):
+        """Should replace Excel error (#NUM!) that became 999999 with calculated value."""
+        df = pl.DataFrame(
+            {
+                "patient_id": ["P001"],
+                "dob": [date(2005, 8, 20)],
+                "t1d_diagnosis_date": [date(2020, 3, 15)],
+                "t1d_diagnosis_age": [999999],  # Error value from Excel
+            }
+        )
+
+        result = _fix_t1d_diagnosis_age(df)
+
+        # Should be calculated as 14
+        assert result["t1d_diagnosis_age"][0] == 14
diff --git a/a4d-python/tests/test_clean/test_transformers.py b/a4d-python/tests/test_clean/test_transformers.py
new file mode 100644
index 0000000..d7c6c71
--- /dev/null
+++ b/a4d-python/tests/test_clean/test_transformers.py
@@ -0,0 +1,847 @@
+"""Tests for data transformation functions."""
+
+import polars as pl
+import pytest
+
+from a4d.clean.transformers import (
+    apply_transformation,
+    correct_decimal_sign_multiple,
+    extract_regimen,
+    fix_bmi,
+    fix_sex,
+    fix_testing_frequency,
+    replace_range_with_mean,
+    split_bp_in_sys_and_dias,
+    str_to_lower,
+)
+from a4d.config import settings
+
+
+def test_extract_regimen_basal():
+    """Test extraction of basal-bolus regimen."""
+    df = pl.DataFrame(
+        {
+            "insulin_regimen": [
+                "Basal-bolus",
+                "basal bolus",
+                "BASAL",
+                "Some basal text",
+            ]
+        }
+    )
+
+    result = extract_regimen(df)
+
+    # All should be standardized to "Basal-bolus (MDI)"
+    assert all(v == "Basal-bolus (MDI)" for v in result["insulin_regimen"].to_list())
+
+
+def test_extract_regimen_premixed():
+    """Test extraction of premixed regimen."""
+    df = pl.DataFrame(
+        {
+            "insulin_regimen": [
+                "Premixed",
+                "PREMIXED 30/70",
+                "premixed bd",
+            ]
+        }
+    )
+
+    result = extract_regimen(df)
+
+    assert all(v == "Premixed 30/70 BD" for v in result["insulin_regimen"].to_list())
+
+
+def test_extract_regimen_self_mixed():
+    """Test extraction of self-mixed regimen."""
+    df = pl.DataFrame(
+        {
+            "insulin_regimen": [
+                "Self-mixed",
+                "SELF-MIXED BD",
+                "self-mixed",  # Must have hyphen to match
+            ]
+        }
+    )
+
+    result = extract_regimen(df)
+
+    assert all(v == "Self-mixed BD" for v in result["insulin_regimen"].to_list())
+
+
+def test_extract_regimen_conventional():
+    """Test extraction of conventional regimen."""
+    df = pl.DataFrame(
+        {
+            "insulin_regimen": [
+                "Conventional",
+                "Modified CONVENTIONAL TID",
+                "conventional tid",
+            ]
+        }
+    )
+
+    result = extract_regimen(df)
+
+    assert all(v == "Modified conventional TID" for v in result["insulin_regimen"].to_list())
+
+
+def test_extract_regimen_missing_column():
+    """Test that missing column is handled gracefully."""
+    df = pl.DataFrame({"other": ["value"]})
+
+    result = extract_regimen(df)
+
+    assert result.equals(df)
+
+
+def test_extract_regimen_preserves_nulls():
+    """Test that nulls are preserved."""
+    df = pl.DataFrame(
+        {
+            "insulin_regimen": ["Basal-bolus", None, "Premixed"],
+        }
+    )
+
+    result = extract_regimen(df)
+
+    assert result["insulin_regimen"][0] == "Basal-bolus (MDI)"
+    assert result["insulin_regimen"][1] is None
+    assert result["insulin_regimen"][2] == "Premixed 30/70 BD"
+
+
+def test_extract_regimen_no_match():
+    """Test values that don't match any pattern."""
+    df = pl.DataFrame(
+        {
+            "insulin_regimen": [
+                "Unknown regimen",
+                "Other",
+            ]
+        }
+    )
+
+    result = extract_regimen(df)
+
+    # Values that don't match should be unchanged (lowercased)
+    assert result["insulin_regimen"].to_list() == ["unknown regimen", "other"]
+
+
+def test_str_to_lower():
+    """Test string lowercasing."""
+    df = pl.DataFrame(
+        {
+            "status": ["ACTIVE", "Inactive", "Transferred", "MixedCase"],
+        }
+    )
+
+    result = str_to_lower(df, "status")
+
+    assert result["status"].to_list() == ["active", "inactive", "transferred", "mixedcase"]
+
+
+def test_str_to_lower_preserves_nulls():
+    """Test that nulls are preserved."""
+    df = pl.DataFrame(
+        {
+            "status": ["ACTIVE", None, "Inactive"],
+        }
+    )
+
+    result = str_to_lower(df, "status")
+
+    assert result["status"][0] == "active"
+    assert result["status"][1] is None
+    assert result["status"][2] == "inactive"
+
+
+def test_str_to_lower_missing_column():
+    """Test that missing column is handled gracefully."""
+    df = pl.DataFrame({"other": ["VALUE"]})
+
+    result = str_to_lower(df, "nonexistent")
+
+    assert result.equals(df)
+
+
+def test_apply_transformation_extract_regimen():
+    """Test applying extract_regimen transformation."""
+    df = pl.DataFrame(
+        {
+            "insulin_regimen": ["Basal-bolus", "Premixed"],
+        }
+    )
+
+    result = apply_transformation(df, "insulin_regimen", "extract_regimen")
+
+    assert result["insulin_regimen"].to_list() == ["Basal-bolus (MDI)", "Premixed 30/70 BD"]
+
+
+def test_apply_transformation_str_to_lower():
+    """Test applying str_to_lower transformation (both naming conventions)."""
+    df = pl.DataFrame(
+        {
+            "status": ["ACTIVE", "INACTIVE"],
+        }
+    )
+
+    # Test with R function name
+    result = apply_transformation(df, "status", "stringr::str_to_lower")
+    assert result["status"].to_list() == ["active", "inactive"]
+
+    # Reset
+    df = pl.DataFrame({"status": ["ACTIVE", "INACTIVE"]})
+
+    # Test with Python function name
+    result = apply_transformation(df, "status", "str_to_lower")
+    assert result["status"].to_list() == ["active", "inactive"]
+
+
+def test_apply_transformation_unknown_function():
+    """Test that unknown function raises error."""
+    df = pl.DataFrame({"column": ["value"]})
+
+    with pytest.raises(ValueError, match="Unknown transformation function"):
+        apply_transformation(df, "column", "unknown_function")
+
+
+def test_correct_decimal_sign_multiple():
+    """Test correcting decimal signs for multiple columns."""
+    df = pl.DataFrame(
+        {
+            "weight": ["70,5", "80,2"],
+            "height": ["1,75", "1,80"],
+            "hba1c": ["7,2", "6,8"],
+        }
+    )
+
+    result = correct_decimal_sign_multiple(df, ["weight", "height", "hba1c"])
+
+    assert result["weight"].to_list() == ["70.5", "80.2"]
+    assert result["height"].to_list() == ["1.75", "1.80"]
+    assert result["hba1c"].to_list() == ["7.2", "6.8"]
+
+
+def test_correct_decimal_sign_multiple_missing_columns():
+    """Test that missing columns are handled gracefully."""
+    df = pl.DataFrame(
+        {
+            "weight": ["70,5", "80,2"],
+        }
+    )
+
+    # Should not raise error even though height and hba1c don't exist
+    result = correct_decimal_sign_multiple(df, ["weight", "height", "hba1c"])
+
+    assert result["weight"].to_list() == ["70.5", "80.2"]
+
+
+def test_extract_regimen_order_matters():
+    """Test that transformation order matches R behavior.
+
+    In R, the transformations are applied in order, and each one
+    replaces the entire value if it matches.
+    """
+    df = pl.DataFrame(
+        {
+            "insulin_regimen": [
+                "basal premixed",  # Both patterns match
+            ]
+        }
+    )
+
+    result = extract_regimen(df)
+
+    # "basal" is checked first in the code, so it should match that
+    assert result["insulin_regimen"][0] == "Basal-bolus (MDI)"
+
+
+def test_fix_sex_female_synonyms():
+    """Test that female synonyms are mapped to 'F'."""
+    df = pl.DataFrame(
+        {
+            "sex": [
+                "Female",
+                "FEMALE",
+                "girl",
+                "Woman",
+                "fem",
+                "Feminine",
+                "f",
+                "F",
+            ]
+        }
+    )
+
+    result = fix_sex(df)
+
+    # All should be mapped to "F"
+    assert all(v == "F" for v in result["sex"].to_list())
+
+
+def test_fix_sex_male_synonyms():
+    """Test that male synonyms are mapped to 'M'."""
+    df = pl.DataFrame(
+        {
+            "sex": [
+                "Male",
+                "MALE",
+                "boy",
+                "Man",
+                "masculine",
+                "m",
+                "M",
+            ]
+        }
+    )
+
+    result = fix_sex(df)
+
+    # All should be mapped to "M"
+    assert all(v == "M" for v in result["sex"].to_list())
+
+
+def test_fix_sex_invalid_values():
+    """Test that invalid values are set to 'Undefined'."""
+    df = pl.DataFrame(
+        {
+            "sex": [
+                "invalid",
+                "unknown",
+                "other",
+                "X",
+            ]
+        }
+    )
+
+    result = fix_sex(df)
+
+    # All should be set to "Undefined"
+    assert all(v == "Undefined" for v in result["sex"].to_list())
+
+
+def test_fix_sex_preserves_nulls():
+    """Test that null and empty values are preserved as null."""
+    df = pl.DataFrame(
+        {
+            "sex": ["Female", None, "", "Male"],
+        }
+    )
+
+    result = fix_sex(df)
+
+    assert result["sex"][0] == "F"
+    assert result["sex"][1] is None
+    assert result["sex"][2] is None
+    assert result["sex"][3] == "M"
+
+
+def test_fix_sex_case_insensitive():
+    """Test that matching is case-insensitive."""
+    df = pl.DataFrame(
+        {
+            "sex": [
+                "FEMALE",
+                "female",
+                "Female",
+                "FeMaLe",
+                "MALE",
+                "male",
+                "Male",
+                "MaLe",
+            ]
+        }
+    )
+
+    result = fix_sex(df)
+
+    assert result["sex"].to_list() == ["F", "F", "F", "F", "M", "M", "M", "M"]
+
+
+def test_fix_sex_missing_column():
+    """Test that missing column is handled gracefully."""
+    df = pl.DataFrame({"other": ["value"]})
+
+    result = fix_sex(df)
+
+    assert result.equals(df)
+
+
+def test_fix_sex_matches_r_behavior():
+    """Test that fix_sex matches R's fix_sex() function exactly.
+
+    This test uses the exact values from R's function definition.
+    """
+    df = pl.DataFrame(
+        {
+            "sex": [
+                # Female synonyms from R
+                "female",
+                "girl",
+                "woman",
+                "fem",
+                "feminine",
+                "f",
+                # Male synonyms from R
+                "male",
+                "boy",
+                "man",
+                "masculine",
+                "m",
+                # Invalid
+                "other",
+                "unknown",
+                # Null/empty
+                None,
+                "",
+            ]
+        }
+    )
+
+    result = fix_sex(df)
+
+    expected = [
+        "F",
+        "F",
+        "F",
+        "F",
+        "F",
+        "F",
+        "M",
+        "M",
+        "M",
+        "M",
+        "M",
+        "Undefined",
+        "Undefined",
+        None,
+        None,
+    ]
+    assert result["sex"].to_list() == expected
+
+
+def test_fix_bmi_basic_calculation():
+    """Test basic BMI calculation from weight and height."""
+    df = pl.DataFrame(
+        {
+            "weight": [70.0, 80.0, 65.0],
+            "height": [1.75, 1.80, 1.60],
+        }
+    )
+
+    result = fix_bmi(df)
+
+    # BMI = weight / height^2
+    assert "bmi" in result.columns
+    assert result["bmi"][0] == pytest.approx(22.857, abs=0.001)  # 70 / 1.75^2 = 22.857
+    assert result["bmi"][1] == pytest.approx(24.691, abs=0.001)  # 80 / 1.80^2 = 24.691
+    assert result["bmi"][2] == pytest.approx(25.391, abs=0.001)  # 65 / 1.60^2 = 25.391
+
+
+def test_fix_bmi_replaces_existing():
+    """Test that calculated BMI replaces existing BMI value."""
+    df = pl.DataFrame(
+        {
+            "weight": [70.0],
+            "height": [1.75],
+            "bmi": [999.9],  # Wrong BMI that should be replaced
+        }
+    )
+
+    result = fix_bmi(df)
+
+    # Should replace wrong BMI with correct calculation
+    assert result["bmi"][0] == pytest.approx(22.857, abs=0.001)
+
+
+def test_fix_bmi_null_weight():
+    """Test that null weight results in null BMI."""
+    df = pl.DataFrame(
+        {
+            "weight": [None, 70.0],
+            "height": [1.75, 1.75],
+        }
+    )
+
+    result = fix_bmi(df)
+
+    assert result["bmi"][0] is None
+    assert result["bmi"][1] is not None
+
+
+def test_fix_bmi_null_height():
+    """Test that null height results in null BMI."""
+    df = pl.DataFrame(
+        {
+            "weight": [70.0, 70.0],
+            "height": [None, 1.75],
+        }
+    )
+
+    result = fix_bmi(df)
+
+    assert result["bmi"][0] is None
+    assert result["bmi"][1] is not None
+
+
+def test_fix_bmi_error_value_weight():
+    """Test that error value weight results in error value BMI."""
+    df = pl.DataFrame(
+        {
+            "weight": [settings.error_val_numeric, 70.0],
+            "height": [1.75, 1.75],
+        }
+    )
+
+    result = fix_bmi(df)
+
+    assert result["bmi"][0] == settings.error_val_numeric
+    assert result["bmi"][1] == pytest.approx(22.857, abs=0.001)
+
+
+def test_fix_bmi_error_value_height():
+    """Test that error value height results in error value BMI."""
+    df = pl.DataFrame(
+        {
+            "weight": [70.0, 70.0],
+            "height": [settings.error_val_numeric, 1.75],
+        }
+    )
+
+    result = fix_bmi(df)
+
+    assert result["bmi"][0] == settings.error_val_numeric
+    assert result["bmi"][1] == pytest.approx(22.857, abs=0.001)
+
+
+def test_fix_bmi_missing_columns():
+    """Test that missing weight or height columns are handled gracefully."""
+    # Missing both
+    df = pl.DataFrame({"other": [1, 2, 3]})
+    result = fix_bmi(df)
+    assert result.equals(df)
+
+    # Missing weight
+    df = pl.DataFrame({"height": [1.75, 1.80]})
+    result = fix_bmi(df)
+    assert result.equals(df)
+
+    # Missing height
+    df = pl.DataFrame({"weight": [70.0, 80.0]})
+    result = fix_bmi(df)
+    assert result.equals(df)
+
+
+def test_fix_bmi_matches_r_behavior():
+    """Test that fix_bmi matches R's fix_bmi() function exactly."""
+    df = pl.DataFrame(
+        {
+            "weight": [70.0, None, settings.error_val_numeric, 80.0, 65.0],
+            "height": [1.75, 1.80, 1.75, None, settings.error_val_numeric],
+        }
+    )
+
+    result = fix_bmi(df)
+
+    # Row 0: Normal calculation
+    assert result["bmi"][0] == pytest.approx(22.857, abs=0.001)
+    # Row 1: Null weight → null BMI
+    assert result["bmi"][1] is None
+    # Row 2: Error weight → error BMI
+    assert result["bmi"][2] == settings.error_val_numeric
+    # Row 3: Null height → null BMI
+    assert result["bmi"][3] is None
+    # Row 4: Error height → error BMI
+    assert result["bmi"][4] == settings.error_val_numeric
+
+
+def test_fix_bmi_height_cm_conversion():
+    """Test that height in cm is converted to m before BMI calculation.
+
+    Matches R's transform_cm_to_m: if height > 50, divide by 100.
+    Real case: Lao Friends Hospital has height=135.5cm, weight=30.7kg.
+    """
+    df = pl.DataFrame(
+        {
+            "weight": [30.7, 70.0, 80.0],
+            "height": [135.5, 175.0, 1.80],  # cm, cm, m
+        }
+    )
+
+    result = fix_bmi(df)
+
+    # Row 0: 135.5cm → 1.355m → BMI = 30.7 / 1.355² = 16.72
+    assert result["bmi"][0] == pytest.approx(16.72, abs=0.01)
+    # Row 1: 175cm → 1.75m → BMI = 70 / 1.75² = 22.86
+    assert result["bmi"][1] == pytest.approx(22.86, abs=0.01)
+    # Row 2: 1.80m stays as-is → BMI = 80 / 1.80² = 24.69
+    assert result["bmi"][2] == pytest.approx(24.69, abs=0.01)
+
+
+# Tests for replace_range_with_mean
+
+
+def test_replace_range_with_mean_basic():
+    """Test basic range mean calculation."""
+    assert replace_range_with_mean("0-2") == pytest.approx(1.0)
+    assert replace_range_with_mean("2-3") == pytest.approx(2.5)
+    assert replace_range_with_mean("1-5") == pytest.approx(3.0)
+
+
+def test_replace_range_with_mean_larger_ranges():
+    """Test larger range values."""
+    assert replace_range_with_mean("10-20") == pytest.approx(15.0)
+    assert replace_range_with_mean("0-10") == pytest.approx(5.0)
+
+
+def test_replace_range_with_mean_same_values():
+    """Test range where both values are the same."""
+    assert replace_range_with_mean("0-0") == pytest.approx(0.0)
+    assert replace_range_with_mean("5-5") == pytest.approx(5.0)
+
+
+def test_replace_range_with_mean_decimals():
+    """Test ranges with decimal values."""
+    assert replace_range_with_mean("1.5-2.5") == pytest.approx(2.0)
+    assert replace_range_with_mean("0.5-1.5") == pytest.approx(1.0)
+
+
+# Tests for fix_testing_frequency
+
+
+def test_fix_testing_frequency_passthrough():
+    """Test that normal values pass through unchanged."""
+    df = pl.DataFrame(
+        {
+            "patient_id": ["P1", "P2", "P3"],
+            "testing_frequency": ["2", "1.5", "3"],
+        }
+    )
+
+    result = fix_testing_frequency(df)
+
+    assert result["testing_frequency"].to_list() == ["2", "1.5", "3"]
+
+
+def test_fix_testing_frequency_range_replacement():
+    """Test that ranges are replaced with mean."""
+    df = pl.DataFrame(
+        {
+            "patient_id": ["P1", "P2", "P3"],
+            "testing_frequency": ["0-2", "2-3", "1-5"],
+        }
+    )
+
+    result = fix_testing_frequency(df)
+
+    assert result["testing_frequency"].to_list() == ["1", "2.5", "3"]
+
+
+def test_fix_testing_frequency_mixed():
+    """Test mixed normal values and ranges."""
+    df = pl.DataFrame(
+        {
+            "patient_id": ["P1", "P2", "P3", "P4"],
+            "testing_frequency": ["2", "0-2", "1.5", "2-3"],
+        }
+    )
+
+    result = fix_testing_frequency(df)
+
+    assert result["testing_frequency"].to_list() == ["2", "1", "1.5", "2.5"]
+
+
+def test_fix_testing_frequency_null_handling():
+    """Test that null and empty values are preserved."""
+    df = pl.DataFrame(
+        {
+            "patient_id": ["P1", "P2", "P3"],
+            "testing_frequency": [None, "", "2"],
+        }
+    )
+
+    result = fix_testing_frequency(df)
+
+    assert result["testing_frequency"][0] is None
+    assert result["testing_frequency"][1] is None
+    assert result["testing_frequency"][2] == "2"
+
+
+def test_fix_testing_frequency_whole_numbers():
+    """Test that whole number means don't have decimal points."""
+    df = pl.DataFrame(
+        {
+            "patient_id": ["P1", "P2"],
+            "testing_frequency": ["0-2", "1-3"],
+        }
+    )
+
+    result = fix_testing_frequency(df)
+
+    # 0-2 mean is 1.0, should be "1" not "1.0"
+    # 1-3 mean is 2.0, should be "2" not "2.0"
+    assert result["testing_frequency"][0] == "1"
+    assert result["testing_frequency"][1] == "2"
+
+
+def test_fix_testing_frequency_missing_column():
+    """Test that missing column is handled gracefully."""
+    df = pl.DataFrame({"other": [1, 2, 3]})
+
+    result = fix_testing_frequency(df)
+
+    assert result.equals(df)
+
+
+def test_fix_testing_frequency_large_range():
+    """Test larger ranges."""
+    df = pl.DataFrame(
+        {
+            "patient_id": ["P1"],
+            "testing_frequency": ["0-10"],
+        }
+    )
+
+    result = fix_testing_frequency(df)
+
+    assert result["testing_frequency"][0] == "5"
+
+
+def test_fix_testing_frequency_preserves_other_columns():
+    """Test that other columns are preserved."""
+    df = pl.DataFrame(
+        {
+            "patient_id": ["P1", "P2"],
+            "testing_frequency": ["0-2", "3"],
+            "other_col": ["A", "B"],
+        }
+    )
+
+    result = fix_testing_frequency(df)
+
+    assert "patient_id" in result.columns
+    assert "other_col" in result.columns
+    assert result["other_col"].to_list() == ["A", "B"]
+
+
+# Tests for split_bp_in_sys_and_dias
+
+
+def test_split_bp_valid_format():
+    """Test splitting valid blood pressure format."""
+    df = pl.DataFrame(
+        {
+            "blood_pressure_mmhg": ["96/55", "101/57", "120/80"],
+        }
+    )
+
+    result = split_bp_in_sys_and_dias(df)
+
+    assert "blood_pressure_sys_mmhg" in result.columns
+    assert "blood_pressure_dias_mmhg" in result.columns
+    assert "blood_pressure_mmhg" not in result.columns
+
+    assert result["blood_pressure_sys_mmhg"].to_list() == ["96", "101", "120"]
+    assert result["blood_pressure_dias_mmhg"].to_list() == ["55", "57", "80"]
+
+
+def test_split_bp_invalid_no_slash():
+    """Test that values without slash are replaced with error value."""
+    df = pl.DataFrame(
+        {
+            "blood_pressure_mmhg": ["96", "1,6", ""],
+        }
+    )
+
+    result = split_bp_in_sys_and_dias(df)
+
+    error_val = str(int(settings.error_val_numeric))
+    assert result["blood_pressure_sys_mmhg"].to_list() == [error_val, error_val, error_val]
+    assert result["blood_pressure_dias_mmhg"].to_list() == [error_val, error_val, error_val]
+
+
+def test_split_bp_mixed_valid_invalid():
+    """Test mixed valid and invalid values."""
+    df = pl.DataFrame(
+        {
+            "blood_pressure_mmhg": ["96/55", "invalid", "120/80"],
+        }
+    )
+
+    result = split_bp_in_sys_and_dias(df)
+
+    error_val = str(int(settings.error_val_numeric))
+    assert result["blood_pressure_sys_mmhg"].to_list() == ["96", error_val, "120"]
+    assert result["blood_pressure_dias_mmhg"].to_list() == ["55", error_val, "80"]
+
+
+def test_split_bp_null_values():
+    """Test that null values are preserved."""
+    df = pl.DataFrame(
+        {
+            "blood_pressure_mmhg": ["96/55", None, "120/80"],
+        }
+    )
+
+    result = split_bp_in_sys_and_dias(df)
+
+    assert result["blood_pressure_sys_mmhg"][0] == "96"
+    assert result["blood_pressure_sys_mmhg"][1] is None
+    assert result["blood_pressure_sys_mmhg"][2] == "120"
+
+
+def test_split_bp_missing_column():
+    """Test that missing column is handled gracefully."""
+    df = pl.DataFrame({"other": [1, 2, 3]})
+
+    result = split_bp_in_sys_and_dias(df)
+
+    assert result.equals(df)
+
+
+def test_split_bp_drops_original_column():
+    """Test that original blood_pressure_mmhg column is dropped."""
+    df = pl.DataFrame(
+        {
+            "blood_pressure_mmhg": ["96/55", "120/80"],
+        }
+    )
+
+    result = split_bp_in_sys_and_dias(df)
+
+    assert "blood_pressure_mmhg" not in result.columns
+
+
+def test_split_bp_preserves_other_columns():
+    """Test that other columns are preserved."""
+    df = pl.DataFrame(
+        {
+            "patient_id": ["P1", "P2"],
+            "blood_pressure_mmhg": ["96/55", "120/80"],
+            "other_col": ["A", "B"],
+        }
+    )
+
+    result = split_bp_in_sys_and_dias(df)
+
+    assert "patient_id" in result.columns
+    assert "other_col" in result.columns
+    assert result["patient_id"].to_list() == ["P1", "P2"]
+    assert result["other_col"].to_list() == ["A", "B"]
+
+
+def test_split_bp_multiple_invalid():
+    """Test multiple invalid values log warning."""
+    df = pl.DataFrame(
+        {
+            "blood_pressure_mmhg": ["invalid1", "invalid2", "96/55"],
+        }
+    )
+
+    result = split_bp_in_sys_and_dias(df)
+
+    error_val = str(int(settings.error_val_numeric))
+    assert result["blood_pressure_sys_mmhg"][0] == error_val
+    assert result["blood_pressure_sys_mmhg"][1] == error_val
+    assert result["blood_pressure_sys_mmhg"][2] == "96"
diff --git a/a4d-python/tests/test_clean/test_validators.py b/a4d-python/tests/test_clean/test_validators.py
new file mode 100644
index 0000000..d662181
--- /dev/null
+++ b/a4d-python/tests/test_clean/test_validators.py
@@ -0,0 +1,592 @@
+"""Tests for schema and validation utilities."""
+
+import polars as pl
+
+from a4d.clean.validators import (
+    fix_patient_id,
+    load_validation_rules,
+    validate_all_columns,
+    validate_allowed_values,
+    validate_column_from_rules,
+)
+from a4d.config import settings
+from a4d.errors import ErrorCollector
+
+
+def test_load_validation_rules():
+    """Test loading validation rules from YAML."""
+    rules = load_validation_rules()
+
+    # Check that rules were loaded
+    assert isinstance(rules, dict)
+    assert len(rules) > 0
+
+    # Check a specific column rule (new simplified structure)
+    assert "status" in rules
+    assert "allowed_values" in rules["status"]
+    assert "replace_invalid" in rules["status"]
+    assert isinstance(rules["status"]["allowed_values"], list)
+    assert len(rules["status"]["allowed_values"]) > 0
+
+    # Check another column
+    assert "clinic_visit" in rules
+    assert rules["clinic_visit"]["allowed_values"] == ["N", "Y"]
+    assert rules["clinic_visit"]["replace_invalid"] is True
+
+
+def test_validate_allowed_values_all_valid():
+    """Test validation when all values are valid."""
+    df = pl.DataFrame(
+        {
+            "file_name": ["test.xlsx"] * 3,
+            "patient_id": ["XX_YY001", "XX_YY002", "XX_YY003"],
+            "status": ["Active", "Inactive", "Active"],
+        }
+    )
+
+    collector = ErrorCollector()
+
+    result = validate_allowed_values(
+        df=df,
+        column="status",
+        allowed_values=["Active", "Inactive", "Transferred"],
+        error_collector=collector,
+        replace_invalid=True,
+    )
+
+    assert result["status"].to_list() == ["Active", "Inactive", "Active"]
+    assert len(collector) == 0
+
+
+def test_validate_allowed_values_with_invalid():
+    """Test validation when some values are invalid."""
+    df = pl.DataFrame(
+        {
+            "file_name": ["test.xlsx"] * 4,
+            "patient_id": ["XX_YY001", "XX_YY002", "XX_YY003", "XX_YY004"],
+            "status": ["Active", "INVALID", "Inactive", "BAD_VALUE"],
+        }
+    )
+
+    collector = ErrorCollector()
+
+    result = validate_allowed_values(
+        df=df,
+        column="status",
+        allowed_values=["Active", "Inactive"],
+        error_collector=collector,
+        replace_invalid=True,
+    )
+
+    assert result["status"].to_list() == [
+        "Active",
+        settings.error_val_character,
+        "Inactive",
+        settings.error_val_character,
+    ]
+    assert len(collector) == 2
+
+    # Check error details
+    # Note: file_name and patient_id are "unknown" placeholders in validate_allowed_values
+    # They get filled in during bulk processing operations
+    errors_df = collector.to_dataframe()
+    # Order is not guaranteed, so check using sets
+    assert set(errors_df["original_value"].to_list()) == {"INVALID", "BAD_VALUE"}
+    assert errors_df["column"].to_list() == ["status", "status"]
+    assert errors_df["error_code"].to_list() == ["invalid_value", "invalid_value"]
+
+
+def test_validate_allowed_values_preserves_nulls():
+    """Test that nulls are preserved and not logged as errors."""
+    df = pl.DataFrame(
+        {
+            "file_name": ["test.xlsx"] * 3,
+            "patient_id": ["XX_YY001", "XX_YY002", "XX_YY003"],
+            "status": ["Active", None, "Inactive"],
+        }
+    )
+
+    collector = ErrorCollector()
+
+    result = validate_allowed_values(
+        df=df,
+        column="status",
+        allowed_values=["Active", "Inactive"],
+        error_collector=collector,
+        replace_invalid=True,
+    )
+
+    assert result["status"].to_list() == ["Active", None, "Inactive"]
+    assert len(collector) == 0
+
+
+def test_validate_allowed_values_no_replace():
+    """Test validation without replacing invalid values."""
+    df = pl.DataFrame(
+        {
+            "file_name": ["test.xlsx"] * 2,
+            "patient_id": ["XX_YY001", "XX_YY002"],
+            "status": ["Active", "INVALID"],
+        }
+    )
+
+    collector = ErrorCollector()
+
+    result = validate_allowed_values(
+        df=df,
+        column="status",
+        allowed_values=["Active"],
+        error_collector=collector,
+        replace_invalid=False,
+    )
+
+    # Invalid value should NOT be replaced
+    assert result["status"].to_list() == ["Active", "INVALID"]
+    # But it should still be logged
+    assert len(collector) == 1
+
+
+def test_validate_allowed_values_missing_column():
+    """Test that missing columns are handled gracefully."""
+    df = pl.DataFrame(
+        {
+            "file_name": ["test.xlsx"],
+            "patient_id": ["XX_YY001"],
+        }
+    )
+
+    collector = ErrorCollector()
+
+    result = validate_allowed_values(
+        df=df,
+        column="nonexistent",
+        allowed_values=["Active"],
+        error_collector=collector,
+    )
+
+    assert result.equals(df)
+    assert len(collector) == 0
+
+
+def test_validate_allowed_values_ignores_existing_errors():
+    """Test that existing error values are not re-logged."""
+    df = pl.DataFrame(
+        {
+            "file_name": ["test.xlsx"] * 3,
+            "patient_id": ["XX_YY001", "XX_YY002", "XX_YY003"],
+            "status": ["Active", settings.error_val_character, "INVALID"],
+        }
+    )
+
+    collector = ErrorCollector()
+
+    result = validate_allowed_values(
+        df=df,
+        column="status",
+        allowed_values=["Active", "Inactive"],
+        error_collector=collector,
+        replace_invalid=True,
+    )
+
+    # Only "INVALID" should be logged, not the existing error value
+    assert len(collector) == 1
+    assert result["status"].to_list() == [
+        "Active",
+        settings.error_val_character,
+        settings.error_val_character,
+    ]
+
+
+def test_validate_column_from_rules():
+    """Test validation using rules from data_cleaning.yaml."""
+    df = pl.DataFrame(
+        {
+            "file_name": ["test.xlsx"] * 3,
+            "patient_id": ["XX_YY001", "XX_YY002", "XX_YY003"],
+            "clinic_visit": ["Y", "N", "INVALID"],
+        }
+    )
+
+    rules = load_validation_rules()
+    collector = ErrorCollector()
+
+    result = validate_column_from_rules(
+        df=df,
+        column="clinic_visit",
+        rules=rules["clinic_visit"],
+        error_collector=collector,
+    )
+
+    # "INVALID" should be replaced with error value
+    assert result["clinic_visit"].to_list() == ["Y", "N", settings.error_val_character]
+    assert len(collector) == 1
+
+
+def test_validate_column_from_rules_missing_column():
+    """Test validation with missing column."""
+    df = pl.DataFrame(
+        {
+            "file_name": ["test.xlsx"],
+            "patient_id": ["XX_YY001"],
+        }
+    )
+
+    rules = load_validation_rules()
+    collector = ErrorCollector()
+
+    result = validate_column_from_rules(
+        df=df,
+        column="nonexistent",
+        rules=rules["clinic_visit"],
+        error_collector=collector,
+    )
+
+    assert result.equals(df)
+    assert len(collector) == 0
+
+
+def test_validate_all_columns():
+    """Test validation of all columns with rules.
+
+    Note: Validation uses case-insensitive matching and normalizes to canonical values.
+    For example, "active" becomes "Active", "y" becomes "Y".
+    """
+    df = pl.DataFrame(
+        {
+            "file_name": ["test.xlsx"] * 3,
+            "patient_id": ["XX_YY001", "XX_YY002", "XX_YY003"],
+            "clinic_visit": ["Y", "N", "INVALID1"],
+            "patient_consent": ["Y", "INVALID2", "N"],
+            "status": ["active", "INVALID3", "inactive"],  # Lowercase input
+        }
+    )
+
+    collector = ErrorCollector()
+
+    result = validate_all_columns(df, collector)
+
+    # All invalid values should be replaced
+    # Valid values should be normalized to canonical form (Title Case for status)
+    assert result["clinic_visit"].to_list() == ["Y", "N", settings.error_val_character]
+    assert result["patient_consent"].to_list() == ["Y", settings.error_val_character, "N"]
+    assert result["status"].to_list() == ["Active", settings.error_val_character, "Inactive"]
+
+    # Should have logged 3 errors (one per invalid value)
+    assert len(collector) == 3
+
+
+def test_validate_all_columns_only_validates_existing():
+    """Test that validation only processes columns that exist in DataFrame."""
+    df = pl.DataFrame(
+        {
+            "file_name": ["test.xlsx"],
+            "patient_id": ["XX_YY001"],
+            "clinic_visit": ["Y"],
+            # Many other columns from rules don't exist
+        }
+    )
+
+    collector = ErrorCollector()
+
+    # Should not raise error even though many rule columns don't exist
+    result = validate_all_columns(df, collector)
+
+    assert "clinic_visit" in result.columns
+    assert len(collector) == 0
+
+
+def test_validate_allowed_values_case_insensitive():
+    """Test that validation is case-insensitive and normalizes to canonical values.
+
+    Validation matches R behavior:
+    - "y" matches "Y" (case-insensitive)
+    - Returns canonical value "Y" (not the input "y")
+    """
+    df = pl.DataFrame(
+        {
+            "file_name": ["test.xlsx"] * 3,
+            "patient_id": ["XX_YY001", "XX_YY002", "XX_YY003"],
+            "clinic_visit": ["Y", "y", "N"],  # Mixed case
+        }
+    )
+
+    collector = ErrorCollector()
+
+    result = validate_allowed_values(
+        df=df,
+        column="clinic_visit",
+        allowed_values=["Y", "N"],
+        error_collector=collector,
+        replace_invalid=True,
+    )
+
+    # Lowercase "y" should match "Y" and be normalized to canonical "Y"
+    assert result["clinic_visit"].to_list() == ["Y", "Y", "N"]
+    assert len(collector) == 0  # No errors - "y" is valid
+
+
+# Tests for fix_patient_id
+
+
+def test_fix_patient_id_valid_ids():
+    """Test that valid patient IDs are not changed."""
+    df = pl.DataFrame(
+        {
+            "patient_id": ["KD_EW004", "AB_CD123", "XY_ZW999"],
+        }
+    )
+
+    collector = ErrorCollector()
+    result = fix_patient_id(df, collector)
+
+    assert result["patient_id"].to_list() == ["KD_EW004", "AB_CD123", "XY_ZW999"]
+    assert len(collector) == 0
+
+
+def test_fix_patient_id_hyphen_normalization():
+    """Test that hyphens are replaced with underscores."""
+    df = pl.DataFrame(
+        {
+            "patient_id": ["KD-EW004", "AB-CD123"],
+        }
+    )
+
+    collector = ErrorCollector()
+    result = fix_patient_id(df, collector)
+
+    assert result["patient_id"].to_list() == ["KD_EW004", "AB_CD123"]
+    assert len(collector) == 0  # Normalization doesn't generate errors
+
+
+def test_fix_patient_id_truncation():
+    """Test that IDs > 8 chars are truncated."""
+    df = pl.DataFrame(
+        {
+            "patient_id": ["KD_EW004XY", "KD_EW004ABC", "VERYLONGID"],
+        }
+    )
+
+    collector = ErrorCollector()
+    result = fix_patient_id(df, collector)
+
+    # First 8 characters
+    assert result["patient_id"].to_list() == ["KD_EW004", "KD_EW004", "VERYLONG"]
+    # Truncation generates warnings
+    assert len(collector) == 3
+
+
+def test_fix_patient_id_invalid_too_short_first_part():
+    """Test that IDs with < 2 letters in first part are replaced."""
+    df = pl.DataFrame(
+        {
+            "patient_id": ["K_EW004", "A_CD123"],
+        }
+    )
+
+    collector = ErrorCollector()
+    result = fix_patient_id(df, collector)
+
+    assert result["patient_id"].to_list() == ["Undefined", "Undefined"]
+    assert len(collector) == 2
+
+
+def test_fix_patient_id_invalid_too_short_second_part():
+    """Test that IDs with < 2 letters in second part are replaced."""
+    df = pl.DataFrame(
+        {
+            "patient_id": ["KD_E004", "AB_C123"],
+        }
+    )
+
+    collector = ErrorCollector()
+    result = fix_patient_id(df, collector)
+
+    assert result["patient_id"].to_list() == ["Undefined", "Undefined"]
+    assert len(collector) == 2
+
+
+def test_fix_patient_id_invalid_wrong_digits():
+    """Test that IDs without exactly 3 digits are replaced."""
+    df = pl.DataFrame(
+        {
+            "patient_id": ["KD_EW04", "KD_EW0", "KD_EW0001"],
+        }
+    )
+
+    collector = ErrorCollector()
+    result = fix_patient_id(df, collector)
+
+    # All invalid (2 digits, 1 digit, 4 digits)
+    assert result["patient_id"][0] == "Undefined"
+    assert result["patient_id"][1] == "Undefined"
+    # KD_EW0001 is > 8 chars, so truncated to KD_EW000
+    assert result["patient_id"][2] == "KD_EW000"
+
+
+def test_fix_patient_id_invalid_digits_in_letter_positions():
+    """Test that IDs with digits instead of letters are replaced."""
+    df = pl.DataFrame(
+        {
+            "patient_id": ["11_EW004", "KD_E1004", "12_34567"],
+        }
+    )
+
+    collector = ErrorCollector()
+    result = fix_patient_id(df, collector)
+
+    assert result["patient_id"].to_list() == ["Undefined", "Undefined", "Undefined"]
+    assert len(collector) == 3
+
+
+def test_fix_patient_id_invalid_letters_in_digit_positions():
+    """Test that IDs with letters in digit positions are replaced."""
+    df = pl.DataFrame(
+        {
+            "patient_id": ["KD_EWX04", "KD_EWABC"],
+        }
+    )
+
+    collector = ErrorCollector()
+    result = fix_patient_id(df, collector)
+
+    assert result["patient_id"].to_list() == ["Undefined", "Undefined"]
+    assert len(collector) == 2
+
+
+def test_fix_patient_id_invalid_no_underscore():
+    """Test that IDs without underscore are replaced."""
+    df = pl.DataFrame(
+        {
+            "patient_id": ["KDEW004", "INVALID"],
+        }
+    )
+
+    collector = ErrorCollector()
+    result = fix_patient_id(df, collector)
+
+    assert result["patient_id"].to_list() == ["Undefined", "Undefined"]
+    assert len(collector) == 2
+
+
+def test_fix_patient_id_null_values():
+    """Test that null values are preserved."""
+    df = pl.DataFrame(
+        {
+            "patient_id": ["KD_EW004", None, "AB_CD123"],
+        }
+    )
+
+    collector = ErrorCollector()
+    result = fix_patient_id(df, collector)
+
+    assert result["patient_id"][0] == "KD_EW004"
+    assert result["patient_id"][1] is None
+    assert result["patient_id"][2] == "AB_CD123"
+    assert len(collector) == 0
+
+
+def test_fix_patient_id_empty_string():
+    """Test that empty string is replaced with error value."""
+    df = pl.DataFrame(
+        {
+            "patient_id": ["", "KD_EW004"],
+        }
+    )
+
+    collector = ErrorCollector()
+    result = fix_patient_id(df, collector)
+
+    assert result["patient_id"][0] == "Undefined"
+    assert result["patient_id"][1] == "KD_EW004"
+    assert len(collector) == 1
+
+
+def test_fix_patient_id_missing_column():
+    """Test that missing column is handled gracefully."""
+    df = pl.DataFrame({"other": [1, 2, 3]})
+
+    collector = ErrorCollector()
+    result = fix_patient_id(df, collector)
+
+    assert result.equals(df)
+    assert len(collector) == 0
+
+
+def test_fix_patient_id_mixed_valid_invalid():
+    """Test mixed valid and invalid IDs."""
+    df = pl.DataFrame(
+        {
+            "patient_id": [
+                "KD_EW004",  # Valid
+                "KD-AB123",  # Valid after normalization
+                "INVALID",  # Invalid, replaced
+                "KD_EW004XY",  # Invalid, truncated
+                None,  # Null preserved
+            ],
+        }
+    )
+
+    collector = ErrorCollector()
+    result = fix_patient_id(df, collector)
+
+    assert result["patient_id"][0] == "KD_EW004"
+    assert result["patient_id"][1] == "KD_AB123"
+    assert result["patient_id"][2] == "Undefined"
+    assert result["patient_id"][3] == "KD_EW004"
+    assert result["patient_id"][4] is None
+    assert len(collector) == 2  # 1 replacement + 1 truncation
+
+
+def test_fix_patient_id_lowercase_letters():
+    """Test that lowercase letters make ID invalid."""
+    df = pl.DataFrame(
+        {
+            "patient_id": ["kd_ew004", "KD_ew004", "kd_EW004"],
+        }
+    )
+
+    collector = ErrorCollector()
+    result = fix_patient_id(df, collector)
+
+    # All should be replaced (format requires uppercase)
+    assert result["patient_id"].to_list() == ["Undefined", "Undefined", "Undefined"]
+    assert len(collector) == 3
+
+
+def test_fix_patient_id_matches_r_behavior():
+    """Test that fix_patient_id matches R's fix_id() exactly."""
+    df = pl.DataFrame(
+        {
+            "patient_id": [
+                "KD_EW004",  # Valid
+                "KD-EW004",  # Normalize - to _
+                "K_EW004",  # Too short first part
+                "KD_E004",  # Too short second part
+                "KD_EWX04",  # Invalid format
+                "11_EW004",  # Digits instead of letters
+                "KD_E1004",  # Digit in letter position
+                "KD_EW004XY",  # Truncate (> 8 chars)
+                None,  # Null
+                "",  # Empty
+            ],
+        }
+    )
+
+    collector = ErrorCollector()
+    result = fix_patient_id(df, collector)
+
+    expected = [
+        "KD_EW004",  # Valid
+        "KD_EW004",  # Normalized
+        "Undefined",  # Invalid
+        "Undefined",  # Invalid
+        "Undefined",  # Invalid
+        "Undefined",  # Invalid
+        "Undefined",  # Invalid
+        "KD_EW004",  # Truncated
+        None,  # Null
+        "Undefined",  # Empty → Other
+    ]
+    assert result["patient_id"].to_list() == expected
+    # Errors: 5 replacements + 1 truncation + 1 empty string = 7
+    assert len(collector) == 7
diff --git a/a4d-python/tests/test_errors.py b/a4d-python/tests/test_errors.py
new file mode 100644
index 0000000..84196da
--- /dev/null
+++ b/a4d-python/tests/test_errors.py
@@ -0,0 +1,167 @@
+"""Tests for error tracking functionality."""
+
+import polars as pl
+
+from a4d.errors import DataError, ErrorCollector
+
+
+def test_data_error_creation():
+    """Test creating a DataError instance."""
+    error = DataError(
+        file_name="test.xlsx",
+        patient_id="XX_YY001",
+        column="age",
+        original_value="invalid",
+        error_message="Could not convert to Int32",
+        error_code="type_conversion",
+        function_name="safe_convert_column",
+    )
+
+    assert error.file_name == "test.xlsx"
+    assert error.patient_id == "XX_YY001"
+    assert error.column == "age"
+    assert error.error_code == "type_conversion"
+    assert error.script == "clean"  # default value
+
+
+def test_error_collector_add_error():
+    """Test adding errors to collector."""
+    collector = ErrorCollector()
+
+    assert len(collector) == 0
+    assert not collector  # __bool__ returns False when empty
+
+    collector.add_error(
+        file_name="test.xlsx",
+        patient_id="XX_YY001",
+        column="age",
+        original_value="invalid",
+        error_message="Could not convert",
+        error_code="type_conversion",
+    )
+
+    assert len(collector) == 1
+    assert collector  # __bool__ returns True when has errors
+
+
+def test_error_collector_add_errors():
+    """Test adding multiple errors at once."""
+    collector = ErrorCollector()
+
+    errors = [
+        DataError(
+            file_name="test.xlsx",
+            patient_id="XX_YY001",
+            column="age",
+            original_value="invalid",
+            error_message="Could not convert",
+            error_code="type_conversion",
+        ),
+        DataError(
+            file_name="test.xlsx",
+            patient_id="XX_YY002",
+            column="weight",
+            original_value="abc",
+            error_message="Could not convert",
+            error_code="type_conversion",
+        ),
+    ]
+
+    collector.add_errors(errors)
+
+    assert len(collector) == 2
+
+
+def test_error_collector_to_dataframe():
+    """Test converting errors to DataFrame."""
+    collector = ErrorCollector()
+
+    collector.add_error(
+        file_name="test.xlsx",
+        patient_id="XX_YY001",
+        column="age",
+        original_value="invalid",
+        error_message="Could not convert to Int32",
+        error_code="type_conversion",
+        function_name="safe_convert_column",
+    )
+
+    df = collector.to_dataframe()
+
+    assert isinstance(df, pl.DataFrame)
+    assert len(df) == 1
+    assert "file_name" in df.columns
+    assert "patient_id" in df.columns
+    assert "column" in df.columns
+    assert "error_code" in df.columns
+
+    # Check categorical columns
+    assert df.schema["error_code"] == pl.Categorical
+    assert df.schema["script"] == pl.Categorical
+
+
+def test_error_collector_to_dataframe_empty():
+    """Test converting empty collector to DataFrame."""
+    collector = ErrorCollector()
+    df = collector.to_dataframe()
+
+    assert isinstance(df, pl.DataFrame)
+    assert len(df) == 0
+    # Should still have correct schema
+    assert "file_name" in df.columns
+    assert "error_code" in df.columns
+
+
+def test_error_collector_get_summary():
+    """Test error summary by error_code."""
+    collector = ErrorCollector()
+
+    collector.add_error(
+        file_name="test.xlsx",
+        patient_id="XX_YY001",
+        column="age",
+        original_value="invalid",
+        error_message="Type error",
+        error_code="type_conversion",
+    )
+    collector.add_error(
+        file_name="test.xlsx",
+        patient_id="XX_YY002",
+        column="age",
+        original_value="999",
+        error_message="Out of range",
+        error_code="invalid_value",
+    )
+    collector.add_error(
+        file_name="test.xlsx",
+        patient_id="XX_YY003",
+        column="weight",
+        original_value="abc",
+        error_message="Type error",
+        error_code="type_conversion",
+    )
+
+    summary = collector.get_error_summary()
+
+    assert summary == {"type_conversion": 2, "invalid_value": 1}
+
+
+def test_error_collector_clear():
+    """Test clearing errors from collector."""
+    collector = ErrorCollector()
+
+    collector.add_error(
+        file_name="test.xlsx",
+        patient_id="XX_YY001",
+        column="age",
+        original_value="invalid",
+        error_message="Error",
+        error_code="type_conversion",
+    )
+
+    assert len(collector) == 1
+
+    collector.clear()
+
+    assert len(collector) == 0
+    assert not collector
diff --git a/a4d-python/tests/test_extract/__init__.py b/a4d-python/tests/test_extract/__init__.py
new file mode 100644
index 0000000..1690af8
--- /dev/null
+++ b/a4d-python/tests/test_extract/__init__.py
@@ -0,0 +1 @@
+"""Tests for data extraction modules."""
diff --git a/a4d-python/tests/test_extract/test_patient.py b/a4d-python/tests/test_extract/test_patient.py
new file mode 100644
index 0000000..0d2d31d
--- /dev/null
+++ b/a4d-python/tests/test_extract/test_patient.py
@@ -0,0 +1,648 @@
+"""Tests for patient data extraction."""
+
+from pathlib import Path
+
+import polars as pl
+import pytest
+
+from a4d.extract.patient import (
+    extract_patient_data,
+    extract_tracker_month,
+    find_month_sheets,
+    get_tracker_year,
+    harmonize_patient_data_columns,
+    merge_duplicate_columns_data,
+    read_all_patient_sheets,
+)
+
+
+def column_letter_to_index(col_letter: str) -> int:
+    """Convert Excel column letter to 0-based index.
+
+    Examples:
+        A -> 0, B -> 1, Z -> 25, AA -> 26, AB -> 27, AC -> 28
+    """
+    result = 0
+    for char in col_letter:
+        result = result * 26 + (ord(char) - ord("A") + 1)
+    return result - 1
+
+
+def calculate_expected_columns(start_col: str, end_col: str) -> int:
+    """Calculate expected number of columns from Excel range.
+
+    Args:
+        start_col: Starting column letter (e.g., 'B')
+        end_col: Ending column letter (e.g., 'AC')
+
+    Returns:
+        Number of columns in the range
+
+    Examples:
+        B to Z: 25 columns
+        B to AC: 28 columns
+        B to AB: 27 columns
+    """
+    start_idx = column_letter_to_index(start_col)
+    end_idx = column_letter_to_index(end_col)
+    return end_idx - start_idx + 1
+
+
+# Test data paths
+TRACKER_SBU_2024 = Path(
+    "/Volumes/USB SanDisk 3.2Gen1 Media/a4d/a4dphase2_upload/"
+    "Malaysia/SBU/2024_Sibu Hospital A4D Tracker.xlsx"
+)
+TRACKER_PNG_2019 = Path(
+    "/Volumes/USB SanDisk 3.2Gen1 Media/a4d/a4dphase2_upload/"
+    "Malaysia/PNG/2019_Penang General Hospital A4D Tracker_DC.xlsx"
+)
+TRACKER_PNG_2018 = Path(
+    "/Volumes/USB SanDisk 3.2Gen1 Media/a4d/a4dphase2_upload/"
+    "Malaysia/PNG/2018_Penang General Hospital A4D Tracker_DC.xlsx"
+)
+TRACKER_MHS_2017 = Path(
+    "/Volumes/USB SanDisk 3.2Gen1 Media/a4d/a4dphase2_upload/"
+    "Laos/MHS/2017_Mahosot Hospital A4D Tracker.xlsx"
+)
+TRACKER_MHS_2025 = Path(
+    "/Volumes/USB SanDisk 3.2Gen1 Media/a4d/a4dphase2_upload/"
+    "Laos/MHS/2025_06_Mahosot Hospital A4D Tracker.xlsx"
+)
+
+
+@pytest.mark.skipif(not TRACKER_SBU_2024.exists(), reason="Tracker file not available")
+def test_get_tracker_year_from_sheet_names():
+    """Test extracting year from sheet names."""
+    year = get_tracker_year(TRACKER_SBU_2024, ["Jan24", "Feb24", "Mar24"])
+    assert year == 2024
+
+
+@pytest.mark.skipif(not TRACKER_SBU_2024.exists(), reason="Tracker file not available")
+def test_get_tracker_year_from_filename():
+    """Test extracting year from filename as fallback."""
+    year = get_tracker_year(TRACKER_SBU_2024, ["January", "February"])
+    assert year == 2024
+
+
+@pytest.mark.skipif(not TRACKER_SBU_2024.exists(), reason="Tracker file not available")
+def test_find_month_sheets_2024():
+    """Test finding month sheets in 2024 tracker."""
+    from openpyxl import load_workbook
+
+    wb = load_workbook(TRACKER_SBU_2024, data_only=True)
+    month_sheets = find_month_sheets(wb)
+
+    assert len(month_sheets) > 0
+    assert any("Jan" in sheet for sheet in month_sheets)
+    assert any("Dec" in sheet for sheet in month_sheets)
+
+
+# Parameterized test data: (tracker_file, sheet_name, year, expected_patients, expected_cols, notes)
+# Note: expected_cols is the actual number after filtering out None header columns
+TRACKER_TEST_CASES = [
+    # 2024 tracker - optimized single-pass extraction
+    (
+        TRACKER_SBU_2024,
+        "Jan24",
+        2024,
+        4,
+        calculate_expected_columns("B", "AG") - 1,
+        "Single-pass read-only",
+    ),
+    # 2019 tracker - format changes across months! Optimized extraction
+    (
+        TRACKER_PNG_2019,
+        "Jan19",
+        2019,
+        10,
+        calculate_expected_columns("B", "Z"),
+        "Single-pass read-only",
+    ),
+    (
+        TRACKER_PNG_2019,
+        "Feb19",
+        2019,
+        10,
+        calculate_expected_columns("B", "AC"),
+        "Single-pass read-only",
+    ),
+    (
+        TRACKER_PNG_2019,
+        "Mar19",
+        2019,
+        10,
+        calculate_expected_columns("B", "AB"),
+        "Single-pass read-only",
+    ),
+    (
+        TRACKER_PNG_2019,
+        "Oct19",
+        2019,
+        11,
+        calculate_expected_columns("B", "AB"),
+        "Single-pass read-only",
+    ),
+    # 2018 tracker - single-line headers
+    (
+        TRACKER_PNG_2018,
+        "Dec18",
+        2018,
+        10,
+        calculate_expected_columns("B", "T"),
+        "Single-pass read-only",
+    ),
+]
+
+
+@pytest.mark.skipif(
+    any(not tf.exists() for tf, _, _, _, _, _ in TRACKER_TEST_CASES),
+    reason="Tracker files not available",
+)
+@pytest.mark.parametrize(
+    ("tracker_file", "sheet_name", "year", "expected_patients", "expected_cols", "notes"),
+    TRACKER_TEST_CASES,
+    ids=lambda params: f"{params[1] if isinstance(params, tuple) and len(params) > 1 else params}",
+)
+def test_extract_patient_data_schema(
+    tracker_file, sheet_name, year, expected_patients, expected_cols, notes
+):
+    """Test patient data extraction with schema validation across different months.
+
+    This parameterized test validates that:
+    1. Correct number of patients are extracted
+    2. Correct number of columns match expected (after filtering None headers)
+    3. Format changes between months are handled correctly
+
+    The test is critical because tracker formats change even within the same year,
+    and data quality is inconsistent across different months.
+    """
+    df = extract_patient_data(tracker_file, sheet_name, year)
+
+    # Check dimensions
+    assert len(df) == expected_patients, (
+        f"{sheet_name}: Expected {expected_patients} patients, got {len(df)}"
+    )
+    assert len(df.columns) == expected_cols, (
+        f"{sheet_name}: Expected {expected_cols} columns ({notes}), got {len(df.columns)}"
+    )
+
+    # Verify we have at least Patient ID column
+    assert any("patient" in col.lower() and "id" in col.lower() for col in df.columns), (
+        f"{sheet_name}: Missing Patient ID column in {df.columns}"
+    )
+
+    print(f"\n{sheet_name}: {len(df)} patients × {len(df.columns)} columns ({notes}) ✓")
+
+
+@pytest.mark.skipif(not TRACKER_SBU_2024.exists(), reason="Tracker file not available")
+def test_extract_patient_data_2024_detailed():
+    """Detailed test for 2024 tracker with patient ID validation."""
+    df = extract_patient_data(TRACKER_SBU_2024, "Jan24", 2024)
+
+    # Verify specific patient IDs
+    patient_ids = df["Patient ID*"].to_list()
+    assert patient_ids == ["MY_SU001", "MY_SU002", "MY_SU003", "MY_SU004"], (
+        f"Expected MY_SU001-004, got {patient_ids}"
+    )
+
+    print(f"\n2024 Jan24 - Patient IDs: {patient_ids} ✓")
+
+
+def test_harmonize_patient_data_columns_basic():
+    """Test basic column harmonization with known synonyms."""
+    raw_df = pl.DataFrame(
+        {
+            "Patient ID*": ["MY_SU001", "MY_SU002"],
+            "Age": [25, 30],
+            "D.O.B.": ["1998-01-15", "1993-06-20"],
+        }
+    )
+
+    harmonized = harmonize_patient_data_columns(raw_df)
+
+    # Check that columns were renamed to standardized names
+    assert "patient_id" in harmonized.columns
+    assert "age" in harmonized.columns
+    assert "dob" in harmonized.columns
+
+    # Check that data is preserved
+    assert harmonized["patient_id"].to_list() == ["MY_SU001", "MY_SU002"]
+    assert harmonized["age"].to_list() == [25, 30]
+
+
+def test_harmonize_patient_data_columns_multiple_synonyms():
+    """Test that multiple columns mapping to same name keeps first occurrence.
+
+    When multiple columns in the input map to the same standardized name
+    (e.g., "Patient ID", "ID", "Patient ID*" all map to "patient_id"),
+    we keep the FIRST occurrence and drop the rest. This matches R behavior
+    and handles edge cases like 2023 complication screening columns.
+    """
+    raw_df = pl.DataFrame(
+        {
+            "Patient ID": ["P001"],
+            "ID": ["P002"],
+            "Patient ID*": ["P003"],
+        }
+    )
+
+    # Should keep first occurrence ("Patient ID") and drop the rest
+    harmonized = harmonize_patient_data_columns(raw_df)
+
+    assert list(harmonized.columns) == ["patient_id"]
+    assert harmonized["patient_id"].to_list() == ["P001"]  # First occurrence kept
+
+
+def test_harmonize_patient_data_columns_unmapped_strict_false():
+    """Test that unmapped columns are kept when strict=False (default)."""
+    raw_df = pl.DataFrame(
+        {
+            "Patient ID*": ["MY_SU001"],
+            "Age": [25],
+            "UnknownColumn": ["some value"],
+        }
+    )
+
+    harmonized = harmonize_patient_data_columns(raw_df, strict=False)
+
+    # Mapped columns should be renamed
+    assert "patient_id" in harmonized.columns
+    assert "age" in harmonized.columns
+
+    # Unmapped column should be kept as-is
+    assert "UnknownColumn" in harmonized.columns
+
+
+def test_harmonize_patient_data_columns_unmapped_strict_true():
+    """Test that unmapped columns raise error when strict=True."""
+    raw_df = pl.DataFrame(
+        {
+            "Patient ID*": ["MY_SU001"],
+            "UnknownColumn": ["some value"],
+        }
+    )
+
+    with pytest.raises(ValueError, match="Unmapped columns found"):
+        harmonize_patient_data_columns(raw_df, strict=True)
+
+
+def test_harmonize_patient_data_columns_empty_dataframe():
+    """Test harmonization with empty DataFrame."""
+    raw_df = pl.DataFrame()
+
+    harmonized = harmonize_patient_data_columns(raw_df)
+
+    assert len(harmonized) == 0
+    assert len(harmonized.columns) == 0
+
+
+@pytest.mark.skipif(not TRACKER_SBU_2024.exists(), reason="Tracker file not available")
+def test_harmonize_real_tracker_data():
+    """Test harmonization with real tracker data."""
+    # Extract raw data
+    raw_df = extract_patient_data(TRACKER_SBU_2024, "Jan24", 2024)
+
+    # Harmonize columns
+    harmonized = harmonize_patient_data_columns(raw_df)
+
+    # Check that key columns were renamed
+    assert "patient_id" in harmonized.columns
+    assert "age" in harmonized.columns
+
+    # Check that data is preserved
+    assert len(harmonized) == len(raw_df)  # Same number of rows
+    assert harmonized["patient_id"].to_list() == ["MY_SU001", "MY_SU002", "MY_SU003", "MY_SU004"]
+
+
+def test_extract_tracker_month():
+    """Test extracting month number from sheet name."""
+    assert extract_tracker_month("Jan24") == 1
+    assert extract_tracker_month("Feb24") == 2
+    assert extract_tracker_month("Mar19") == 3
+    assert extract_tracker_month("Dec23") == 12
+
+    # Test with ValueError for invalid sheet names
+    with pytest.raises(ValueError, match="Could not extract month"):
+        extract_tracker_month("Sheet1")
+
+
+def test_merge_duplicate_columns_data_no_duplicates():
+    """Test that data without duplicate headers is unchanged."""
+    headers = ["ID", "Name", "Age", "City"]
+    data = [["1", "Alice", "25", "NYC"], ["2", "Bob", "30", "LA"]]
+
+    result_headers, result_data = merge_duplicate_columns_data(headers, data)
+
+    assert result_headers == headers
+    assert result_data == data
+
+
+def test_merge_duplicate_columns_data_with_duplicates():
+    """Test merging duplicate columns like R's tidyr::unite()."""
+    headers = ["ID", "DM Complications", "DM Complications", "DM Complications", "Age"]
+    data = [["1", "A", "B", "C", "25"], ["2", "X", "Y", "Z", "30"]]
+
+    result_headers, result_data = merge_duplicate_columns_data(headers, data)
+
+    assert result_headers == ["ID", "DM Complications", "Age"]
+    assert result_data == [["1", "A,B,C", "25"], ["2", "X,Y,Z", "30"]]
+
+
+def test_merge_duplicate_columns_data_with_nulls():
+    """Test merging duplicate columns with null values."""
+    headers = ["ID", "DM Complications", "DM Complications", "DM Complications", "Age"]
+    data = [["1", "A", None, "C", "25"], ["2", None, "Y", None, "30"]]
+
+    result_headers, result_data = merge_duplicate_columns_data(headers, data)
+
+    assert result_headers == ["ID", "DM Complications", "Age"]
+    # Empty values are filtered out before joining
+    assert result_data == [["1", "A,C", "25"], ["2", "Y", "30"]]
+
+
+def test_merge_duplicate_columns_data_all_nulls():
+    """Test merging when all duplicate columns have null values."""
+    headers = ["ID", "DM Complications", "DM Complications", "Age"]
+    data = [["1", None, None, "25"]]
+
+    result_headers, result_data = merge_duplicate_columns_data(headers, data)
+
+    assert result_headers == ["ID", "DM Complications", "Age"]
+    # All nulls result in None
+    assert result_data == [["1", None, "25"]]
+
+
+def test_merge_duplicate_columns_data_multiple_groups():
+    """Test merging multiple groups of duplicate columns."""
+    headers = ["ID", "Status", "Status", "Value", "Value", "Value", "Name"]
+    data = [["1", "A", "B", "X", "Y", "Z", "Alice"]]
+
+    result_headers, result_data = merge_duplicate_columns_data(headers, data)
+
+    assert result_headers == ["ID", "Status", "Value", "Name"]
+    assert result_data == [["1", "A,B", "X,Y,Z", "Alice"]]
+
+
+@pytest.mark.skipif(not TRACKER_SBU_2024.exists(), reason="Tracker file not available")
+def test_read_all_patient_sheets_2024():
+    """Test reading all patient sheets from 2024 tracker with Patient List and Annual."""
+    df_all = read_all_patient_sheets(TRACKER_SBU_2024)
+
+    # Check that we have data
+    assert len(df_all) > 0, "Should have extracted patient data"
+
+    # Check that metadata columns were added
+    assert "sheet_name" in df_all.columns
+    assert "tracker_month" in df_all.columns
+    assert "tracker_year" in df_all.columns
+    assert "file_name" in df_all.columns
+    assert "clinic_id" in df_all.columns
+
+    # Check that clinic_id is extracted from parent directory
+    clinic_ids = df_all["clinic_id"].unique().to_list()
+    assert len(clinic_ids) == 1  # All rows should have same clinic_id
+    assert clinic_ids[0] == "SBU"  # Parent directory name
+
+    # Check that we have data from multiple months
+    unique_months = df_all["tracker_month"].unique().to_list()
+    assert len(unique_months) > 1, "Should have data from multiple months"
+
+    # Check that year is correct
+    assert all(year == 2024 for year in df_all["tracker_year"].unique().to_list())
+
+    # Check that patient_id column exists
+    assert "patient_id" in df_all.columns
+
+    # Check that we filtered out invalid rows (no null patient_ids)
+    assert df_all["patient_id"].null_count() == 0
+
+    # Check for baseline HbA1c column from Patient List (should be present after join)
+    # Note: This may have .static suffix if there were conflicts
+    hba1c_cols = [col for col in df_all.columns if "hba1c_baseline" in col.lower()]
+    print(f"\nHbA1c baseline columns: {hba1c_cols}")
+
+    print(
+        f"\n2024 Tracker: {len(df_all)} total patients from {len(unique_months)} months"
+        f" (with Patient List & Annual data) ✓"
+    )
+
+
+@pytest.mark.skipif(not TRACKER_PNG_2019.exists(), reason="Tracker file not available")
+def test_read_all_patient_sheets_2019():
+    """Test reading all patient sheets from 2019 tracker (different formats across months)."""
+    df_all = read_all_patient_sheets(TRACKER_PNG_2019)
+
+    # Check that we have data
+    assert len(df_all) > 0, "Should have extracted patient data"
+
+    # Check metadata columns
+    assert "sheet_name" in df_all.columns
+    assert "tracker_month" in df_all.columns
+    assert "tracker_year" in df_all.columns
+
+    # Check that year is correct
+    assert all(year == 2019 for year in df_all["tracker_year"].unique().to_list())
+
+    # Check that patient_id column exists
+    assert "patient_id" in df_all.columns
+
+    # Check that we filtered out invalid rows
+    assert df_all["patient_id"].null_count() == 0
+
+    # 2019 tracker has format changes across months - verify we handled them
+    unique_months = df_all["tracker_month"].unique().to_list()
+    print(f"\n2019 Tracker: {len(df_all)} total patients from {len(unique_months)} months ✓")
+
+
+@pytest.mark.skipif(not TRACKER_SBU_2024.exists(), reason="Tracker file not available")
+def test_read_all_patient_sheets_file_name():
+    """Test that file_name metadata is correctly added."""
+    df_all = read_all_patient_sheets(TRACKER_SBU_2024)
+
+    assert "file_name" in df_all.columns
+    file_names = df_all["file_name"].unique().to_list()
+    assert len(file_names) == 1
+    assert file_names[0] == TRACKER_SBU_2024.stem
+
+
+@pytest.mark.skipif(not TRACKER_MHS_2017.exists(), reason="Tracker file not available")
+def test_read_all_patient_sheets_2017_mhs_complete():
+    """
+    End-to-end test: 2017 Mahosot Hospital tracker (Laos/MHS).
+
+    Characteristics:
+    - Year: 2017
+    - Sheets: Jan17-Dec17 (March is MISSING)
+    - NO Patient List or Annual sheets
+    - clinic_id should be "MHS"
+
+    Expected patient counts per month:
+    - Jan17: 6, Feb17: 6, Apr17: 6, May17: 8, Jun17: 11, Jul17: 11
+    - Aug17: 11, Sep17: 12, Oct17: 12, Nov17: 12, Dec17: 14
+    - Total: 109 patients (11 months)
+    """
+    df_all = read_all_patient_sheets(TRACKER_MHS_2017)
+
+    # Basic validation
+    assert len(df_all) > 0, "Should have extracted patient data"
+    assert "patient_id" in df_all.columns
+    assert "tracker_month" in df_all.columns
+    assert "tracker_year" in df_all.columns
+    assert "clinic_id" in df_all.columns
+
+    # Check clinic_id
+    assert df_all["clinic_id"].unique().to_list() == ["MHS"]
+
+    # Check year
+    assert df_all["tracker_year"].unique().to_list() == [2017]
+
+    # Check we have exactly 11 months (March is missing)
+    unique_months = sorted(df_all["tracker_month"].unique().to_list())
+    expected_months = [1, 2, 4, 5, 6, 7, 8, 9, 10, 11, 12]  # Missing 3 (March)
+    assert unique_months == expected_months, f"Expected {expected_months}, got {unique_months}"
+
+    # Verify patient counts per month
+    import calendar
+
+    expected_counts = {
+        1: 6,  # Jan
+        2: 6,  # Feb
+        # 3 is missing (March)
+        4: 6,  # Apr
+        5: 8,  # May
+        6: 11,  # Jun
+        7: 11,  # Jul
+        8: 11,  # Aug
+        9: 12,  # Sep
+        10: 12,  # Oct
+        11: 12,  # Nov
+        12: 14,  # Dec
+    }
+
+    for month, expected_count in expected_counts.items():
+        month_data = df_all.filter(pl.col("tracker_month") == month)
+        actual_count = len(month_data)
+        assert actual_count == expected_count, (
+            f"Month {month} ({calendar.month_abbr[month]}17): "
+            f"expected {expected_count} patients, got {actual_count}"
+        )
+
+    # Total patient count
+    total_expected = sum(expected_counts.values())  # 109
+    assert len(df_all) == total_expected, (
+        f"Total patients: expected {total_expected}, got {len(df_all)}"
+    )
+
+    print(
+        f"\n✓ 2017 MHS Tracker: {len(df_all)} patients from 11 months (March missing as expected)"
+    )
+
+
+@pytest.mark.skipif(not TRACKER_MHS_2025.exists(), reason="Tracker file not available")
+def test_read_all_patient_sheets_2025_mhs_with_patient_list():
+    """
+    End-to-end test: 2025 Mahosot Hospital tracker (Laos/MHS).
+
+    Characteristics:
+    - Year: 2025
+    - Sheets: Jan25-Jun25 (6 months)
+    - HAS Patient List and Annual sheets
+    - clinic_id should be "MHS"
+
+    Expected patient counts per month:
+    - Jan25: 95, Feb25: 97, Mar25: 97, Apr25: 97, May25: 98, Jun25: 99
+    - Total: 583 patients
+    """
+    df_all = read_all_patient_sheets(TRACKER_MHS_2025)
+
+    # Basic validation
+    assert len(df_all) > 0, "Should have extracted patient data"
+    assert "patient_id" in df_all.columns
+    assert "tracker_month" in df_all.columns
+    assert "tracker_year" in df_all.columns
+    assert "clinic_id" in df_all.columns
+
+    # Check clinic_id
+    assert df_all["clinic_id"].unique().to_list() == ["MHS"]
+
+    # Check year
+    assert df_all["tracker_year"].unique().to_list() == [2025]
+
+    # Check we have exactly 6 months (Jan-Jun)
+    unique_months = sorted(df_all["tracker_month"].unique().to_list())
+    expected_months = [1, 2, 3, 4, 5, 6]
+    assert unique_months == expected_months, f"Expected {expected_months}, got {unique_months}"
+
+    # Verify patient counts per month
+    import calendar
+
+    expected_counts = {
+        1: 95,  # Jan
+        2: 97,  # Feb
+        3: 97,  # Mar
+        4: 97,  # Apr
+        5: 98,  # May
+        6: 99,  # Jun
+    }
+
+    for month, expected_count in expected_counts.items():
+        month_data = df_all.filter(pl.col("tracker_month") == month)
+        actual_count = len(month_data)
+        assert actual_count == expected_count, (
+            f"Month {month} ({calendar.month_abbr[month]}25): "
+            f"expected {expected_count} patients, got {actual_count}"
+        )
+
+    # Total patient count
+    total_expected = sum(expected_counts.values())  # 583
+    assert len(df_all) == total_expected, (
+        f"Total patients: expected {total_expected}, got {len(df_all)}"
+    )
+
+    # Check that Patient List data was joined (should have columns from Patient List)
+    # Note: The exact columns depend on what's in the Patient List sheet
+    # We verify by checking for potential .static suffix columns
+    static_cols = [col for col in df_all.columns if ".static" in col]
+    print(f"\nColumns from Patient List (.static suffix): {len(static_cols)}")
+
+    # Check that Annual data was joined
+    annual_cols = [col for col in df_all.columns if ".annual" in col]
+    print(f"Columns from Annual sheet (.annual suffix): {len(annual_cols)}")
+
+    print(
+        f"\n✓ 2025 MHS Tracker: {len(df_all)} patients from 6 months "
+        f"(with Patient List & Annual data joined)"
+    )
+
+
+def test_export_patient_raw(tmp_path):
+    """Test exporting patient data to parquet file."""
+    from a4d.extract.patient import export_patient_raw, read_all_patient_sheets
+
+    # Use the 2024 SBU tracker as test data
+    tracker_file = TRACKER_SBU_2024
+    if not tracker_file.exists():
+        pytest.skip("Tracker file not available")
+
+    # Extract data
+    df = read_all_patient_sheets(tracker_file)
+
+    # Export to temp directory
+    output_dir = tmp_path / "patient_data_raw"
+    output_path = export_patient_raw(df, tracker_file, output_dir)
+
+    # Verify output file exists
+    assert output_path.exists()
+    assert output_path.name == "2024_Sibu Hospital A4D Tracker_patient_raw.parquet"
+    assert output_path.parent == output_dir
+
+    # Verify we can read it back
+    df_read = pl.read_parquet(output_path)
+    assert len(df_read) == len(df)
+    assert df_read.columns == df.columns
+
+    # Verify content matches
+    assert df_read.equals(df)
+
+    print(f"\n✓ Successfully exported and verified {len(df)} rows to parquet")
diff --git a/a4d-python/tests/test_extract/test_patient_helpers.py b/a4d-python/tests/test_extract/test_patient_helpers.py
new file mode 100644
index 0000000..6def861
--- /dev/null
+++ b/a4d-python/tests/test_extract/test_patient_helpers.py
@@ -0,0 +1,470 @@
+"""Unit tests for patient extraction helper functions."""
+
+import random
+from unittest.mock import Mock
+
+import pytest
+from openpyxl import Workbook
+
+from a4d.extract.patient import (
+    filter_valid_columns,
+    find_data_start_row,
+    merge_headers,
+    read_header_rows,
+)
+
+
+def create_mock_mapper(known_columns: set[str]):
+    """Create a mock ColumnMapper that validates specific column names."""
+    mapper = Mock()
+    mapper.is_known_column = lambda col: col in known_columns
+    return mapper
+
+
+class TestFindDataStartRow:
+    """Tests for find_data_start_row() function."""
+
+    def test_data_starts_at_row_1(self):
+        """Test when data starts at the very first row."""
+        wb = Workbook()
+        ws = wb.active
+        ws["A1"] = 1
+        ws["A2"] = 2
+
+        result = find_data_start_row(ws)
+        assert result == 1
+
+        wb.close()
+
+    def test_data_starts_after_empty_rows(self):
+        """Test when there are empty rows before data."""
+        wb = Workbook()
+        ws = wb.active
+        # Leave rows 1-10 empty
+        ws["A11"] = 1
+        ws["A12"] = 2
+
+        result = find_data_start_row(ws)
+        assert result == 11
+
+        wb.close()
+
+    def test_realistic_tracker_layout(self):
+        """Test with realistic tracker layout (headers at rows 75-76, data at 77)."""
+        wb = Workbook()
+        ws = wb.active
+
+        # Simulate typical tracker: empty rows, then title rows, then headers, then data
+        # Title area NOT in column A (column A stays empty until headers)
+        ws["B1"] = "Hospital Name"
+        ws["C1"] = "General Hospital"
+
+        # Headers at rows 75-76 (typical for real trackers)
+        ws["B75"] = "Patient"
+        ws["B76"] = "ID*"
+
+        # Data starts at row 77
+        ws["A77"] = 1
+        ws["A78"] = 2
+
+        result = find_data_start_row(ws)
+        assert result == 77  # First non-None in column A
+
+        wb.close()
+
+    def test_randomized_data_position(self):
+        """Test with randomized data start position."""
+        wb = Workbook()
+        ws = wb.active
+
+        # Random start position between 10 and 100
+        random_start = random.randint(10, 100)
+
+        # Insert first data value at random position (must be numeric)
+        ws[f"A{random_start}"] = 1
+
+        result = find_data_start_row(ws)
+        assert result == random_start
+
+        wb.close()
+
+    def test_column_a_empty_raises_error(self):
+        """Test that ValueError is raised when column A is empty."""
+        wb = Workbook()
+        ws = wb.active
+
+        # Put data in other columns but not A
+        ws["B1"] = "Some data"
+        ws["C5"] = "More data"
+
+        with pytest.raises(ValueError, match="No patient data found in column A"):
+            find_data_start_row(ws)
+
+        wb.close()
+
+    def test_ignores_none_values(self):
+        """Test that None/empty cells are skipped correctly."""
+        wb = Workbook()
+        ws = wb.active
+
+        # Explicitly set some cells to None (they start as None anyway)
+        ws["A1"] = None
+        ws["A2"] = None
+        ws["A3"] = None
+        ws["A4"] = 1  # First numeric data
+
+        result = find_data_start_row(ws)
+        assert result == 4
+
+        wb.close()
+
+
+class TestReadHeaderRows:
+    """Tests for read_header_rows() function."""
+
+    def test_basic_two_row_headers(self):
+        """Test reading basic two-row headers."""
+        wb = Workbook()
+        ws = wb.active
+
+        # Data starts at row 5, so headers are at rows 3 and 4
+        ws["A3"] = "Patient"
+        ws["B3"] = "Date"
+        ws["C3"] = "HbA1c"
+
+        ws["A4"] = "ID*"
+        ws["B4"] = "(dd-mmm-yyyy)"
+        ws["C4"] = "%"
+
+        ws["A5"] = "P001"  # Data starts here
+
+        header_1, header_2 = read_header_rows(ws, data_start_row=5)
+
+        assert header_1 == ["ID*", "(dd-mmm-yyyy)", "%"]
+        assert header_2 == ["Patient", "Date", "HbA1c"]
+
+        wb.close()
+
+    def test_trims_to_last_non_none_column(self):
+        """Test that headers are trimmed to last non-None column."""
+        wb = Workbook()
+        ws = wb.active
+
+        # Data starts at row 10
+        ws["A8"] = "Patient"
+        ws["B8"] = "Name"
+        ws["C8"] = "Age"
+        # D8-Z8 remain None
+
+        ws["A9"] = "ID*"
+        ws["B9"] = None
+        ws["C9"] = None
+
+        ws["A10"] = "P001"
+
+        header_1, header_2 = read_header_rows(ws, data_start_row=10)
+
+        # Should trim to column C (last non-None)
+        assert len(header_1) == 3
+        assert len(header_2) == 3
+        assert header_1 == ["ID*", None, None]
+        assert header_2 == ["Patient", "Name", "Age"]
+
+        wb.close()
+
+    def test_realistic_tracker_width(self):
+        """Test with realistic tracker dimensions (31 columns)."""
+        wb = Workbook()
+        ws = wb.active
+
+        data_start_row = 77
+
+        # Create 31 columns of headers
+        for col_idx in range(1, 32):  # 1 to 31 inclusive
+            ws.cell(row=75, column=col_idx, value=f"H2_Col{col_idx}")
+            ws.cell(row=76, column=col_idx, value=f"H1_Col{col_idx}")
+
+        # Put data at row 77
+        ws.cell(row=77, column=1, value="P001")
+
+        header_1, header_2 = read_header_rows(ws, data_start_row=data_start_row)
+
+        assert len(header_1) == 31
+        assert len(header_2) == 31
+        assert header_1[0] == "H1_Col1"
+        assert header_1[30] == "H1_Col31"
+        assert header_2[0] == "H2_Col1"
+        assert header_2[30] == "H2_Col31"
+
+        wb.close()
+
+    def test_mixed_none_values_in_headers(self):
+        """Test headers with mixed None and non-None values."""
+        wb = Workbook()
+        ws = wb.active
+
+        # Header row 2 (further from data)
+        ws["A3"] = "Patient"
+        ws["B3"] = None
+        ws["C3"] = "Updated HbA1c"
+        ws["D3"] = None  # Horizontally merged
+        ws["E3"] = None
+
+        # Header row 1 (closer to data)
+        ws["A4"] = "ID*"
+        ws["B4"] = "Name"
+        ws["C4"] = "%"
+        ws["D4"] = "(dd-mmm-yyyy)"
+        ws["E4"] = None
+
+        ws["A5"] = "P001"  # Data
+
+        header_1, header_2 = read_header_rows(ws, data_start_row=5)
+
+        # Should trim to column D (last non-None in header_1)
+        assert len(header_1) == 4
+        assert len(header_2) == 4
+        assert header_1 == ["ID*", "Name", "%", "(dd-mmm-yyyy)"]
+        assert header_2 == ["Patient", None, "Updated HbA1c", None]
+
+        wb.close()
+
+    def test_randomized_header_position(self):
+        """Test with randomized data start position."""
+        wb = Workbook()
+        ws = wb.active
+
+        # Random data start between rows 20 and 100
+        random_data_start = random.randint(20, 100)
+        header_row_1 = random_data_start - 1
+        header_row_2 = random_data_start - 2
+
+        # Set headers
+        ws.cell(row=header_row_2, column=1, value="Header2")
+        ws.cell(row=header_row_1, column=1, value="Header1")
+        ws.cell(row=random_data_start, column=1, value="Data")
+
+        header_1, header_2 = read_header_rows(ws, data_start_row=random_data_start)
+
+        assert header_1 == ["Header1"]
+        assert header_2 == ["Header2"]
+
+        wb.close()
+
+    def test_respects_max_cols_parameter(self):
+        """Test that max_cols parameter limits the read width."""
+        wb = Workbook()
+        ws = wb.active
+
+        # Create 200 columns of data
+        for col_idx in range(1, 201):
+            ws.cell(row=3, column=col_idx, value=f"H2_{col_idx}")
+            ws.cell(row=4, column=col_idx, value=f"H1_{col_idx}")
+
+        ws["A5"] = "Data"
+
+        # Read with max_cols=50
+        header_1, header_2 = read_header_rows(ws, data_start_row=5, max_cols=50)
+
+        # Should only read up to column 50
+        assert len(header_1) == 50
+        assert len(header_2) == 50
+        assert header_1[49] == "H1_50"
+
+        wb.close()
+
+    def test_all_none_headers(self):
+        """Test when both header rows are completely None.
+
+        Note: When no non-None values are found, the function returns
+        max_cols None values (default behavior). In practice, this edge
+        case doesn't occur as real trackers always have headers.
+        """
+        wb = Workbook()
+        ws = wb.active
+
+        # Headers are all None
+        # (openpyxl cells are None by default)
+
+        ws["A5"] = "Data"
+
+        header_1, header_2 = read_header_rows(ws, data_start_row=5, max_cols=10)
+
+        # Returns max_cols None values when nothing is found
+        assert len(header_1) == 10
+        assert len(header_2) == 10
+        assert all(h is None for h in header_1)
+        assert all(h is None for h in header_2)
+
+        wb.close()
+
+
+class TestMergeHeaders:
+    """Tests for merge_headers() function."""
+
+    def test_both_headers_present(self):
+        """Test merging when both header rows have values."""
+        h1 = ["%", "mmol/L", "kg"]
+        h2 = ["HbA1c", "FBG", "Weight"]
+        result = merge_headers(h1, h2)
+        assert result == ["HbA1c %", "FBG mmol/L", "Weight kg"]
+
+    def test_only_h2_present(self):
+        """Test when only header row 2 has values."""
+        h1 = [None, None, None]
+        h2 = ["Patient ID", "Name", "Age"]
+        result = merge_headers(h1, h2)
+        assert result == ["Patient ID", "Name", "Age"]
+
+    def test_only_h1_present(self):
+        """Test when only header row 1 has values (single-line headers)."""
+        h1 = ["Patient ID", "Name", "Age"]
+        h2 = [None, None, None]
+        result = merge_headers(h1, h2)
+        assert result == ["Patient ID", "Name", "Age"]
+
+    def test_horizontal_merge_forward_fill(self):
+        """Test forward-fill with synonym validation.
+
+        Forward-fill happens when mapper validates the combined header.
+        """
+        h1 = ["%", "(dd-mmm-yyyy)", "mmol/L", "(dd-mmm-yyyy)"]
+        h2 = ["Updated HbA1c", None, "Updated FBG", None]
+        # Mock mapper that knows these forward-filled patterns
+        mapper = create_mock_mapper({
+            "Updated HbA1c %",
+            "Updated HbA1c (dd-mmm-yyyy)",
+            "Updated FBG mmol/L",
+            "Updated FBG (dd-mmm-yyyy)",
+        })
+        result = merge_headers(h1, h2, mapper)
+        assert result == [
+            "Updated HbA1c %",
+            "Updated HbA1c (dd-mmm-yyyy)",
+            "Updated FBG mmol/L",
+            "Updated FBG (dd-mmm-yyyy)",
+        ]
+
+    def test_mixed_headers(self):
+        """Test realistic mix of header patterns.
+
+        Forward-fill happens when mapper validates the combined header.
+        """
+        h1 = ["ID*", "Name", "%", "(date)", None, "kg"]
+        h2 = ["Patient", None, "HbA1c", None, "Notes", "Weight"]
+        # Mock mapper that validates these forward-fills
+        mapper = create_mock_mapper({
+            "Patient ID*",
+            "Patient Name",
+            "HbA1c %",
+            "HbA1c (date)",
+        })
+        result = merge_headers(h1, h2, mapper)
+        assert result == [
+            "Patient ID*",
+            "Patient Name",  # Forward-filled and validated
+            "HbA1c %",
+            "HbA1c (date)",  # Forward-filled and validated
+            "Notes",
+            "Weight kg",
+        ]
+
+    def test_none_values_reset_forward_fill(self):
+        """Test that None in both headers results in None.
+
+        Forward-fill only happens when h1 exists and mapper validates.
+        """
+        h1 = ["%", "(date)", None, "kg"]
+        h2 = ["HbA1c", None, None, "Weight"]
+        # Mock mapper that validates HbA1c forward-fills
+        mapper = create_mock_mapper({
+            "HbA1c %",
+            "HbA1c (date)",
+        })
+        result = merge_headers(h1, h2, mapper)
+        assert result == [
+            "HbA1c %",
+            "HbA1c (date)",
+            None,
+            "Weight kg",
+        ]
+
+    def test_whitespace_normalization(self):
+        """Test that extra whitespace and newlines are normalized."""
+        h1 = ["ID\n(format)", "  Name  "]
+        h2 = ["Patient\nID", "Full  Name"]
+        result = merge_headers(h1, h2)
+        assert result == [
+            "Patient ID ID (format)",
+            "Full Name Name",
+        ]
+
+    def test_empty_headers(self):
+        """Test with empty header lists."""
+        result = merge_headers([], [])
+        assert result == []
+
+    def test_single_column(self):
+        """Test with single column."""
+        h1 = ["ID"]
+        h2 = ["Patient"]
+        result = merge_headers(h1, h2)
+        assert result == ["Patient ID"]
+
+
+class TestFilterValidColumns:
+    """Tests for filter_valid_columns() function."""
+
+    def test_all_valid_headers(self):
+        """Test when all headers are valid (no None)."""
+        headers = ["ID", "Name", "Age"]
+        data = [("1", "Alice", "30"), ("2", "Bob", "25")]
+        valid_headers, filtered_data = filter_valid_columns(headers, data)
+
+        assert valid_headers == ["ID", "Name", "Age"]
+        assert filtered_data == [["1", "Alice", "30"], ["2", "Bob", "25"]]
+
+    def test_some_none_headers(self):
+        """Test filtering out None headers."""
+        headers = ["ID", None, "Name", None, "Age"]
+        data = [("1", "x", "Alice", "y", "30"), ("2", "x", "Bob", "y", "25")]
+        valid_headers, filtered_data = filter_valid_columns(headers, data)
+
+        assert valid_headers == ["ID", "Name", "Age"]
+        assert filtered_data == [["1", "Alice", "30"], ["2", "Bob", "25"]]
+
+    def test_all_none_headers(self):
+        """Test when all headers are None."""
+        headers = [None, None, None]
+        data = [("1", "2", "3"), ("4", "5", "6")]
+        valid_headers, filtered_data = filter_valid_columns(headers, data)
+
+        assert valid_headers == []
+        assert filtered_data == []
+
+    def test_empty_data(self):
+        """Test with empty data."""
+        headers = ["ID", "Name"]
+        data = []
+        valid_headers, filtered_data = filter_valid_columns(headers, data)
+
+        assert valid_headers == ["ID", "Name"]
+        assert filtered_data == []
+
+    def test_single_valid_column(self):
+        """Test with single valid column."""
+        headers = [None, "ID", None]
+        data = [("x", "1", "y"), ("x", "2", "y")]
+        valid_headers, filtered_data = filter_valid_columns(headers, data)
+
+        assert valid_headers == ["ID"]
+        assert filtered_data == [["1"], ["2"]]
+
+    def test_preserves_order(self):
+        """Test that column order is preserved."""
+        headers = ["A", None, "B", None, "C", "D", None]
+        data = [(1, 2, 3, 4, 5, 6, 7)]
+        valid_headers, filtered_data = filter_valid_columns(headers, data)
+
+        assert valid_headers == ["A", "B", "C", "D"]
+        assert filtered_data == [[1, 3, 5, 6]]
diff --git a/a4d-python/tests/test_gcp/__init__.py b/a4d-python/tests/test_gcp/__init__.py
new file mode 100644
index 0000000..e69de29
diff --git a/a4d-python/tests/test_gcp/test_bigquery.py b/a4d-python/tests/test_gcp/test_bigquery.py
new file mode 100644
index 0000000..8512092
--- /dev/null
+++ b/a4d-python/tests/test_gcp/test_bigquery.py
@@ -0,0 +1,173 @@
+"""Tests for BigQuery loading module."""
+
+from unittest.mock import MagicMock, patch
+
+import pytest
+
+from a4d.gcp.bigquery import (
+    PARQUET_TO_TABLE,
+    TABLE_CONFIGS,
+    load_pipeline_tables,
+    load_table,
+)
+
+
+def _get_job_config(mock_client):
+    """Extract job_config from mock client's load_table_from_file call."""
+    return mock_client.load_table_from_file.call_args.kwargs["job_config"]
+
+
+class TestTableConfigs:
+    """Test that table configurations match the R pipeline."""
+
+    def test_patient_data_monthly_clustering(self):
+        assert TABLE_CONFIGS["patient_data_monthly"] == [
+            "clinic_id",
+            "patient_id",
+            "tracker_date",
+        ]
+
+    def test_patient_data_annual_clustering(self):
+        assert TABLE_CONFIGS["patient_data_annual"] == ["patient_id", "tracker_date"]
+
+    def test_patient_data_static_clustering(self):
+        assert TABLE_CONFIGS["patient_data_static"] == [
+            "clinic_id",
+            "patient_id",
+            "tracker_date",
+        ]
+
+    def test_all_pipeline_tables_have_configs(self):
+        for table_name in PARQUET_TO_TABLE.values():
+            assert table_name in TABLE_CONFIGS, f"Missing config for {table_name}"
+
+
+class TestLoadTable:
+    """Test loading a single parquet file to BigQuery."""
+
+    def test_raises_file_not_found(self, tmp_path):
+        missing_file = tmp_path / "missing.parquet"
+        with pytest.raises(FileNotFoundError, match="Parquet file not found"):
+            load_table(missing_file, "patient_data_monthly")
+
+    @patch("a4d.gcp.bigquery.get_bigquery_client")
+    def test_load_table_with_replace(self, mock_get_client, tmp_path):
+        parquet_file = tmp_path / "test.parquet"
+        parquet_file.write_bytes(b"fake parquet data")
+
+        mock_client = MagicMock()
+        mock_job = MagicMock()
+        mock_job.output_rows = 100
+        mock_client.load_table_from_file.return_value = mock_job
+        mock_get_client.return_value = mock_client
+
+        load_table(parquet_file, "patient_data_monthly", client=mock_client)
+
+        mock_client.load_table_from_file.assert_called_once()
+        job_config = _get_job_config(mock_client)
+        assert job_config.clustering_fields == ["clinic_id", "patient_id", "tracker_date"]
+        mock_job.result.assert_called_once()
+
+    @patch("a4d.gcp.bigquery.get_bigquery_client")
+    def test_load_table_with_append(self, mock_get_client, tmp_path):
+        parquet_file = tmp_path / "test.parquet"
+        parquet_file.write_bytes(b"fake parquet data")
+
+        mock_client = MagicMock()
+        mock_job = MagicMock()
+        mock_job.output_rows = 50
+        mock_client.load_table_from_file.return_value = mock_job
+
+        load_table(parquet_file, "patient_data_monthly", client=mock_client, replace=False)
+
+        job_config = _get_job_config(mock_client)
+        assert job_config.write_disposition == "WRITE_APPEND"
+
+    @patch("a4d.gcp.bigquery.get_bigquery_client")
+    def test_load_table_correct_table_ref(self, mock_get_client, tmp_path):
+        parquet_file = tmp_path / "test.parquet"
+        parquet_file.write_bytes(b"fake parquet data")
+
+        mock_client = MagicMock()
+        mock_job = MagicMock()
+        mock_job.output_rows = 10
+        mock_client.load_table_from_file.return_value = mock_job
+
+        load_table(
+            parquet_file,
+            "patient_data_static",
+            client=mock_client,
+            dataset="test_dataset",
+            project_id="test_project",
+        )
+
+        table_ref = mock_client.load_table_from_file.call_args.args[1]
+        assert table_ref == "test_project.test_dataset.patient_data_static"
+
+
+class TestLoadPipelineTables:
+    """Test loading all pipeline tables."""
+
+    def test_raises_if_dir_missing(self, tmp_path):
+        missing_dir = tmp_path / "nonexistent"
+        with pytest.raises(FileNotFoundError, match="Tables directory not found"):
+            load_pipeline_tables(missing_dir)
+
+    @patch("a4d.gcp.bigquery.load_table")
+    @patch("a4d.gcp.bigquery.get_bigquery_client")
+    def test_loads_existing_tables(self, mock_get_client, mock_load, tmp_path):
+        tables_dir = tmp_path / "tables"
+        tables_dir.mkdir()
+
+        # Create some table files
+        (tables_dir / "patient_data_static.parquet").write_bytes(b"data")
+        (tables_dir / "patient_data_monthly.parquet").write_bytes(b"data")
+
+        mock_client = MagicMock()
+        mock_get_client.return_value = mock_client
+        mock_load.return_value = MagicMock()
+
+        results = load_pipeline_tables(tables_dir, client=mock_client)
+
+        assert mock_load.call_count == 2
+        assert "patient_data_static" in results
+        assert "patient_data_monthly" in results
+
+    @patch("a4d.gcp.bigquery.load_table")
+    @patch("a4d.gcp.bigquery.get_bigquery_client")
+    def test_skips_missing_tables(self, mock_get_client, mock_load, tmp_path):
+        tables_dir = tmp_path / "tables"
+        tables_dir.mkdir()
+
+        # Only create one table file
+        (tables_dir / "patient_data_static.parquet").write_bytes(b"data")
+
+        mock_client = MagicMock()
+        mock_get_client.return_value = mock_client
+        mock_load.return_value = MagicMock()
+
+        results = load_pipeline_tables(tables_dir, client=mock_client)
+
+        assert mock_load.call_count == 1
+        assert "patient_data_static" in results
+        assert "patient_data_monthly" not in results
+
+    @patch("a4d.gcp.bigquery.load_table")
+    @patch("a4d.gcp.bigquery.get_bigquery_client")
+    def test_continues_on_single_table_failure(self, mock_get_client, mock_load, tmp_path):
+        tables_dir = tmp_path / "tables"
+        tables_dir.mkdir()
+
+        (tables_dir / "patient_data_static.parquet").write_bytes(b"data")
+        (tables_dir / "patient_data_monthly.parquet").write_bytes(b"data")
+
+        mock_client = MagicMock()
+        mock_get_client.return_value = mock_client
+
+        # First call succeeds, second fails
+        mock_load.side_effect = [MagicMock(), Exception("API error")]
+
+        results = load_pipeline_tables(tables_dir, client=mock_client)
+
+        # Should have one success despite the failure
+        assert len(results) == 1
diff --git a/a4d-python/tests/test_gcp/test_storage.py b/a4d-python/tests/test_gcp/test_storage.py
new file mode 100644
index 0000000..77ff437
--- /dev/null
+++ b/a4d-python/tests/test_gcp/test_storage.py
@@ -0,0 +1,114 @@
+"""Tests for Google Cloud Storage module."""
+
+from unittest.mock import MagicMock, patch
+
+import pytest
+
+from a4d.gcp.storage import download_tracker_files, upload_output
+
+
+class TestDownloadTrackerFiles:
+    """Test downloading tracker files from GCS."""
+
+    @patch("a4d.gcp.storage.get_storage_client")
+    def test_downloads_files(self, mock_get_client, tmp_path):
+        destination = tmp_path / "trackers"
+
+        mock_client = MagicMock()
+        mock_get_client.return_value = mock_client
+        mock_bucket = MagicMock()
+        mock_client.bucket.return_value = mock_bucket
+
+        # Simulate blobs in bucket
+        blob1 = MagicMock()
+        blob1.name = "2024/tracker1.xlsx"
+        blob2 = MagicMock()
+        blob2.name = "2024/tracker2.xlsx"
+        mock_bucket.list_blobs.return_value = [blob1, blob2]
+
+        result = download_tracker_files(destination, client=mock_client)
+
+        assert len(result) == 2
+        assert blob1.download_to_filename.called
+        assert blob2.download_to_filename.called
+
+    @patch("a4d.gcp.storage.get_storage_client")
+    def test_skips_directory_markers(self, mock_get_client, tmp_path):
+        destination = tmp_path / "trackers"
+
+        mock_client = MagicMock()
+        mock_get_client.return_value = mock_client
+        mock_bucket = MagicMock()
+        mock_client.bucket.return_value = mock_bucket
+
+        blob_dir = MagicMock()
+        blob_dir.name = "2024/"
+        blob_file = MagicMock()
+        blob_file.name = "2024/tracker.xlsx"
+        mock_bucket.list_blobs.return_value = [blob_dir, blob_file]
+
+        result = download_tracker_files(destination, client=mock_client)
+
+        assert len(result) == 1
+        assert not blob_dir.download_to_filename.called
+
+    @patch("a4d.gcp.storage.get_storage_client")
+    def test_creates_destination_directory(self, mock_get_client, tmp_path):
+        destination = tmp_path / "new" / "dir"
+
+        mock_client = MagicMock()
+        mock_get_client.return_value = mock_client
+        mock_bucket = MagicMock()
+        mock_client.bucket.return_value = mock_bucket
+        mock_bucket.list_blobs.return_value = []
+
+        download_tracker_files(destination, client=mock_client)
+
+        assert destination.exists()
+
+
+class TestUploadOutput:
+    """Test uploading output to GCS."""
+
+    def test_raises_if_source_missing(self, tmp_path):
+        missing_dir = tmp_path / "nonexistent"
+        with pytest.raises(FileNotFoundError, match="Source directory not found"):
+            upload_output(missing_dir)
+
+    @patch("a4d.gcp.storage.get_storage_client")
+    def test_uploads_files(self, mock_get_client, tmp_path):
+        source = tmp_path / "output"
+        source.mkdir()
+        (source / "tables").mkdir()
+        (source / "tables" / "data.parquet").write_bytes(b"data")
+        (source / "logs.txt").write_text("log")
+
+        mock_client = MagicMock()
+        mock_get_client.return_value = mock_client
+        mock_bucket = MagicMock()
+        mock_client.bucket.return_value = mock_bucket
+        mock_blob = MagicMock()
+        mock_bucket.blob.return_value = mock_blob
+
+        result = upload_output(source, client=mock_client)
+
+        assert len(result) == 2
+        assert mock_blob.upload_from_filename.call_count == 2
+
+    @patch("a4d.gcp.storage.get_storage_client")
+    def test_upload_with_prefix(self, mock_get_client, tmp_path):
+        source = tmp_path / "output"
+        source.mkdir()
+        (source / "file.parquet").write_bytes(b"data")
+
+        mock_client = MagicMock()
+        mock_get_client.return_value = mock_client
+        mock_bucket = MagicMock()
+        mock_client.bucket.return_value = mock_bucket
+        mock_blob = MagicMock()
+        mock_bucket.blob.return_value = mock_blob
+
+        result = upload_output(source, prefix="2024-01", client=mock_client)
+
+        assert len(result) == 1
+        assert result[0] == "2024-01/file.parquet"
diff --git a/a4d-python/tests/test_integration/__init__.py b/a4d-python/tests/test_integration/__init__.py
new file mode 100644
index 0000000..19172f4
--- /dev/null
+++ b/a4d-python/tests/test_integration/__init__.py
@@ -0,0 +1,9 @@
+"""Integration tests for A4D pipeline.
+
+These tests use real tracker files and are marked as 'slow' and 'integration'.
+They are skipped by default in CI/CD to keep test runs fast.
+
+Run them explicitly with:
+    uv run pytest -m integration
+    uv run pytest tests/test_integration/
+"""
diff --git a/a4d-python/tests/test_integration/conftest.py b/a4d-python/tests/test_integration/conftest.py
new file mode 100644
index 0000000..2e798e4
--- /dev/null
+++ b/a4d-python/tests/test_integration/conftest.py
@@ -0,0 +1,42 @@
+"""Shared fixtures for integration tests."""
+
+from pathlib import Path
+
+import pytest
+
+# Base path to tracker files
+TRACKER_BASE = Path("/Volumes/USB SanDisk 3.2Gen1 Media/a4d/a4dphase2_upload")
+
+
+@pytest.fixture
+def tracker_2024_penang():
+    """2024 Penang tracker - has Annual + Patient List sheets."""
+    return TRACKER_BASE / "Malaysia/PNG/2024_Penang General Hospital A4D Tracker.xlsx"
+
+
+@pytest.fixture
+def tracker_2023_sibu():
+    """2023 Sibu tracker - has duplicate column mapping edge case."""
+    return TRACKER_BASE / "Malaysia/SBU/2023_Sibu Hospital A4D Tracker.xlsx"
+
+
+@pytest.fixture
+def tracker_2022_penang():
+    """2022 Penang tracker - legacy format without Annual sheet."""
+    return TRACKER_BASE / "Malaysia/PNG/2022_Penang General Hospital A4D Tracker.xlsx"
+
+
+@pytest.fixture
+def tracker_2024_isdfi():
+    """2024 ISDFI Philippines tracker."""
+    return TRACKER_BASE / "Philippines/ISD/2024_ISDFI A4D Tracker.xlsx"
+
+
+# Expected values for validation
+EXPECTED_SCHEMA_COLS = 83  # After cleaning
+
+
+def skip_if_missing(tracker_path: Path):
+    """Skip test if tracker file is not available."""
+    if not tracker_path.exists():
+        pytest.skip(f"Tracker file not found: {tracker_path}")
diff --git a/a4d-python/tests/test_integration/test_clean_integration.py b/a4d-python/tests/test_integration/test_clean_integration.py
new file mode 100644
index 0000000..a8423f4
--- /dev/null
+++ b/a4d-python/tests/test_integration/test_clean_integration.py
@@ -0,0 +1,133 @@
+"""Integration tests for patient data cleaning.
+
+Tests cleaning on real extracted data, validating:
+- Correct schema (83 columns)
+- Type conversions work correctly
+- Error tracking works
+- Derived columns are created
+"""
+
+import pytest
+
+from a4d.clean.patient import clean_patient_data
+from a4d.errors import ErrorCollector
+from a4d.extract.patient import read_all_patient_sheets
+
+from .conftest import EXPECTED_SCHEMA_COLS, skip_if_missing
+
+pytestmark = [pytest.mark.slow, pytest.mark.integration]
+
+
+class TestClean2024Penang:
+    """Test cleaning on 2024 Penang extracted data."""
+
+    def test_clean_produces_correct_schema(self, tracker_2024_penang):
+        """Should produce exactly 83 columns after cleaning."""
+        skip_if_missing(tracker_2024_penang)
+
+        df_raw = read_all_patient_sheets(tracker_2024_penang)
+        collector = ErrorCollector()
+        df_clean = clean_patient_data(df_raw, collector)
+
+        assert len(df_clean.columns) == EXPECTED_SCHEMA_COLS
+
+    def test_clean_preserves_row_count(self, tracker_2024_penang):
+        """Should not drop rows during cleaning."""
+        skip_if_missing(tracker_2024_penang)
+
+        df_raw = read_all_patient_sheets(tracker_2024_penang)
+        collector = ErrorCollector()
+        df_clean = clean_patient_data(df_raw, collector)
+
+        assert len(df_clean) == len(df_raw)
+
+    def test_clean_creates_derived_columns(self, tracker_2024_penang):
+        """Should create derived columns (insulin_type, insulin_subtype, etc.)."""
+        skip_if_missing(tracker_2024_penang)
+
+        df_raw = read_all_patient_sheets(tracker_2024_penang)
+        collector = ErrorCollector()
+        df_clean = clean_patient_data(df_raw, collector)
+
+        # Check derived columns exist
+        assert "insulin_type" in df_clean.columns
+        assert "insulin_subtype" in df_clean.columns
+        assert "blood_pressure_sys_mmhg" in df_clean.columns
+        assert "blood_pressure_dias_mmhg" in df_clean.columns
+
+    def test_clean_tracks_errors(self, tracker_2024_penang):
+        """Should track data quality errors in ErrorCollector."""
+        skip_if_missing(tracker_2024_penang)
+
+        df_raw = read_all_patient_sheets(tracker_2024_penang)
+        collector = ErrorCollector()
+        clean_patient_data(df_raw, collector)
+
+        # Should have some errors (type conversions, invalid values, etc.)
+        # Exact count varies, but should be non-zero for this tracker
+        assert len(collector) >= 0  # May have 0 or more errors
+
+    def test_clean_has_required_columns(self, tracker_2024_penang):
+        """Should have all required columns in final schema."""
+        skip_if_missing(tracker_2024_penang)
+
+        df_raw = read_all_patient_sheets(tracker_2024_penang)
+        collector = ErrorCollector()
+        df_clean = clean_patient_data(df_raw, collector)
+
+        # Check key columns exist
+        required_columns = [
+            "patient_id",
+            "tracker_year",
+            "tracker_month",
+            "age",
+            "hba1c_updated",
+            "fbg_updated_mg",
+            "insulin_type",
+        ]
+        for col in required_columns:
+            assert col in df_clean.columns, f"Missing required column: {col}"
+
+
+class TestClean2023Sibu:
+    """Test cleaning on 2023 Sibu (edge case)."""
+
+    def test_clean_after_duplicate_handling(self, tracker_2023_sibu):
+        """Should clean successfully after duplicate column handling."""
+        skip_if_missing(tracker_2023_sibu)
+
+        df_raw = read_all_patient_sheets(tracker_2023_sibu)
+        collector = ErrorCollector()
+        df_clean = clean_patient_data(df_raw, collector)
+
+        assert len(df_clean.columns) == EXPECTED_SCHEMA_COLS
+        assert len(df_clean) == 14
+
+
+class TestClean2022PenangLegacy:
+    """Test cleaning on 2022 Penang (legacy format)."""
+
+    def test_clean_legacy_format(self, tracker_2022_penang):
+        """Should clean legacy format to same 83-column schema."""
+        skip_if_missing(tracker_2022_penang)
+
+        df_raw = read_all_patient_sheets(tracker_2022_penang)
+        collector = ErrorCollector()
+        df_clean = clean_patient_data(df_raw, collector)
+
+        # Should produce same schema regardless of input format
+        assert len(df_clean.columns) == EXPECTED_SCHEMA_COLS
+        assert len(df_clean) == 156
+
+    def test_clean_legacy_has_patient_list_data(self, tracker_2022_penang):
+        """Should preserve Patient List data (dob, province, etc.) after cleaning."""
+        skip_if_missing(tracker_2022_penang)
+
+        df_raw = read_all_patient_sheets(tracker_2022_penang)
+        collector = ErrorCollector()
+        df_clean = clean_patient_data(df_raw, collector)
+
+        # Patient List columns should be preserved
+        assert "dob" in df_clean.columns
+        assert "province" in df_clean.columns
+        assert "sex" in df_clean.columns
diff --git a/a4d-python/tests/test_integration/test_e2e.py b/a4d-python/tests/test_integration/test_e2e.py
new file mode 100644
index 0000000..c4ed7bf
--- /dev/null
+++ b/a4d-python/tests/test_integration/test_e2e.py
@@ -0,0 +1,147 @@
+"""End-to-end integration tests for the full pipeline (extraction + cleaning).
+
+Tests the complete workflow on real tracker files, validating:
+- Extraction + Cleaning work together correctly
+- Final output has correct schema and row counts
+- Different tracker formats (2024, 2023, 2022) all produce consistent output
+"""
+
+import pytest
+
+from a4d.clean.patient import clean_patient_data
+from a4d.errors import ErrorCollector
+from a4d.extract.patient import read_all_patient_sheets
+
+from .conftest import EXPECTED_SCHEMA_COLS, skip_if_missing
+
+pytestmark = [pytest.mark.slow, pytest.mark.integration, pytest.mark.e2e]
+
+
+@pytest.mark.parametrize(
+    ("tracker_fixture", "expected_rows", "expected_year", "description"),
+    [
+        ("tracker_2024_penang", 174, 2024, "2024 Penang - Annual + Patient List"),
+        ("tracker_2024_isdfi", 70, 2024, "2024 ISDFI Philippines"),
+        ("tracker_2023_sibu", 14, 2023, "2023 Sibu - duplicate columns edge case"),
+        ("tracker_2022_penang", 156, 2022, "2022 Penang - legacy format"),
+    ],
+)
+def test_e2e_pipeline(tracker_fixture, expected_rows, expected_year, description, request):
+    """Test full pipeline (extract + clean) on various tracker formats.
+
+    This test validates that:
+    1. Extraction works and produces expected row count
+    2. Cleaning works and produces 83-column schema
+    3. Row count is preserved through the pipeline
+    4. Year is extracted correctly
+    """
+    tracker_path = request.getfixturevalue(tracker_fixture)
+    skip_if_missing(tracker_path)
+
+    # Step 1: Extract
+    df_raw = read_all_patient_sheets(tracker_path)
+    assert len(df_raw) == expected_rows, f"Extraction failed for {description}"
+
+    # Step 2: Clean
+    collector = ErrorCollector()
+    df_clean = clean_patient_data(df_raw, collector)
+
+    # Validate final output
+    assert len(df_clean) == expected_rows, f"Cleaning changed row count for {description}"
+    assert len(df_clean.columns) == EXPECTED_SCHEMA_COLS, f"Schema incorrect for {description}"
+    assert df_clean["tracker_year"].unique().to_list() == [expected_year], (
+        f"Year incorrect for {description}"
+    )
+
+
+class TestE2E2024Penang:
+    """Detailed end-to-end test for 2024 Penang tracker."""
+
+    def test_e2e_full_pipeline(self, tracker_2024_penang):
+        """Test complete pipeline with detailed validations."""
+        skip_if_missing(tracker_2024_penang)
+
+        # Extract
+        df_raw = read_all_patient_sheets(tracker_2024_penang)
+        assert len(df_raw) == 174
+
+        # Clean
+        collector = ErrorCollector()
+        df_clean = clean_patient_data(df_raw, collector)
+
+        # Validate schema
+        assert len(df_clean.columns) == 83
+        assert len(df_clean) == 174
+
+        # Validate metadata
+        assert "tracker_year" in df_clean.columns
+        assert "tracker_month" in df_clean.columns
+        assert "clinic_id" in df_clean.columns
+
+        # Validate year and months
+        assert df_clean["tracker_year"].unique().to_list() == [2024]
+        months = sorted(df_clean["tracker_month"].unique().to_list())
+        assert months == list(range(1, 13))  # Should have all 12 months
+
+        # Validate clinic_id
+        assert df_clean["clinic_id"].unique().to_list() == ["PNG"]
+
+    def test_e2e_critical_columns_populated(self, tracker_2024_penang):
+        """Validate that critical columns are fully populated after pipeline."""
+        skip_if_missing(tracker_2024_penang)
+
+        df_raw = read_all_patient_sheets(tracker_2024_penang)
+        collector = ErrorCollector()
+        df_clean = clean_patient_data(df_raw, collector)
+
+        # These columns must be 100% populated for every row
+        required_full = [
+            "patient_id",
+            "status",
+            "clinic_id",
+            "tracker_year",
+            "tracker_month",
+        ]
+        for col in required_full:
+            null_count = df_clean[col].is_null().sum()
+            assert null_count == 0, f"{col} has {null_count} null values, expected 0"
+
+        # These columns should have high population (allow some nulls)
+        required_partial = ["age", "last_clinic_visit_date"]
+        for col in required_partial:
+            non_null = df_clean[col].is_not_null().sum()
+            assert non_null > len(df_clean) * 0.9, f"{col} has <90% population"
+
+
+class TestE2ECrosYearConsistency:
+    """Test that different years produce consistent schemas."""
+
+    def test_all_years_produce_same_schema(
+        self, tracker_2024_penang, tracker_2023_sibu, tracker_2022_penang
+    ):
+        """All tracker years should produce the same 83-column schema."""
+        trackers = [
+            (tracker_2024_penang, "2024_Penang"),
+            (tracker_2023_sibu, "2023_Sibu"),
+            (tracker_2022_penang, "2022_Penang"),
+        ]
+
+        column_names_per_tracker = {}
+
+        for tracker_path, name in trackers:
+            if not tracker_path.exists():
+                pytest.skip(f"Tracker file not found: {tracker_path}")
+
+            # Full pipeline
+            df_raw = read_all_patient_sheets(tracker_path)
+            collector = ErrorCollector()
+            df_clean = clean_patient_data(df_raw, collector)
+
+            # Collect column names
+            column_names_per_tracker[name] = set(df_clean.columns)
+
+        # All trackers should have same column names
+        if len(column_names_per_tracker) > 1:
+            first_columns = list(column_names_per_tracker.values())[0]
+            for name, columns in column_names_per_tracker.items():
+                assert columns == first_columns, f"{name} has different columns than others"
diff --git a/a4d-python/tests/test_integration/test_extract_integration.py b/a4d-python/tests/test_integration/test_extract_integration.py
new file mode 100644
index 0000000..9d5399b
--- /dev/null
+++ b/a4d-python/tests/test_integration/test_extract_integration.py
@@ -0,0 +1,134 @@
+"""Integration tests for patient data extraction.
+
+Tests extraction on real tracker files, validating:
+- Correct number of rows extracted
+- Correct number of columns
+- Month sheets are processed correctly
+- Annual and Patient List sheets are handled (if present)
+- Metadata columns are added correctly
+"""
+
+import pytest
+
+from a4d.extract.patient import read_all_patient_sheets
+
+from .conftest import skip_if_missing
+
+pytestmark = [pytest.mark.slow, pytest.mark.integration]
+
+
+class TestExtract2024Penang:
+    """Test extraction on 2024 Penang tracker (has Annual + Patient List)."""
+
+    def test_extract_total_rows(self, tracker_2024_penang):
+        """Should extract all patient records from all sheets."""
+        skip_if_missing(tracker_2024_penang)
+
+        df = read_all_patient_sheets(tracker_2024_penang)
+
+        # 2024 Penang has 12 month sheets + data from Patient List
+        assert len(df) == 174
+        assert len(df.columns) > 0  # Should have columns (exact count varies before cleaning)
+
+    def test_extract_has_metadata_columns(self, tracker_2024_penang):
+        """Should add metadata columns (tracker_year, tracker_month, sheet_name, file_name)."""
+        skip_if_missing(tracker_2024_penang)
+
+        df = read_all_patient_sheets(tracker_2024_penang)
+
+        assert "tracker_year" in df.columns
+        assert "tracker_month" in df.columns
+        assert "sheet_name" in df.columns
+        assert "file_name" in df.columns
+        assert "clinic_id" in df.columns
+
+    def test_extract_year_is_correct(self, tracker_2024_penang):
+        """Should extract year 2024 from sheet names."""
+        skip_if_missing(tracker_2024_penang)
+
+        df = read_all_patient_sheets(tracker_2024_penang)
+
+        # All rows should have year 2024
+        assert df["tracker_year"].unique().to_list() == [2024]
+
+    def test_extract_has_12_months(self, tracker_2024_penang):
+        """Should process 12 month sheets (Jan-Dec 2024)."""
+        skip_if_missing(tracker_2024_penang)
+
+        df = read_all_patient_sheets(tracker_2024_penang)
+
+        months = sorted(df["tracker_month"].unique().to_list())
+        expected_months = list(range(1, 13))  # 1-12
+        assert months == expected_months
+
+    def test_extract_clinic_id(self, tracker_2024_penang):
+        """Should extract clinic_id from parent directory."""
+        skip_if_missing(tracker_2024_penang)
+
+        df = read_all_patient_sheets(tracker_2024_penang)
+
+        # Parent directory is PNG
+        assert df["clinic_id"].unique().to_list() == ["PNG"]
+
+
+class TestExtract2023Sibu:
+    """Test extraction on 2023 Sibu tracker (edge case with duplicate columns)."""
+
+    def test_extract_handles_duplicates(self, tracker_2023_sibu):
+        """Should handle duplicate column mappings (complication_screening)."""
+        skip_if_missing(tracker_2023_sibu)
+
+        # This should not raise DuplicateError
+        df = read_all_patient_sheets(tracker_2023_sibu)
+
+        assert len(df) == 14  # 2023 Sibu has 14 total records
+        assert len(df.columns) > 0
+
+    def test_extract_year_2023(self, tracker_2023_sibu):
+        """Should extract year 2023."""
+        skip_if_missing(tracker_2023_sibu)
+
+        df = read_all_patient_sheets(tracker_2023_sibu)
+
+        assert df["tracker_year"].unique().to_list() == [2023]
+
+    def test_extract_months_sep_to_dec(self, tracker_2023_sibu):
+        """Should extract months Sep-Dec 2023."""
+        skip_if_missing(tracker_2023_sibu)
+
+        df = read_all_patient_sheets(tracker_2023_sibu)
+
+        months = sorted(df["tracker_month"].unique().to_list())
+        expected_months = [9, 10, 11, 12]  # Sep-Dec
+        assert months == expected_months
+
+
+class TestExtract2022PenangLegacy:
+    """Test extraction on 2022 Penang (legacy format without Annual sheet)."""
+
+    def test_extract_legacy_format(self, tracker_2022_penang):
+        """Should handle legacy format without Annual sheet."""
+        skip_if_missing(tracker_2022_penang)
+
+        df = read_all_patient_sheets(tracker_2022_penang)
+
+        assert len(df) == 156  # 2022 Penang has 156 total records
+        assert len(df.columns) > 0
+
+    def test_extract_legacy_has_patient_list(self, tracker_2022_penang):
+        """Should still process Patient List sheet in legacy format."""
+        skip_if_missing(tracker_2022_penang)
+
+        df = read_all_patient_sheets(tracker_2022_penang)
+
+        # Should have data from Patient List (static columns like dob, province)
+        # Check if we have any of the Patient List specific columns
+        assert "dob" in df.columns or "province" in df.columns
+
+    def test_extract_legacy_year_2022(self, tracker_2022_penang):
+        """Should extract year 2022."""
+        skip_if_missing(tracker_2022_penang)
+
+        df = read_all_patient_sheets(tracker_2022_penang)
+
+        assert df["tracker_year"].unique().to_list() == [2022]
diff --git a/a4d-python/tests/test_integration/test_r_validation.py b/a4d-python/tests/test_integration/test_r_validation.py
new file mode 100644
index 0000000..08d9fe6
--- /dev/null
+++ b/a4d-python/tests/test_integration/test_r_validation.py
@@ -0,0 +1,855 @@
+"""Validation tests comparing Python outputs against R pipeline outputs.
+
+Tests that verify Python implementation matches R implementation by comparing
+the final cleaned parquet files for all 174 trackers.
+
+These tests require:
+- R pipeline outputs in:
+  /Volumes/USB SanDisk 3.2Gen1 Media/a4d/output_r/patient_data_cleaned/
+- Python pipeline outputs in:
+  /Volumes/USB SanDisk 3.2Gen1 Media/a4d/a4dphase2_upload/output/patient_data_cleaned/
+
+Run with: uv run pytest tests/test_integration/test_r_validation.py -v -m slow
+"""
+
+from pathlib import Path
+
+import polars as pl
+import pytest
+
+# Mark all tests as slow and integration
+pytestmark = [pytest.mark.slow, pytest.mark.integration]
+
+# Define output directories
+R_OUTPUT_DIR = Path("/Volumes/USB SanDisk 3.2Gen1 Media/a4d/output_r/patient_data_cleaned")
+PY_OUTPUT_DIR = Path("/Volumes/USB SanDisk 3.2Gen1 Media/a4d/output_python/patient_data_cleaned")
+
+# Acceptable differences where Python behavior is correct/better than R
+# These tests will PASS with the documented differences
+ACCEPTABLE_DIFFERENCES = {
+    "2024_Mandalay Children's Hospital A4D Tracker_patient_cleaned.parquet": {
+        "record_diff": 11,
+        "reason": "R implicit filtering: MM_MD001 has 12 monthly records in Python but only 1 in R",
+    },
+    "2024_Mahosot Hospital A4D Tracker_patient_cleaned.parquet": {
+        "record_diff": 1,
+        "reason": (
+            "Python correctly extracts LA-MH088 which is missing row number "
+            "in Excel column A; R incorrectly drops it"
+        ),
+    },
+    "2022_Children's Hospital 2 A4D Tracker_patient_cleaned.parquet": {
+        "record_diff": -15,
+        "reason": (
+            "Excel data quality issue: Oct22 sheet has space instead of 1 "
+            "in column A for first patient row, causing Python to misdetect "
+            "headers and skip October (15 rows). R handles this differently."
+        ),
+    },
+}
+
+# Known issues in Python that need to be fixed
+# Tests will run normally and only SKIP if the issue still exists
+# If the issue is fixed, the test will FAIL with a message to remove it from this dict
+KNOWN_ISSUES = {
+    "2018_Penang General Hospital A4D Tracker_DC_patient_cleaned.parquet": {
+        "duplicate_records": (
+            "Excel has duplicate patient_id MY_PN004 in Oct18 sheet "
+            "that needs to be fixed"
+        ),
+    },
+    "2023_Vietnam National Children's Hospital A4D Tracker_patient_cleaned.parquet": {
+        "duplicate_records": (
+            "Excel has duplicate patient_id VN_VC026 in Aug23 sheet "
+            "that needs to be fixed"
+        ),
+    },
+    "2023_NPH A4D Tracker_patient_cleaned.parquet": {
+        "duplicate_records": (
+            "4 patients KH_NPH026, KH_NPH027, KH_NPH028, KH_NPH029 have "
+            "incorrect patient_id in Sep23 and Oct23 and are truncated to "
+            "KH_NPH02 causing duplicates"
+        ),
+    },
+    "2025_06_North Okkalapa General Hospital A4D Tracker_patient_cleaned.parquet": {
+        "patient_id_format": (
+            "R replaces MM_NO097/098/099 with 'Undefined' due to format "
+            "validation. Python correctly preserves original IDs."
+        ),
+    },
+}
+
+# Trackers to skip due to data quality issues in source Excel files
+SKIP_VALIDATION = {
+    "2024_Vietnam National Children Hospital A4D Tracker_patient_cleaned.parquet": (
+        "Excel has duplicate patient rows with conflicting data in Jul24"
+    ),
+}
+
+# Columns to skip in data value comparison due to known extraction/processing differences
+# These columns have acceptable differences between R and Python
+SKIP_COLUMNS_IN_COMPARISON = {
+    "insulin_total_units",  # R has problems extracting this column correctly
+}
+
+# File-specific column exceptions where R has systematic extraction errors
+# Format: {filename: {reason: str, skip_columns: [str]}}
+# Use this when R has errors affecting many/all patients in specific columns for a file
+FILE_COLUMN_EXCEPTIONS = {
+    "2025_06_Jayavarman VII Hospital A4D Tracker_patient_cleaned.parquet": {
+        "reason": (
+            "Excel cells contain Unicode '≥15' (U+2265). R's readxl reads "
+            "raw Unicode. Python's openpyxl (data_only=True) normalizes to "
+            "ASCII '>15'. R's regex grepl('>|<') only matches ASCII, fails "
+            "to parse '≥15', results in error value 999999. R needs update "
+            "to handle Unicode comparison operators (≥, ≤)."
+        ),
+        "skip_columns": [
+            "hba1c_baseline",
+            "hba1c_baseline_exceeds",
+            "hba1c_updated",
+            "hba1c_updated_exceeds",
+        ],
+    },
+    "2025_06_Kantha Bopha II Hospital A4D Tracker_patient_cleaned.parquet": {
+        "reason": (
+            "R BUG: Sets province to 'Undefined' for Takéo, Tboung Khmum, "
+            "and Preah Sihanouk despite these being in "
+            "allowed_provinces.yaml. Python now correctly validates and "
+            "preserves these province names using sanitize_str(). All three "
+            "provinces are properly listed in the YAML with correct UTF-8 "
+            "encoding (Takéo has é as U+00E9). R's sanitize_str() should "
+            "handle this by removing accents, but validation fails. Needs "
+            "investigation in R's check_allowed_values() or YAML loading."
+        ),
+        "skip_columns": ["province"],
+    },
+    "2025_06_Mahosot Hospital A4D Tracker_patient_cleaned.parquet": {
+        "reason": (
+            "Patient LA_MH054 has invalid insulin_regimen value 'nph' "
+            "(lowercase). R uppercases to 'NPH', Python preserves original. "
+            "Both should reject as invalid."
+        ),
+        "skip_columns": ["insulin_regimen"],
+    },
+    "2025_06_Mandalay Children's Hospital A4D Tracker_patient_cleaned.parquet": {
+        "reason": (
+            "R has systematic extraction errors - sets error values "
+            "(999999 or 9999-09-09) for most columns. "
+            "Python correctly extracts data."
+        ),
+        "skip_columns": [
+            "age",
+            "blood_pressure_updated",
+            "bmi_date",
+            "dob",
+            "fbg_updated_date",
+            "hba1c_updated_date",
+            "hospitalisation_date",
+            "last_clinic_visit_date",
+            "last_remote_followup_date",
+            "lost_date",
+            "recruitment_date",
+            "t1d_diagnosis_age",
+            "t1d_diagnosis_date",
+            "complication_screening_eye_exam_date",
+            "complication_screening_foot_exam_date",
+            "complication_screening_kidney_test_date",
+            "complication_screening_lipid_profile_date",
+            "complication_screening_thyroid_test_date",
+        ],
+    },
+    "2025_06_Mandalay General Hospital A4D Tracker_patient_cleaned.parquet": {
+        "reason": (
+            "R sets error value 999999 for t1d_diagnosis_age. "
+            "Python correctly extracts values."
+        ),
+        "skip_columns": ["t1d_diagnosis_age"],
+    },
+    "2025_06_NPH A4D Tracker_patient_cleaned.parquet": {
+        "reason": "R sets error values for dates/age. Python correctly extracts data.",
+        "skip_columns": [
+            "age",
+            "blood_pressure_updated",
+            "bmi_date",
+            "dob",
+            "fbg_updated_date",
+            "hba1c_updated_date",
+            "insulin_regimen",
+            "insulin_type",
+            "last_clinic_visit_date",
+            "lost_date",
+            "recruitment_date",
+            "t1d_diagnosis_age",
+            "t1d_diagnosis_date",
+        ],
+    },
+    "2025_06_North Okkalapa General Hospital A4D Tracker_patient_cleaned.parquet": {
+        "reason": "clinic_id recently changed; insulin_subtype Python correct, R wrong",
+        "skip_columns": ["clinic_id", "insulin_subtype"],
+    },
+}
+
+# Columns that should never be null/empty - critical data integrity check
+REQUIRED_COLUMNS = {
+    "patient_id",
+    "tracker_month",
+    "tracker_year",
+    "tracker_date",
+    "clinic_id",
+    "status",
+}
+
+# Exceptions for required column validation
+# Files where specific required columns have known null values
+# Format: {filename: {column: reason}}
+REQUIRED_COLUMN_EXCEPTIONS = {
+    "2017_Mandalay Children's Hospital A4D Tracker_patient_cleaned.parquet": {
+        "status": "2017 tracker has missing status values in source Excel file",
+    },
+    "2018_Vietnam National Children_s Hospital A4D Tracker_patient_cleaned.parquet": {
+        "status": "2018 tracker has missing status values in source Excel file",
+    },
+    "2019_CDA A4D Tracker_patient_cleaned.parquet": {
+        "status": "Patient KH_CD008 has missing status in April 2019 in source Excel file",
+    },
+    "2019_Mahosot Hospital A4D Tracker_patient_cleaned.parquet": {
+        "status": (
+            "Patient LA_MH005 has missing status in January and "
+            "February 2019 in source Excel file"
+        ),
+    },
+    "2019_Preah Kossamak Hospital A4D Tracker_patient_cleaned.parquet": {
+        "status": "Patient KH_PK022 has missing status in August 2019 in source Excel file",
+    },
+    "2019_Vietnam National Children_s Hospital A4D Tracker_patient_cleaned.parquet": {
+        "status": "Patients VN_VC053 and VN_VC054 have missing status values in source Excel file",
+    },
+    "2021_Mandalay Children's Hospital A4D Tracker_patient_cleaned.parquet": {
+        "status": "Patient MM_MD072 has missing status in February 2021 in source Excel file",
+    },
+    "2021_Preah Kossamak Hospital A4D Tracker_patient_cleaned.parquet": {
+        "status": "Patient KH_KB017_PK has missing status in source Excel file",
+    },
+    "2022_Chiang Mai Maharaj Nakorn A4D Tracker_patient_cleaned.parquet": {
+        "status": (
+            "Patients TH_CP027, TH_CP028, TH_CP029, TH_CP030 "
+            "have missing status in source Excel file"
+        ),
+    },
+    "2022_Chulalongkorn Hospital A4D Tracker_patient_cleaned.parquet": {
+        "status": "Patients TH_CH006, TH_CH007, TH_CH008 have missing status in source Excel file",
+    },
+    "2022_Kantha Bopha Hospital A4D Tracker_patient_cleaned.parquet": {
+        "status": "Patient KH_KB168 has missing status in source Excel file",
+    },
+    "2022_Likas Women & Children's Hospital A4D Tracker_patient_cleaned.parquet": {
+        "status": "Patient MY_LW013 has missing status in source Excel file",
+    },
+    "2022_Mandalay Children's Hospital A4D Tracker_patient_cleaned.parquet": {
+        "status": (
+            "Patients MM_MD078, MM_MD079, MM_MD080, MM_MD081, "
+            "MM_MD082, MM_MD083 have missing status in "
+            "source Excel file"
+        ),
+    },
+    "2022_Penang General Hospital A4D Tracker_patient_cleaned.parquet": {
+        "status": "Patient MY_PN013 has missing status in source Excel file",
+    },
+    "2022_Putrajaya Hospital A4D Tracker_DC_patient_cleaned.parquet": {
+        "status": "Patient MY_PJ011 has missing status in source Excel file",
+    },
+    "2022_Sarawak General Hospital A4D Tracker_DC_patient_cleaned.parquet": {
+        "status": "Patients MY_SW017, MY_SW018, MY_SW020 have missing status in source Excel file",
+    },
+    "2022_Surat Thani A4D Tracker_patient_cleaned.parquet": {
+        "status": "Patient TH_ST023 has missing status in source Excel file",
+    },
+    "2022_Udon Thani Hospital A4D Tracker_patient_cleaned.parquet": {
+        "status": "Patient TH_UT013 has missing status in source Excel file",
+    },
+    "2023_Mahosot Hospital A4D Tracker_patient_cleaned.parquet": {
+        "status": "Patient LA_MH082 has missing status in source Excel file",
+    },
+    "2023_Nakornping Hospital A4D Tracker_patient_cleaned.parquet": {
+        "status": "Patient TH_NK005 has missing status in source Excel file",
+    },
+    "2023_Surat Thani Hospital A4D Tracker_patient_cleaned.parquet": {
+        "status": "Patient TH_ST024 has missing status in source Excel file",
+    },
+    "2024_Likas Women & Children's Hospital A4D Tracker_patient_cleaned.parquet": {
+        "status": "Patient MY_LW018 has missing status in source Excel file",
+    },
+    "2024_Yangon General Hospital A4D Tracker_patient_cleaned.parquet": {
+        "status": "Patients MM_YG067 and MM_YG068 have missing status in source Excel file",
+    },
+}
+
+# Value mappings for known acceptable differences between R and Python
+# Format: {column_name: {r_value: py_value}}
+# These values are considered equivalent during comparison
+VALUE_MAPPINGS = {
+    "status": {
+        "Active - Remote": "Active Remote",
+        "Active - Clinic": "Active Clinic",
+    },
+}
+
+# Patient-level exceptions where R has extraction errors but Python is correct
+# Format: {filename: {patient_id: {reason: str, skip_columns: [str]}}}
+# These specific patient-column combinations will be excluded from comparison for ALL months
+PATIENT_LEVEL_EXCEPTIONS = {
+    "2025_06_CDA A4D Tracker_patient_cleaned.parquet": {
+        "KH_CD018": {
+            "reason": (
+                "R extraction error: missing 'Analog Insulin' value "
+                "that Python correctly extracts"
+            ),
+            "skip_columns": ["insulin_type"],
+        },
+    },
+    "2025_06_Jayavarman VII Hospital A4D Tracker_patient_cleaned.parquet": {
+        "KH_JV078": {
+            "reason": (
+                "R sets error date '9999-09-09' for lost_date when "
+                "Excel cell is empty. Python correctly extracts null."
+            ),
+            "skip_columns": ["lost_date"],
+        },
+    },
+    "2025_06_Kantha Bopha II Hospital A4D Tracker_patient_cleaned.parquet": {
+        "KH_KB023": {
+            "reason": (
+                "R extraction error: sex should be 'F' but R sets "
+                "'Undefined'. Python correctly extracts 'F'."
+            ),
+            "skip_columns": ["sex"],
+        },
+        "KH_KB073": {
+            "reason": (
+                "R extraction error: missing 'Analog Insulin' value "
+                "that Python correctly extracts"
+            ),
+            "skip_columns": ["insulin_type"],
+        },
+        "KH_KB139": {
+            "reason": (
+                "R extraction error: missing 'Analog Insulin' value "
+                "that Python correctly extracts"
+            ),
+            "skip_columns": ["insulin_type"],
+        },
+    },
+}
+
+
+def get_all_tracker_files() -> list[tuple[str, Path, Path]]:
+    """Get list of all tracker parquet files that exist in R output.
+
+    Returns:
+        List of (filename, r_path, py_path) tuples
+    """
+    if not R_OUTPUT_DIR.exists():
+        return []
+
+    trackers = []
+    for r_file in sorted(R_OUTPUT_DIR.glob("*_patient_cleaned.parquet")):
+        filename = r_file.name
+        py_file = PY_OUTPUT_DIR / filename
+        trackers.append((filename, r_file, py_file))
+
+    return trackers
+
+
+@pytest.fixture(scope="module")
+def tracker_files():
+    """Fixture providing list of all tracker files to validate."""
+    trackers = get_all_tracker_files()
+    if not trackers:
+        pytest.skip("R output directory not found or empty")
+    return trackers
+
+
+def test_output_directories_exist():
+    """Verify that both R and Python output directories exist."""
+    assert R_OUTPUT_DIR.exists(), f"R output directory not found: {R_OUTPUT_DIR}"
+    assert PY_OUTPUT_DIR.exists(), f"Python output directory not found: {PY_OUTPUT_DIR}"
+
+
+@pytest.mark.parametrize(("filename", "r_path", "py_path"), get_all_tracker_files())
+def test_record_count_matches(filename, r_path, py_path):
+    """Test that record counts match between R and Python for each tracker.
+
+    Validates that the number of records in the cleaned output matches,
+    with allowances for known acceptable differences.
+    """
+    # Skip if marked for skipping
+    if filename in SKIP_VALIDATION:
+        pytest.skip(SKIP_VALIDATION[filename])
+
+    # Skip if Python file doesn't exist
+    if not py_path.exists():
+        pytest.skip(f"Python output not found: {py_path}")
+
+    # Read both files
+    df_r = pl.read_parquet(r_path)
+    df_py = pl.read_parquet(py_path)
+
+    r_count = len(df_r)
+    py_count = len(df_py)
+    actual_diff = py_count - r_count
+
+    # Check if this is an acceptable difference
+    if filename in ACCEPTABLE_DIFFERENCES and "record_diff" in ACCEPTABLE_DIFFERENCES[filename]:
+        acceptable = ACCEPTABLE_DIFFERENCES[filename]
+        expected_diff = acceptable["record_diff"]
+
+        if actual_diff == expected_diff:
+            # Expected difference exists, test passes
+            pass
+        elif actual_diff == 0:
+            # Difference no longer exists! Alert to update config
+            pytest.fail(
+                f"{filename} is listed in ACCEPTABLE_DIFFERENCES but counts now match "
+                f"(R: {r_count}, Python: {py_count}). "
+                f"Please remove this file from ACCEPTABLE_DIFFERENCES dict."
+            )
+        else:
+            # Different difference than expected
+            assert actual_diff == expected_diff, (
+                f"{filename}: Expected difference of {expected_diff} records "
+                f"(reason: {acceptable['reason']}), but got {actual_diff}. "
+                f"R: {r_count}, Python: {py_count}"
+            )
+    else:
+        # Should match exactly
+        assert r_count == py_count, (
+            f"{filename}: Record count mismatch - R: {r_count}, Python: {py_count}"
+        )
+
+
+@pytest.mark.parametrize(("filename", "r_path", "py_path"), get_all_tracker_files())
+def test_schema_matches(filename, r_path, py_path):
+    """Test that column schemas match between R and Python for each tracker.
+
+    Validates that both outputs have the same column names.
+    """
+    # Skip if marked for skipping
+    if filename in SKIP_VALIDATION:
+        pytest.skip(SKIP_VALIDATION[filename])
+
+    # Skip if Python file doesn't exist
+    if not py_path.exists():
+        pytest.skip(f"Python output not found: {py_path}")
+
+    # Read both files
+    df_r = pl.read_parquet(r_path)
+    df_py = pl.read_parquet(py_path)
+
+    r_columns = set(df_r.columns)
+    py_columns = set(df_py.columns)
+
+    missing_in_py = r_columns - py_columns
+    extra_in_py = py_columns - r_columns
+
+    assert not missing_in_py, f"{filename}: Missing columns in Python: {missing_in_py}"
+    assert not extra_in_py, f"{filename}: Extra columns in Python: {extra_in_py}"
+
+
+@pytest.mark.parametrize(("filename", "r_path", "py_path"), get_all_tracker_files())
+def test_patient_ids_match(filename, r_path, py_path):
+    """Test that unique patient IDs match between R and Python for each tracker.
+
+    Validates that both outputs contain the same set of unique patient_ids,
+    with allowances for known acceptable differences.
+    """
+    # Skip if marked for skipping
+    if filename in SKIP_VALIDATION:
+        pytest.skip(SKIP_VALIDATION[filename])
+
+    # Skip if Python file doesn't exist
+    if not py_path.exists():
+        pytest.skip(f"Python output not found: {py_path}")
+
+    # Read both files
+    df_r = pl.read_parquet(r_path)
+    df_py = pl.read_parquet(py_path)
+
+    if filename == "2025_06_North Okkalapa General Hospital A4D Tracker_patient_cleaned.parquet":
+        print("Debug: R patient_ids:", sorted(df_r["patient_id"].unique().to_list()))
+        print("Debug: Python patient_ids:", sorted(df_py["patient_id"].unique().to_list()))
+
+    r_patients = set(df_r["patient_id"])
+    py_patients = set(df_py["patient_id"])
+
+    # Should match exactly (acceptable record count differences don't affect patient_id validation)
+    missing_in_py = r_patients - py_patients
+    extra_in_py = py_patients - r_patients
+
+    # Check if mismatch exists
+    has_mismatch = missing_in_py or extra_in_py
+
+    # If this has a known issue, only skip if the issue still exists
+    if filename in KNOWN_ISSUES:
+        issue_type = None
+        issue_msg = None
+
+        if "patient_id_format" in KNOWN_ISSUES[filename]:
+            issue_type = "patient_id_format"
+            issue_msg = KNOWN_ISSUES[filename]["patient_id_format"]
+        elif "patient_id_extraction" in KNOWN_ISSUES[filename]:
+            issue_type = "patient_id_extraction"
+            issue_msg = KNOWN_ISSUES[filename]["patient_id_extraction"]
+
+        if issue_type and issue_msg:
+            if has_mismatch:
+                pytest.skip(f"Known issue - {issue_msg}")
+            else:
+                # Issue is fixed! Fail the test to alert that KNOWN_ISSUES can be updated
+                pytest.fail(
+                    f"{filename} is listed in KNOWN_ISSUES but patient_ids now match! "
+                    f"Please remove this file from KNOWN_ISSUES dict."
+                )
+
+    # Assert no mismatches for files not in KNOWN_ISSUES
+    assert not missing_in_py, f"{filename}: Missing patient_ids in Python: {missing_in_py}"
+    assert not extra_in_py, f"{filename}: Extra patient_ids in Python: {extra_in_py}"
+
+
+@pytest.mark.parametrize(("filename", "r_path", "py_path"), get_all_tracker_files())
+def test_no_duplicate_records(filename, r_path, py_path):
+    """Test that there are no duplicate (patient_id, tracker_month) combinations.
+
+    Validates data quality by ensuring no unintended duplicates in Python output.
+    """
+    # Skip if marked for skipping
+    if filename in SKIP_VALIDATION:
+        pytest.skip(SKIP_VALIDATION[filename])
+
+    # Skip if Python file doesn't exist
+    if not py_path.exists():
+        pytest.skip(f"Python output not found: {py_path}")
+
+    # Read Python file
+    df_py = pl.read_parquet(py_path)
+
+    # Check for duplicates
+    duplicates = (
+        df_py.group_by(["patient_id", "clinic_id", "tracker_month"])
+        .agg(pl.len().alias("count"))
+        .filter(pl.col("count") > 1)
+    )
+
+    has_duplicates = len(duplicates) > 0
+
+    # If this has a known duplicate issue, only skip if duplicates still exist
+    if filename in KNOWN_ISSUES and "duplicate_records" in KNOWN_ISSUES[filename]:
+        if has_duplicates:
+            pytest.skip(f"Known issue - {KNOWN_ISSUES[filename]['duplicate_records']}")
+        else:
+            # Issue is fixed! Fail the test to alert that KNOWN_ISSUES can be updated
+            pytest.fail(
+                f"{filename} is listed in KNOWN_ISSUES but no longer has duplicates! "
+                f"Please remove this file from KNOWN_ISSUES dict."
+            )
+
+    assert len(duplicates) == 0, (
+        f"{filename}: Found {len(duplicates)} duplicate "
+        f"(patient_id, clinic_id, tracker_month) combinations"
+    )
+
+
+@pytest.mark.parametrize(("filename", "r_path", "py_path"), get_all_tracker_files())
+def test_required_columns_not_null(filename, r_path, py_path):
+    """Test that required columns are never null/empty in Python output.
+
+    Validates critical data integrity by ensuring required columns
+    like patient_id, tracker_month, clinic_id, etc. always have values.
+    """
+    # Skip if marked for skipping
+    if filename in SKIP_VALIDATION:
+        pytest.skip(SKIP_VALIDATION[filename])
+
+    # Skip if Python file doesn't exist
+    if not py_path.exists():
+        pytest.skip(f"Python output not found: {py_path}")
+
+    # Read Python file
+    df_py = pl.read_parquet(py_path)
+
+    # First, check if exceptions are still valid (alert if fixed)
+    if filename in REQUIRED_COLUMN_EXCEPTIONS:
+        for col, _reason in REQUIRED_COLUMN_EXCEPTIONS[filename].items():
+            if col in df_py.columns:
+                null_count = df_py[col].null_count()
+                if null_count == 0:
+                    # Exception exists but column has no nulls - issue is fixed!
+                    pytest.fail(
+                        f"{filename} is listed in REQUIRED_COLUMN_EXCEPTIONS for column '{col}' "
+                        f"but this column no longer has null values! "
+                        f"Please remove this exception from REQUIRED_COLUMN_EXCEPTIONS dict."
+                    )
+
+    # Check each required column
+    null_issues = []
+    for col in REQUIRED_COLUMNS:
+        if col not in df_py.columns:
+            null_issues.append(f"{col}: Column missing from output")
+            continue
+
+        # Skip if this file/column combination has a known exception
+        if filename in REQUIRED_COLUMN_EXCEPTIONS:
+            if col in REQUIRED_COLUMN_EXCEPTIONS[filename]:
+                continue
+
+        null_count = df_py[col].null_count()
+        if null_count > 0:
+            null_issues.append(f"{col}: {null_count} null values found")
+
+    if null_issues:
+        error_msg = f"{filename}: Required columns have null/missing values:\n"
+        error_msg += "\n".join(f"  - {issue}" for issue in null_issues)
+        pytest.fail(error_msg)
+
+
+class TestValidationSummary:
+    """Summary tests providing overall validation statistics."""
+
+    def test_file_coverage(self, tracker_files):
+        """Report file coverage statistics (informational only)."""
+        total_trackers = len(tracker_files)
+        skipped = 0
+        missing_py = 0
+        available = 0
+
+        for filename, _r_path, py_path in tracker_files:
+            if filename in SKIP_VALIDATION:
+                skipped += 1
+            elif not py_path.exists():
+                missing_py += 1
+            else:
+                available += 1
+
+        print(f"\n{'=' * 60}")
+        print("R vs Python File Coverage Summary")
+        print(f"{'=' * 60}")
+        print(f"Total trackers in R output: {total_trackers}")
+        print(f"Python files available: {available + skipped}")
+        print(f"Skipped (Excel data issues): {skipped}")
+        print(f"Missing Python output: {missing_py}")
+        print(f"File coverage: {(available / total_trackers * 100):.1f}%")
+        print(f"{'=' * 60}")
+
+        # Just report, don't assert - this is informational only
+
+
+@pytest.mark.parametrize(("filename", "r_path", "py_path"), get_all_tracker_files())
+def test_data_values_match(filename, r_path, py_path):
+    """Test that data values match between R and Python for matching patients.
+
+    Compares all column values for patients that exist in both outputs,
+    grouped by (patient_id, tracker_month) to identify exactly which
+    patient-month combinations have mismatching data.
+    """
+    if int(filename[:4]) < 2025:
+        pytest.skip("Data value comparison only for 2025 trackers and later")
+
+    # Skip if marked for skipping
+    if filename in SKIP_VALIDATION:
+        pytest.skip(SKIP_VALIDATION[filename])
+
+    # Skip if Python file doesn't exist
+    if not py_path.exists():
+        pytest.skip(f"Python output not found: {py_path}")
+
+    # Read both files
+    # Note: We use inner join, so we only compare patients that exist in both outputs
+    # This allows us to compare data values even when there are patient_id differences
+    df_r = pl.read_parquet(r_path)
+    df_py = pl.read_parquet(py_path)
+
+    # Get common columns (some might differ)
+    r_cols = set(df_r.columns)
+    py_cols = set(df_py.columns)
+    common_cols = sorted(r_cols & py_cols)
+
+    # Must have at least patient_id and tracker_month
+    assert "patient_id" in common_cols
+    assert "tracker_month" in common_cols
+
+    # Join on patient_id and tracker_month to compare matching records
+    # Use inner join to only compare patients that exist in both
+    df_r_subset = df_r.select(common_cols)
+    df_py_subset = df_py.select(common_cols)
+
+    # Add suffixes to distinguish R vs Python columns
+    df_r_renamed = df_r_subset.rename(
+        {col: f"{col}_r" for col in common_cols if col not in ["patient_id", "tracker_month"]}
+    )
+    df_py_renamed = df_py_subset.rename(
+        {col: f"{col}_py" for col in common_cols if col not in ["patient_id", "tracker_month"]}
+    )
+
+    # Join on patient_id and tracker_month
+    df_joined = df_r_renamed.join(df_py_renamed, on=["patient_id", "tracker_month"], how="inner")
+
+    if len(df_joined) == 0:
+        pytest.skip("No matching (patient_id, tracker_month) combinations to compare")
+
+    # Compare each column
+    mismatches = []
+    for col in common_cols:
+        if col in ["patient_id", "tracker_month"]:
+            continue
+
+        # Skip columns with known acceptable differences (global)
+        if col in SKIP_COLUMNS_IN_COMPARISON:
+            continue
+
+        # Skip columns with file-specific systematic errors
+        if filename in FILE_COLUMN_EXCEPTIONS:
+            if col in FILE_COLUMN_EXCEPTIONS[filename].get("skip_columns", []):
+                continue
+
+        r_col = f"{col}_r"
+        py_col = f"{col}_py"
+
+        # Start with all joined data
+        df_compare = df_joined
+
+        # Filter out patient-level exceptions for this file and column
+        if filename in PATIENT_LEVEL_EXCEPTIONS:
+            for patient_id, exception_info in PATIENT_LEVEL_EXCEPTIONS[filename].items():
+                if col in exception_info.get("skip_columns", []):
+                    # Exclude this patient from comparison for this column
+                    df_compare = df_compare.filter(pl.col("patient_id") != patient_id)
+
+        # Apply value mappings if this column has known equivalences
+        if col in VALUE_MAPPINGS:
+            mapping = VALUE_MAPPINGS[col]
+            # Map R values to their Python equivalents for comparison
+            df_compare = df_compare.with_columns(
+                pl.col(r_col)
+                .replace_strict(mapping, default=pl.col(r_col), return_dtype=pl.Utf8)
+                .alias(f"{r_col}_mapped")
+            )
+            r_col_for_comparison = f"{r_col}_mapped"
+        else:
+            r_col_for_comparison = r_col
+
+        # Check if numeric column - use approximate comparison for floats
+        is_numeric = df_compare[r_col_for_comparison].dtype in [
+            pl.Float32,
+            pl.Float64,
+            pl.Int8,
+            pl.Int16,
+            pl.Int32,
+            pl.Int64,
+        ]
+
+        # Check if string column - treat null and empty string as equivalent
+        is_string = df_compare[r_col_for_comparison].dtype in [pl.Utf8, pl.String]
+
+        if is_numeric and df_compare[r_col_for_comparison].dtype in [pl.Float32, pl.Float64]:
+            # For floats, use approximate equality (accounting for floating point precision)
+            # Values must differ by more than 1e-6 to be considered different
+            diff_mask = (
+                # Both non-null and significantly different
+                (
+                    (df_compare[r_col_for_comparison].is_not_null())
+                    & (df_compare[py_col].is_not_null())
+                    & ((df_compare[r_col_for_comparison] - df_compare[py_col]).abs() > 1e-6)
+                )
+                # One null, other not null
+                | (
+                    (df_compare[r_col_for_comparison].is_null())
+                    & (df_compare[py_col].is_not_null())
+                )
+                | (
+                    (df_compare[r_col_for_comparison].is_not_null())
+                    & (df_compare[py_col].is_null())
+                )
+            )
+        elif is_string:
+            # For strings, treat null and empty string as equivalent
+            # Normalize: convert empty strings to null for comparison
+            r_normalized = (
+                pl.when(df_compare[r_col_for_comparison] == "")
+                .then(None)
+                .otherwise(df_compare[r_col_for_comparison])
+            )
+            py_normalized = (
+                pl.when(df_compare[py_col] == "").then(None).otherwise(df_compare[py_col])
+            )
+
+            df_compare = df_compare.with_columns(
+                [
+                    r_normalized.alias(f"{r_col_for_comparison}_norm"),
+                    py_normalized.alias(f"{py_col}_norm"),
+                ]
+            )
+
+            diff_mask = (
+                # Both non-null and different
+                (
+                    (df_compare[f"{r_col_for_comparison}_norm"].is_not_null())
+                    & (df_compare[f"{py_col}_norm"].is_not_null())
+                    & (df_compare[f"{r_col_for_comparison}_norm"] != df_compare[f"{py_col}_norm"])
+                )
+                # One null, other not null (after normalization)
+                | (
+                    (df_compare[f"{r_col_for_comparison}_norm"].is_null())
+                    & (df_compare[f"{py_col}_norm"].is_not_null())
+                )
+                | (
+                    (df_compare[f"{r_col_for_comparison}_norm"].is_not_null())
+                    & (df_compare[f"{py_col}_norm"].is_null())
+                )
+            )
+        else:
+            # For non-floats and non-strings, use exact comparison
+            diff_mask = (
+                # Both non-null and different
+                (
+                    (df_compare[r_col_for_comparison].is_not_null())
+                    & (df_compare[py_col].is_not_null())
+                    & (df_compare[r_col_for_comparison] != df_compare[py_col])
+                )
+                # One null, other not null
+                | (
+                    (df_compare[r_col_for_comparison].is_null())
+                    & (df_compare[py_col].is_not_null())
+                )
+                | (
+                    (df_compare[r_col_for_comparison].is_not_null())
+                    & (df_compare[py_col].is_null())
+                )
+            )
+
+        diff_records = df_compare.filter(diff_mask)
+
+        if len(diff_records) > 0:
+            mismatches.append(
+                {
+                    "column": col,
+                    "mismatches": len(diff_records),
+                    "sample_patients": diff_records.select(
+                        ["patient_id", "tracker_month", r_col, py_col]
+                    ).head(5),
+                }
+            )
+
+    if mismatches:
+        # Build detailed error message
+        error_msg = f"{filename}: Found data mismatches in {len(mismatches)} columns\n"
+        for mismatch in mismatches[:5]:  # Show first 5 columns with issues
+            error_msg += (
+                f"\nColumn '{mismatch['column']}': {mismatch['mismatches']} mismatching records\n"
+            )
+            error_msg += "Sample differing records:\n"
+            error_msg += str(mismatch["sample_patients"])
+
+        if len(mismatches) > 5:
+            error_msg += f"\n\n... and {len(mismatches) - 5} more columns with mismatches"
+
+        pytest.fail(error_msg)
diff --git a/a4d-python/tests/test_reference/__init__.py b/a4d-python/tests/test_reference/__init__.py
new file mode 100644
index 0000000..54f1221
--- /dev/null
+++ b/a4d-python/tests/test_reference/__init__.py
@@ -0,0 +1 @@
+"""Tests for reference data loaders and validators."""
diff --git a/a4d-python/tests/test_reference/test_provinces.py b/a4d-python/tests/test_reference/test_provinces.py
new file mode 100644
index 0000000..61eb58d
--- /dev/null
+++ b/a4d-python/tests/test_reference/test_provinces.py
@@ -0,0 +1,248 @@
+"""Tests for province validation."""
+
+from a4d.reference import (
+    get_country_for_province,
+    is_valid_province,
+    load_allowed_provinces,
+    load_provinces_by_country,
+)
+
+
+class TestLoadAllowedProvinces:
+    """Tests for load_allowed_provinces function."""
+
+    def test_loads_provinces_from_yaml(self):
+        """Test that provinces are loaded from YAML file."""
+        provinces = load_allowed_provinces()
+
+        assert isinstance(provinces, list)
+        assert len(provinces) > 0
+        assert all(isinstance(p, str) for p in provinces)
+
+    def test_provinces_are_lowercased(self):
+        """Test that all provinces are lowercased for case-insensitive matching."""
+        provinces = load_allowed_provinces()
+
+        # All should be lowercase
+        assert all(p == p.lower() for p in provinces)
+
+    def test_includes_known_provinces_lowercased(self):
+        """Test that known provinces are included (lowercased)."""
+        provinces = load_allowed_provinces()
+
+        # Test samples from each country in the YAML (lowercased)
+        assert "bangkok" in provinces  # Thailand
+        assert "vientiane" in provinces  # Laos
+        assert "hà nội*" in provinces  # Vietnam (note the asterisk)
+        assert "phnom penh" in provinces  # Cambodia
+        assert "yangon region" in provinces  # Myanmar
+        assert "kuala lumpur*" in provinces  # Malaysia
+
+    def test_returns_flattened_list(self):
+        """Test that provinces from all countries are in single list."""
+        provinces = load_allowed_provinces()
+        provinces_by_country = load_provinces_by_country()
+
+        # Count should match flattened version
+        expected_count = sum(len(provs) for provs in provinces_by_country.values())
+        assert len(provinces) == expected_count
+
+    def test_no_duplicates(self):
+        """Test that there are no duplicate provinces in the list."""
+        provinces = load_allowed_provinces()
+
+        assert len(provinces) == len(set(provinces))
+
+
+class TestLoadProvincesByCountry:
+    """Tests for load_provinces_by_country function."""
+
+    def test_loads_provinces_by_country(self):
+        """Test that provinces are organized by country."""
+        provinces_by_country = load_provinces_by_country()
+
+        assert isinstance(provinces_by_country, dict)
+        assert len(provinces_by_country) > 0
+
+    def test_provinces_are_lowercased(self):
+        """Test that all provinces are lowercased."""
+        provinces_by_country = load_provinces_by_country()
+
+        for _country, provinces in provinces_by_country.items():
+            assert all(p == p.lower() for p in provinces)
+
+    def test_includes_expected_countries(self):
+        """Test that expected countries are present."""
+        provinces_by_country = load_provinces_by_country()
+
+        expected_countries = [
+            "THAILAND",
+            "LAOS",
+            "VIETNAM",
+            "CAMBODIA",
+            "MYANMAR",
+            "MALAYSIA",
+        ]
+
+        for country in expected_countries:
+            assert country in provinces_by_country
+            assert len(provinces_by_country[country]) > 0
+
+    def test_thailand_provinces(self):
+        """Test that Thailand has correct number of provinces."""
+        provinces_by_country = load_provinces_by_country()
+
+        thailand_provinces = provinces_by_country["THAILAND"]
+
+        # Thailand has 72 provinces in the data file
+        assert len(thailand_provinces) == 72
+        assert "bangkok" in thailand_provinces
+        assert "chiang mai" in thailand_provinces
+        assert "phuket" in thailand_provinces
+
+
+class TestIsValidProvince:
+    """Tests for is_valid_province function."""
+
+    def test_valid_province_returns_true(self):
+        """Test that valid provinces return True."""
+        assert is_valid_province("Bangkok")
+        assert is_valid_province("Vientiane")
+        assert is_valid_province("Hà Nội*")
+        assert is_valid_province("Phnom Penh")
+
+    def test_invalid_province_returns_false(self):
+        """Test that invalid provinces return False."""
+        assert not is_valid_province("Invalid Province")
+        assert not is_valid_province("Unknown City")
+        assert not is_valid_province("Test")
+
+    def test_none_returns_true(self):
+        """Test that None is considered valid (nullable field)."""
+        assert is_valid_province(None)
+
+    def test_empty_string_returns_false(self):
+        """Test that empty string is invalid."""
+        assert not is_valid_province("")
+
+    def test_case_insensitive(self):
+        """Test that validation is case-insensitive."""
+        assert is_valid_province("Bangkok")
+        assert is_valid_province("bangkok")
+        assert is_valid_province("BANGKOK")
+        assert is_valid_province("BaNgKoK")
+
+    def test_unicode_provinces(self):
+        """Test that Unicode province names work correctly."""
+        # Vietnam has many provinces with Unicode characters
+        assert is_valid_province("Hà Nội*")
+        assert is_valid_province("Hồ Chí Minh*")
+        assert is_valid_province("Bà Rịa–Vũng Tàu")
+        assert is_valid_province("Đà Nẵng*")
+
+        # Case variations
+        assert is_valid_province("HÀ NỘI*")
+        assert is_valid_province("hà nội*")
+
+
+class TestGetCountryForProvince:
+    """Tests for get_country_for_province function."""
+
+    def test_returns_correct_country(self):
+        """Test that correct country is returned for provinces."""
+        assert get_country_for_province("Bangkok") == "THAILAND"
+        assert get_country_for_province("Vientiane") == "LAOS"
+        assert get_country_for_province("Hà Nội*") == "VIETNAM"
+        assert get_country_for_province("Phnom Penh") == "CAMBODIA"
+        assert get_country_for_province("Yangon Region") == "MYANMAR"
+        assert get_country_for_province("Kuala Lumpur*") == "MALAYSIA"
+
+    def test_returns_none_for_invalid_province(self):
+        """Test that None is returned for invalid provinces."""
+        assert get_country_for_province("Invalid Province") is None
+        assert get_country_for_province("Unknown") is None
+
+    def test_case_insensitive(self):
+        """Test that lookup is case-insensitive."""
+        assert get_country_for_province("Bangkok") == "THAILAND"
+        assert get_country_for_province("bangkok") == "THAILAND"
+        assert get_country_for_province("BANGKOK") == "THAILAND"
+        assert get_country_for_province("BaNgKoK") == "THAILAND"
+
+    def test_multiple_provinces_same_country(self):
+        """Test that different provinces from same country work."""
+        # All should return THAILAND
+        assert get_country_for_province("Bangkok") == "THAILAND"
+        assert get_country_for_province("Chiang Mai") == "THAILAND"
+        assert get_country_for_province("Phuket") == "THAILAND"
+
+    def test_unicode_provinces(self):
+        """Test that Unicode provinces work correctly."""
+        assert get_country_for_province("Hà Nội*") == "VIETNAM"
+        assert get_country_for_province("hà nội*") == "VIETNAM"
+        assert get_country_for_province("HÀ NỘI*") == "VIETNAM"
+
+
+class TestIntegrationWithActualData:
+    """Integration tests with actual reference_data file."""
+
+    def test_all_countries_have_provinces(self):
+        """Test that every country has at least one province."""
+        provinces_by_country = load_provinces_by_country()
+
+        for country, provinces in provinces_by_country.items():
+            assert len(provinces) > 0, f"{country} has no provinces"
+
+    def test_total_province_count(self):
+        """Test that total province count is reasonable."""
+        provinces = load_allowed_provinces()
+
+        # We expect 200+ provinces across all countries
+        assert len(provinces) > 200
+
+    def test_no_empty_province_names(self):
+        """Test that no province names are empty strings."""
+        provinces = load_allowed_provinces()
+
+        assert all(p.strip() for p in provinces)
+
+    def test_round_trip_validation(self):
+        """Test that all loaded provinces pass validation."""
+        provinces = load_allowed_provinces()
+
+        for province in provinces:
+            assert is_valid_province(province)
+            country = get_country_for_province(province)
+            assert country is not None
+
+    def test_special_characters_preserved(self):
+        """Test that special characters in province names are preserved."""
+        provinces = load_allowed_provinces()
+
+        # Vietnam provinces with Unicode (lowercased)
+        unicode_provinces = [p for p in provinces if any(ord(c) > 127 for c in p)]
+        assert len(unicode_provinces) > 0
+
+        # Provinces with asterisks (indicating cities, lowercased)
+        asterisk_provinces = [p for p in provinces if "*" in p]
+        assert len(asterisk_provinces) > 0
+
+    def test_case_insensitive_validation_comprehensive(self):
+        """Test case-insensitive validation with various cases."""
+        provinces_by_country = load_provinces_by_country()
+
+        # Get a few provinces from the data
+        provinces_by_country["THAILAND"]
+        vietnam = provinces_by_country["VIETNAM"]
+
+        # Test that both original case and variations work
+        # (provinces are stored lowercase, so we test against "bangkok")
+        assert is_valid_province("Bangkok")  # Title case
+        assert is_valid_province("BANGKOK")  # Upper case
+        assert is_valid_province("bangkok")  # Lower case
+
+        # Test with Vietnamese provinces
+        test_province = vietnam[0]  # Get first province
+        assert is_valid_province(test_province)
+        assert is_valid_province(test_province.upper())
+        assert is_valid_province(test_province.title())
diff --git a/a4d-python/tests/test_reference/test_synonyms.py b/a4d-python/tests/test_reference/test_synonyms.py
new file mode 100644
index 0000000..7e4dc61
--- /dev/null
+++ b/a4d-python/tests/test_reference/test_synonyms.py
@@ -0,0 +1,344 @@
+"""Tests for column synonym mapper."""
+
+from pathlib import Path
+
+import polars as pl
+import pytest
+import yaml
+
+from a4d.reference import ColumnMapper, load_patient_mapper, load_product_mapper
+from a4d.reference.synonyms import sanitize_str
+
+
+class TestSanitizeStr:
+    """Tests for sanitize_str function."""
+
+    def test_basic_sanitization(self):
+        """Test basic sanitization cases."""
+        assert sanitize_str("Patient ID") == "patientid"
+        assert sanitize_str("Patient ID*") == "patientid"
+        assert sanitize_str("Age* On Reporting") == "ageonreporting"
+
+    def test_lowercase_conversion(self):
+        """Test lowercase conversion."""
+        assert sanitize_str("PATIENT ID") == "patientid"
+        assert sanitize_str("Patient Name") == "patientname"
+
+    def test_space_removal(self):
+        """Test space removal."""
+        assert sanitize_str("Date 2022") == "date2022"
+        assert sanitize_str("My Awesome Column") == "myawesomecolumn"
+
+    def test_special_character_removal(self):
+        """Test special character removal."""
+        assert sanitize_str("Patient ID*") == "patientid"
+        assert sanitize_str("My Awesome 1st Column!!") == "myawesome1stcolumn"
+        assert sanitize_str("D.O.B.") == "dob"
+        assert sanitize_str("Age (Years)") == "ageyears"
+        assert sanitize_str("Patient.Name..ANON") == "patientnameanon"
+
+    def test_alphanumeric_preserved(self):
+        """Test that alphanumeric characters are preserved."""
+        assert sanitize_str("Age1") == "age1"
+        assert sanitize_str("test123abc") == "test123abc"
+
+    def test_empty_string(self):
+        """Test empty string."""
+        assert sanitize_str("") == ""
+
+    def test_only_special_chars(self):
+        """Test string with only special characters."""
+        assert sanitize_str("***!!!") == ""
+        assert sanitize_str("...") == ""
+
+
+class TestColumnMapper:
+    """Tests for ColumnMapper class."""
+
+    @pytest.fixture
+    def simple_synonyms(self, tmp_path: Path) -> Path:
+        """Create a simple synonym YAML file for testing."""
+        synonyms = {
+            "age": ["Age", "Age*", "age on reporting"],
+            "patient_id": ["ID", "Patient ID", "Patient ID*"],
+            "name": ["Patient Name"],
+            "province": ["Province"],
+            "empty_column": [],  # Column with no synonyms
+        }
+
+        yaml_path = tmp_path / "test_synonyms.yaml"
+        with open(yaml_path, "w") as f:
+            yaml.dump(synonyms, f)
+
+        return yaml_path
+
+    @pytest.fixture
+    def duplicate_synonyms(self, tmp_path: Path) -> Path:
+        """Create synonym YAML with duplicate synonyms."""
+        synonyms = {
+            "age": ["Age", "Years"],
+            "age_at_diagnosis": ["Age", "Age at diagnosis"],  # "Age" duplicated
+        }
+
+        yaml_path = tmp_path / "test_duplicates.yaml"
+        with open(yaml_path, "w") as f:
+            yaml.dump(synonyms, f)
+
+        return yaml_path
+
+    def test_init_loads_synonyms(self, simple_synonyms: Path):
+        """Test that __init__ loads synonyms from YAML file."""
+        mapper = ColumnMapper(simple_synonyms)
+
+        assert len(mapper.synonyms) == 5
+        assert "age" in mapper.synonyms
+        assert "Age" in mapper.synonyms["age"]
+        # After sanitization, some synonyms collapse (e.g., "Age" and "Age*" both become "age")
+        assert (
+            len(mapper._lookup) == 6
+        )  # Sanitized synonyms (age+ageonreporting+id+patientid+patientname+province)
+
+    def test_init_missing_file_raises_error(self):
+        """Test that __init__ raises error for missing file."""
+        with pytest.raises(FileNotFoundError, match="YAML file not found"):
+            ColumnMapper(Path("/nonexistent/file.yaml"))
+
+    def test_build_lookup_creates_reverse_mapping(self, simple_synonyms: Path):
+        """Test that reverse lookup is built correctly with SANITIZED keys."""
+        mapper = ColumnMapper(simple_synonyms)
+
+        # Lookup uses sanitized keys (lowercase, no spaces, no special chars)
+        assert mapper._lookup["age"] == "age"  # "Age" and "Age*" both sanitize to "age"
+        assert mapper._lookup["ageonreporting"] == "age"  # "age on reporting" → "ageonreporting"
+        assert mapper._lookup["id"] == "patient_id"  # "ID" → "id"
+        assert (
+            mapper._lookup["patientid"] == "patient_id"
+        )  # "Patient ID" and "Patient ID*" → "patientid"
+
+    def test_build_lookup_handles_duplicates(self, duplicate_synonyms: Path):
+        """Test that duplicate SANITIZED synonyms log warning and use last definition."""
+        mapper = ColumnMapper(duplicate_synonyms)
+
+        # "Age" appears in both age and age_at_diagnosis
+        # After sanitization, both become "age" → duplicate!
+        # Should map to the last one encountered
+        assert "age" in mapper._lookup
+        assert mapper._lookup["age"] in ["age", "age_at_diagnosis"]
+
+    def test_get_standard_name(self, simple_synonyms: Path):
+        """Test getting standard name for a column."""
+        mapper = ColumnMapper(simple_synonyms)
+
+        assert mapper.get_standard_name("Age") == "age"
+        assert mapper.get_standard_name("Patient ID*") == "patient_id"
+        assert mapper.get_standard_name("unknown_column") == "unknown_column"
+
+    def test_get_standard_name_with_sanitization(self, simple_synonyms: Path):
+        """Test that sanitization allows flexible synonym matching."""
+        mapper = ColumnMapper(simple_synonyms)
+
+        # All these variants should map to "patient_id" after sanitization
+        assert mapper.get_standard_name("Patient ID") == "patient_id"
+        assert mapper.get_standard_name("Patient ID*") == "patient_id"
+        assert mapper.get_standard_name("PATIENT ID") == "patient_id"
+        assert mapper.get_standard_name("patient id") == "patient_id"
+        assert mapper.get_standard_name("ID") == "patient_id"
+
+        # Age variants
+        assert mapper.get_standard_name("Age") == "age"
+        assert mapper.get_standard_name("Age*") == "age"
+        assert mapper.get_standard_name("age on reporting") == "age"
+        assert mapper.get_standard_name("AGE ON REPORTING") == "age"
+
+        # Test with extra spaces/special chars (should still match)
+        assert mapper.get_standard_name("Patient  ID*") == "patient_id"
+
+    def test_rename_columns_basic(self, simple_synonyms: Path):
+        """Test basic column renaming."""
+        mapper = ColumnMapper(simple_synonyms)
+
+        df = pl.DataFrame(
+            {
+                "Age": [25, 30],
+                "Patient ID": ["P001", "P002"],
+                "Province": ["Bangkok", "Hanoi"],
+            }
+        )
+
+        renamed = mapper.rename_columns(df)
+
+        assert "age" in renamed.columns
+        assert "patient_id" in renamed.columns
+        assert "province" in renamed.columns
+        assert "Age" not in renamed.columns
+
+    def test_rename_columns_keeps_unmapped(self, simple_synonyms: Path):
+        """Test that unmapped columns are kept by default."""
+        mapper = ColumnMapper(simple_synonyms)
+
+        df = pl.DataFrame(
+            {
+                "Age": [25],
+                "UnknownColumn": ["value"],
+                "AnotherUnmapped": [42],
+            }
+        )
+
+        renamed = mapper.rename_columns(df)
+
+        assert "age" in renamed.columns
+        assert "UnknownColumn" in renamed.columns
+        assert "AnotherUnmapped" in renamed.columns
+
+    def test_rename_columns_strict_mode_raises_error(self, simple_synonyms: Path):
+        """Test that strict mode raises error for unmapped columns."""
+        mapper = ColumnMapper(simple_synonyms)
+
+        df = pl.DataFrame(
+            {
+                "Age": [25],
+                "UnknownColumn": ["value"],
+            }
+        )
+
+        with pytest.raises(ValueError, match="Unmapped columns found"):
+            mapper.rename_columns(df, strict=True)
+
+    def test_rename_columns_no_changes_needed(self, simple_synonyms: Path):
+        """Test renaming when columns are already standardized."""
+        mapper = ColumnMapper(simple_synonyms)
+
+        df = pl.DataFrame(
+            {
+                "age": [25],
+                "patient_id": ["P001"],
+            }
+        )
+
+        renamed = mapper.rename_columns(df)
+
+        assert renamed.columns == df.columns
+        assert renamed.equals(df)
+
+    def test_get_expected_columns(self, simple_synonyms: Path):
+        """Test getting set of expected standard columns."""
+        mapper = ColumnMapper(simple_synonyms)
+
+        expected = mapper.get_expected_columns()
+
+        assert expected == {"age", "patient_id", "name", "province", "empty_column"}
+
+    def test_get_missing_columns(self, simple_synonyms: Path):
+        """Test getting missing columns from DataFrame."""
+        mapper = ColumnMapper(simple_synonyms)
+
+        df = pl.DataFrame(
+            {
+                "age": [25],
+                "patient_id": ["P001"],
+            }
+        )
+
+        missing = mapper.get_missing_columns(df)
+
+        assert missing == {"name", "province", "empty_column"}
+
+    def test_validate_required_columns_success(self, simple_synonyms: Path):
+        """Test validation passes when required columns present."""
+        mapper = ColumnMapper(simple_synonyms)
+
+        df = pl.DataFrame(
+            {
+                "age": [25],
+                "patient_id": ["P001"],
+                "name": ["Test"],
+            }
+        )
+
+        # Should not raise
+        mapper.validate_required_columns(df, ["age", "patient_id"])
+
+    def test_validate_required_columns_failure(self, simple_synonyms: Path):
+        """Test validation fails when required columns missing."""
+        mapper = ColumnMapper(simple_synonyms)
+
+        df = pl.DataFrame(
+            {
+                "age": [25],
+            }
+        )
+
+        with pytest.raises(ValueError, match="Required columns missing"):
+            mapper.validate_required_columns(df, ["age", "patient_id", "name"])
+
+
+class TestLoaderFunctions:
+    """Tests for loader convenience functions."""
+
+    def test_load_patient_mapper_with_actual_file(self):
+        """Test loading patient mapper with actual reference_data file."""
+        mapper = load_patient_mapper()
+
+        # Check that some expected columns are present
+        assert "age" in mapper.synonyms
+        assert "patient_id" in mapper.synonyms
+        assert "province" in mapper.synonyms
+
+        # Check that synonyms are loaded
+        assert len(mapper._lookup) > 0
+        assert mapper.get_standard_name("Age") == "age"
+
+    def test_load_product_mapper_with_actual_file(self):
+        """Test loading product mapper with actual reference_data file."""
+        mapper = load_product_mapper()
+
+        # Check that some expected columns are present
+        assert "product" in mapper.synonyms
+        assert "clinic_id" in mapper.synonyms
+
+        # Check that synonyms are loaded
+        assert len(mapper._lookup) > 0
+
+
+class TestIntegrationWithActualData:
+    """Integration tests with actual reference_data files."""
+
+    def test_patient_mapper_renames_all_known_synonyms(self):
+        """Test that patient mapper can rename all synonyms in YAML."""
+        mapper = load_patient_mapper()
+
+        # Create DataFrame with various synonyms
+        test_data = {
+            "Age": [25],
+            "Patient ID": ["P001"],
+            "D.O.B.": ["1999-01-01"],
+            "Gender": ["M"],
+        }
+
+        df = pl.DataFrame(test_data)
+        renamed = mapper.rename_columns(df)
+
+        # Check that columns are renamed correctly
+        assert "age" in renamed.columns
+        assert "patient_id" in renamed.columns
+        assert "dob" in renamed.columns
+        assert "sex" in renamed.columns
+
+    def test_product_mapper_renames_all_known_synonyms(self):
+        """Test that product mapper can rename all synonyms in YAML."""
+        mapper = load_product_mapper()
+
+        # Create DataFrame with various synonyms
+        test_data = {
+            "Product": ["Insulin"],
+            "Date": ["2024-01-01"],
+            "Units Received": [10],
+        }
+
+        df = pl.DataFrame(test_data)
+        renamed = mapper.rename_columns(df)
+
+        # Check that columns are renamed correctly
+        assert "product" in renamed.columns
+        assert "product_entry_date" in renamed.columns
+        assert "product_units_received" in renamed.columns
diff --git a/a4d-python/tests/test_tables/test_patient.py b/a4d-python/tests/test_tables/test_patient.py
new file mode 100644
index 0000000..31aa932
--- /dev/null
+++ b/a4d-python/tests/test_tables/test_patient.py
@@ -0,0 +1,361 @@
+"""Tests for patient table creation."""
+
+from pathlib import Path
+
+import polars as pl
+import pytest
+
+from a4d.tables.patient import (
+    create_table_patient_data_annual,
+    create_table_patient_data_monthly,
+    create_table_patient_data_static,
+    read_cleaned_patient_data,
+)
+
+
+@pytest.fixture
+def cleaned_patient_data_files(tmp_path: Path) -> list[Path]:
+    """Create test cleaned patient data files."""
+    data_dir = tmp_path / "cleaned"
+    data_dir.mkdir()
+
+    file1 = data_dir / "tracker1_2024_01.parquet"
+    df1 = pl.DataFrame(
+        {
+            "patient_id": ["P001", "P002", "P003"],
+            "clinic_id": ["C001", "C001", "C002"],
+            "name": ["Alice", "Bob", "Charlie"],
+            "dob": ["2010-01-15", "2011-03-20", "2009-08-10"],
+            "sex": ["F", "M", "M"],
+            "recruitment_date": ["2024-01-10", "2024-01-15", "2024-01-05"],
+            "province": ["Province1", "Province1", "Province2"],
+            "hba1c_baseline": [8.5, 7.2, 9.1],
+            "hba1c_baseline_exceeds": [True, False, True],
+            "fbg_baseline_mg": [120, 110, 130],
+            "fbg_baseline_mmol": [6.7, 6.1, 7.2],
+            "patient_consent": [True, True, True],
+            "t1d_diagnosis_date": ["2023-01-01", "2022-05-10", "2021-12-15"],
+            "t1d_diagnosis_age": [13, 11, 12],
+            "t1d_diagnosis_with_dka": [True, False, True],
+            "status_out": ["Active", "Active", "Active"],
+            "lost_date": [None, None, None],
+            "file_name": ["tracker1.xlsx", "tracker1.xlsx", "tracker1.xlsx"],
+            "tracker_date": ["2024-01-31", "2024-01-31", "2024-01-31"],
+            "tracker_month": [1, 1, 1],
+            "tracker_year": [2024, 2024, 2024],
+            "sheet_name": ["Jan 2024", "Jan 2024", "Jan 2024"],
+            "weight": [45.5, 52.3, 48.1],
+            "height": [155, 162, 158],
+            "bmi": [18.9, 19.9, 19.3],
+            "bmi_date": ["2024-01-15", "2024-01-18", "2024-01-20"],
+            "age": [14, 13, 15],
+            "status": ["Active", "Active", "Active"],
+            "hba1c_updated": [7.8, 6.9, 8.5],
+            "hba1c_updated_date": ["2024-01-20", "2024-01-22", "2024-01-18"],
+            "hba1c_updated_exceeds": [False, False, True],
+            "fbg_updated_mg": [115, 105, 125],
+            "fbg_updated_mmol": [6.4, 5.8, 6.9],
+            "fbg_updated_date": ["2024-01-20", "2024-01-22", "2024-01-18"],
+            "insulin_type": ["Rapid", "Mixed", "Rapid"],
+            "insulin_subtype": ["Lispro", "30/70", "Aspart"],
+            "insulin_regimen": ["Basal-bolus", "Twice daily", "Basal-bolus"],
+            "insulin_injections": [4, 2, 4],
+            "insulin_total_units": [35, 28, 40],
+            "testing_frequency": [4, 3, 4],
+            "support_level": ["Full", "Full", "Partial"],
+            "last_clinic_visit_date": ["2024-01-25", "2024-01-28", "2024-01-22"],
+            "last_remote_followup_date": [None, None, None],
+            "hospitalisation_date": [None, None, None],
+            "hospitalisation_cause": [None, None, None],
+            "observations": ["Doing well", "Good progress", "Needs improvement"],
+            "observations_category": ["Good", "Good", "Fair"],
+            "edu_occ": ["Student", "Student", "Student"],
+            "edu_occ_updated": ["Student", "Student", "Student"],
+            "blood_pressure_updated": ["110/70", "115/75", "120/80"],
+            "blood_pressure_sys_mmhg": [110, 115, 120],
+            "blood_pressure_dias_mmhg": [70, 75, 80],
+            "complication_screening_kidney_test_date": ["2024-01-10", None, "2024-01-08"],
+            "complication_screening_kidney_test_value": ["Normal", None, "Normal"],
+            "complication_screening_eye_exam_date": ["2024-01-10", None, None],
+            "complication_screening_eye_exam_value": ["Normal", None, None],
+            "complication_screening_foot_exam_date": [None, None, None],
+            "complication_screening_foot_exam_value": [None, None, None],
+            "complication_screening_lipid_profile_date": [None, None, None],
+            "complication_screening_lipid_profile_triglycerides_value": [None, None, None],
+            "complication_screening_lipid_profile_cholesterol_value": [None, None, None],
+            "complication_screening_lipid_profile_ldl_mg_value": [None, None, None],
+            "complication_screening_lipid_profile_ldl_mmol_value": [None, None, None],
+            "complication_screening_lipid_profile_hdl_mg_value": [None, None, None],
+            "complication_screening_lipid_profile_hdl_mmol_value": [None, None, None],
+            "complication_screening_thyroid_test_date": [None, None, None],
+            "complication_screening_thyroid_test_ft4_ng_value": [None, None, None],
+            "complication_screening_thyroid_test_ft4_pmol_value": [None, None, None],
+            "complication_screening_thyroid_test_tsh_value": [None, None, None],
+            "complication_screening_remarks": [None, None, None],
+            "dm_complication_eye": [None, None, None],
+            "dm_complication_kidney": [None, None, None],
+            "dm_complication_others": [None, None, None],
+            "dm_complication_remarks": [None, None, None],
+            "family_history": ["No diabetes", "Type 2 in family", "No diabetes"],
+            "other_issues": [None, None, None],
+        }
+    )
+    df1.write_parquet(file1)
+
+    file2 = data_dir / "tracker1_2024_02.parquet"
+    df2 = pl.DataFrame(
+        {
+            "patient_id": ["P001", "P002"],
+            "clinic_id": ["C001", "C001"],
+            "name": ["Alice", "Bob"],
+            "dob": ["2010-01-15", "2011-03-20"],
+            "sex": ["F", "M"],
+            "recruitment_date": ["2024-01-10", "2024-01-15"],
+            "province": ["Province1", "Province1"],
+            "hba1c_baseline": [8.5, 7.2],
+            "hba1c_baseline_exceeds": [True, False],
+            "fbg_baseline_mg": [120, 110],
+            "fbg_baseline_mmol": [6.7, 6.1],
+            "patient_consent": [True, True],
+            "t1d_diagnosis_date": ["2023-01-01", "2022-05-10"],
+            "t1d_diagnosis_age": [13, 11],
+            "t1d_diagnosis_with_dka": [True, False],
+            "status_out": ["Active", "Active"],
+            "lost_date": [None, None],
+            "file_name": ["tracker1.xlsx", "tracker1.xlsx"],
+            "tracker_date": ["2024-02-29", "2024-02-29"],
+            "tracker_month": [2, 2],
+            "tracker_year": [2024, 2024],
+            "sheet_name": ["Feb 2024", "Feb 2024"],
+            "weight": [46.0, 52.8],
+            "height": [155, 162],
+            "bmi": [19.1, 20.1],
+            "bmi_date": ["2024-02-15", "2024-02-18"],
+            "age": [14, 13],
+            "status": ["Active", "Active"],
+            "hba1c_updated": [7.5, 6.7],
+            "hba1c_updated_date": ["2024-02-20", "2024-02-22"],
+            "hba1c_updated_exceeds": [False, False],
+            "fbg_updated_mg": [110, 100],
+            "fbg_updated_mmol": [6.1, 5.6],
+            "fbg_updated_date": ["2024-02-20", "2024-02-22"],
+            "insulin_type": ["Rapid", "Mixed"],
+            "insulin_subtype": ["Lispro", "30/70"],
+            "insulin_regimen": ["Basal-bolus", "Twice daily"],
+            "insulin_injections": [4, 2],
+            "insulin_total_units": [36, 29],
+            "testing_frequency": [4, 3],
+            "support_level": ["Full", "Full"],
+            "last_clinic_visit_date": ["2024-02-25", "2024-02-28"],
+            "last_remote_followup_date": [None, None],
+            "hospitalisation_date": [None, None],
+            "hospitalisation_cause": [None, None],
+            "observations": ["Excellent progress", "Very good"],
+            "observations_category": ["Excellent", "Good"],
+            "edu_occ": ["Student", "Student"],
+            "edu_occ_updated": ["Student", "Student"],
+            "blood_pressure_updated": ["108/68", "112/72"],
+            "blood_pressure_sys_mmhg": [108, 112],
+            "blood_pressure_dias_mmhg": [68, 72],
+            "complication_screening_kidney_test_date": [None, None],
+            "complication_screening_kidney_test_value": [None, None],
+            "complication_screening_eye_exam_date": [None, None],
+            "complication_screening_eye_exam_value": [None, None],
+            "complication_screening_foot_exam_date": [None, None],
+            "complication_screening_foot_exam_value": [None, None],
+            "complication_screening_lipid_profile_date": [None, None],
+            "complication_screening_lipid_profile_triglycerides_value": [None, None],
+            "complication_screening_lipid_profile_cholesterol_value": [None, None],
+            "complication_screening_lipid_profile_ldl_mg_value": [None, None],
+            "complication_screening_lipid_profile_ldl_mmol_value": [None, None],
+            "complication_screening_lipid_profile_hdl_mg_value": [None, None],
+            "complication_screening_lipid_profile_hdl_mmol_value": [None, None],
+            "complication_screening_thyroid_test_date": [None, None],
+            "complication_screening_thyroid_test_ft4_ng_value": [None, None],
+            "complication_screening_thyroid_test_ft4_pmol_value": [None, None],
+            "complication_screening_thyroid_test_tsh_value": [None, None],
+            "complication_screening_remarks": [None, None],
+            "dm_complication_eye": [None, None],
+            "dm_complication_kidney": [None, None],
+            "dm_complication_others": [None, None],
+            "dm_complication_remarks": [None, None],
+            "family_history": ["No diabetes", "Type 2 in family"],
+            "other_issues": [None, None],
+        }
+    )
+    df2.write_parquet(file2)
+
+    return [file1, file2]
+
+
+def test_read_cleaned_patient_data(cleaned_patient_data_files: list[Path]):
+    """Test reading and combining cleaned patient data files."""
+    result = read_cleaned_patient_data(cleaned_patient_data_files)
+
+    assert isinstance(result, pl.DataFrame)
+    assert result.shape[0] == 5  # 3 rows from file1 + 2 rows from file2
+    assert "patient_id" in result.columns
+    assert "clinic_id" in result.columns
+    assert set(result["patient_id"].to_list()) == {"P001", "P002", "P003"}
+
+
+def test_read_cleaned_patient_data_empty_list():
+    """Test that empty file list raises error."""
+    with pytest.raises(ValueError, match="No cleaned files provided"):
+        read_cleaned_patient_data([])
+
+
+def test_create_table_patient_data_static(cleaned_patient_data_files: list[Path], tmp_path: Path):
+    """Test creation of static patient data table."""
+    output_dir = tmp_path / "output"
+
+    output_file = create_table_patient_data_static(cleaned_patient_data_files, output_dir)
+
+    assert output_file.exists()
+    assert output_file.name == "patient_data_static.parquet"
+
+    result = pl.read_parquet(output_file)
+
+    assert result.shape[0] == 3
+    assert set(result["patient_id"].to_list()) == {"P001", "P002", "P003"}
+
+    p001_data = result.filter(pl.col("patient_id") == "P001")
+    assert p001_data["tracker_month"][0] == 2
+    assert p001_data["tracker_year"][0] == 2024
+
+    p002_data = result.filter(pl.col("patient_id") == "P002")
+    assert p002_data["tracker_month"][0] == 2
+    assert p002_data["tracker_year"][0] == 2024
+
+    p003_data = result.filter(pl.col("patient_id") == "P003")
+    assert p003_data["tracker_month"][0] == 1
+    assert p003_data["tracker_year"][0] == 2024
+
+    assert "name" in result.columns
+    assert "dob" in result.columns
+    assert "recruitment_date" in result.columns
+    assert "weight" not in result.columns
+    assert "status" not in result.columns
+
+
+def test_create_table_patient_data_monthly(cleaned_patient_data_files: list[Path], tmp_path: Path):
+    """Test creation of monthly patient data table."""
+    output_dir = tmp_path / "output"
+
+    output_file = create_table_patient_data_monthly(cleaned_patient_data_files, output_dir)
+
+    assert output_file.exists()
+    assert output_file.name == "patient_data_monthly.parquet"
+
+    result = pl.read_parquet(output_file)
+
+    assert result.shape[0] == 5
+
+    assert "weight" in result.columns
+    assert "bmi" in result.columns
+    assert "status" in result.columns
+    assert "insulin_type" in result.columns
+    assert "name" not in result.columns
+    assert "dob" not in result.columns
+
+    sorted_check = result["tracker_year"].to_list()
+    assert sorted_check == sorted(sorted_check)
+
+
+def test_create_table_patient_data_annual(cleaned_patient_data_files: list[Path], tmp_path: Path):
+    """Test creation of annual patient data table."""
+    output_dir = tmp_path / "output"
+
+    output_file = create_table_patient_data_annual(cleaned_patient_data_files, output_dir)
+
+    assert output_file.exists()
+    assert output_file.name == "patient_data_annual.parquet"
+
+    result = pl.read_parquet(output_file)
+
+    assert result.shape[0] == 3
+
+    assert "complication_screening_kidney_test_date" in result.columns
+    assert "dm_complication_eye" in result.columns
+    assert "family_history" in result.columns
+    assert "name" not in result.columns
+    assert "weight" not in result.columns
+
+    p001_data = result.filter(pl.col("patient_id") == "P001")
+    assert p001_data.shape[0] == 1
+    assert p001_data["tracker_month"][0] == 2
+    assert p001_data["tracker_year"][0] == 2024
+
+
+def test_create_table_patient_data_annual_filters_pre_2024(tmp_path: Path):
+    """Test that annual table filters out data before 2024."""
+    data_dir = tmp_path / "cleaned"
+    data_dir.mkdir()
+
+    file1 = data_dir / "tracker_2023.parquet"
+    df1 = pl.DataFrame(
+        {
+            "patient_id": ["P001"],
+            "status": ["Active"],
+            "tracker_month": [12],
+            "tracker_year": [2023],
+            "tracker_date": ["2023-12-31"],
+            "edu_occ": ["Student"],
+            "edu_occ_updated": ["Student"],
+            "blood_pressure_updated": ["110/70"],
+            "blood_pressure_sys_mmhg": [110],
+            "blood_pressure_dias_mmhg": [70],
+            "complication_screening_kidney_test_date": [None],
+            "complication_screening_kidney_test_value": [None],
+            "complication_screening_eye_exam_date": [None],
+            "complication_screening_eye_exam_value": [None],
+            "complication_screening_foot_exam_date": [None],
+            "complication_screening_foot_exam_value": [None],
+            "complication_screening_lipid_profile_date": [None],
+            "complication_screening_lipid_profile_triglycerides_value": [None],
+            "complication_screening_lipid_profile_cholesterol_value": [None],
+            "complication_screening_lipid_profile_ldl_mg_value": [None],
+            "complication_screening_lipid_profile_ldl_mmol_value": [None],
+            "complication_screening_lipid_profile_hdl_mg_value": [None],
+            "complication_screening_lipid_profile_hdl_mmol_value": [None],
+            "complication_screening_thyroid_test_date": [None],
+            "complication_screening_thyroid_test_ft4_ng_value": [None],
+            "complication_screening_thyroid_test_ft4_pmol_value": [None],
+            "complication_screening_thyroid_test_tsh_value": [None],
+            "complication_screening_remarks": [None],
+            "dm_complication_eye": [None],
+            "dm_complication_kidney": [None],
+            "dm_complication_others": [None],
+            "dm_complication_remarks": [None],
+            "family_history": ["No diabetes"],
+            "other_issues": [None],
+        }
+    )
+    df1.write_parquet(file1)
+
+    output_dir = tmp_path / "output"
+    output_file = create_table_patient_data_annual([file1], output_dir)
+
+    result = pl.read_parquet(output_file)
+    assert result.shape[0] == 0
+
+
+def test_static_table_sorting(cleaned_patient_data_files: list[Path], tmp_path: Path):
+    """Test that static table is sorted correctly."""
+    output_dir = tmp_path / "output"
+    output_file = create_table_patient_data_static(cleaned_patient_data_files, output_dir)
+
+    result = pl.read_parquet(output_file)
+
+    tracker_years = result["tracker_year"].to_list()
+    tracker_months = result["tracker_month"].to_list()
+    patient_ids = result["patient_id"].to_list()
+
+    for i in range(len(result) - 1):
+        if tracker_years[i] < tracker_years[i + 1]:
+            continue
+        elif tracker_years[i] == tracker_years[i + 1]:
+            if tracker_months[i] < tracker_months[i + 1]:
+                continue
+            elif tracker_months[i] == tracker_months[i + 1]:
+                assert patient_ids[i] <= patient_ids[i + 1]
diff --git a/a4d-python/uv.lock b/a4d-python/uv.lock
new file mode 100644
index 0000000..10cf087
--- /dev/null
+++ b/a4d-python/uv.lock
@@ -0,0 +1,1298 @@
+version = 1
+revision = 3
+requires-python = ">=3.11"
+resolution-markers = [
+    "python_full_version >= '3.14'",
+    "python_full_version == '3.13.*'",
+    "python_full_version < '3.13'",
+]
+
+[[package]]
+name = "a4d"
+version = "2.0.0"
+source = { editable = "." }
+dependencies = [
+    { name = "duckdb" },
+    { name = "fastexcel" },
+    { name = "google-cloud-bigquery" },
+    { name = "google-cloud-storage" },
+    { name = "loguru" },
+    { name = "openpyxl" },
+    { name = "pandera", extra = ["polars"] },
+    { name = "polars" },
+    { name = "pydantic" },
+    { name = "pydantic-settings" },
+    { name = "python-dateutil" },
+    { name = "pyyaml" },
+    { name = "rich" },
+    { name = "tqdm" },
+    { name = "typer" },
+]
+
+[package.dev-dependencies]
+dev = [
+    { name = "pre-commit" },
+    { name = "pytest" },
+    { name = "pytest-cov" },
+    { name = "pytest-mock" },
+    { name = "ruff" },
+    { name = "ty" },
+]
+
+[package.metadata]
+requires-dist = [
+    { name = "duckdb", specifier = ">=0.10.0" },
+    { name = "fastexcel", specifier = ">=0.16.0" },
+    { name = "google-cloud-bigquery", specifier = ">=3.17.0" },
+    { name = "google-cloud-storage", specifier = ">=2.14.0" },
+    { name = "loguru", specifier = ">=0.7.0" },
+    { name = "openpyxl", specifier = ">=3.1.0" },
+    { name = "pandera", extras = ["polars"], specifier = ">=0.18.0" },
+    { name = "polars", specifier = ">=0.20.0" },
+    { name = "pydantic", specifier = ">=2.6.0" },
+    { name = "pydantic-settings", specifier = ">=2.2.0" },
+    { name = "python-dateutil", specifier = ">=2.8.0" },
+    { name = "pyyaml", specifier = ">=6.0" },
+    { name = "rich", specifier = ">=13.7.0" },
+    { name = "tqdm", specifier = ">=4.66.0" },
+    { name = "typer", specifier = ">=0.9.0" },
+]
+
+[package.metadata.requires-dev]
+dev = [
+    { name = "pre-commit", specifier = ">=4.3.0" },
+    { name = "pytest", specifier = ">=8.4.2" },
+    { name = "pytest-cov", specifier = ">=7.0.0" },
+    { name = "pytest-mock", specifier = ">=3.15.1" },
+    { name = "ruff", specifier = ">=0.14.1" },
+    { name = "ty", specifier = ">=0.0.1a23" },
+]
+
+[[package]]
+name = "annotated-types"
+version = "0.7.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/ee/67/531ea369ba64dcff5ec9c3402f9f51bf748cec26dde048a2f973a4eea7f5/annotated_types-0.7.0.tar.gz", hash = "sha256:aff07c09a53a08bc8cfccb9c85b05f1aa9a2a6f23728d790723543408344ce89", size = 16081, upload-time = "2024-05-20T21:33:25.928Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/78/b6/6307fbef88d9b5ee7421e68d78a9f162e0da4900bc5f5793f6d3d0e34fb8/annotated_types-0.7.0-py3-none-any.whl", hash = "sha256:1f02e8b43a8fbbc3f3e0d4f0f4bfc8131bcb4eebe8849b8e5c773f3a1c582a53", size = 13643, upload-time = "2024-05-20T21:33:24.1Z" },
+]
+
+[[package]]
+name = "cachetools"
+version = "6.2.1"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/cc/7e/b975b5814bd36faf009faebe22c1072a1fa1168db34d285ef0ba071ad78c/cachetools-6.2.1.tar.gz", hash = "sha256:3f391e4bd8f8bf0931169baf7456cc822705f4e2a31f840d218f445b9a854201", size = 31325, upload-time = "2025-10-12T14:55:30.139Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/96/c5/1e741d26306c42e2bf6ab740b2202872727e0f606033c9dd713f8b93f5a8/cachetools-6.2.1-py3-none-any.whl", hash = "sha256:09868944b6dde876dfd44e1d47e18484541eaf12f26f29b7af91b26cc892d701", size = 11280, upload-time = "2025-10-12T14:55:28.382Z" },
+]
+
+[[package]]
+name = "certifi"
+version = "2025.10.5"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/4c/5b/b6ce21586237c77ce67d01dc5507039d444b630dd76611bbca2d8e5dcd91/certifi-2025.10.5.tar.gz", hash = "sha256:47c09d31ccf2acf0be3f701ea53595ee7e0b8fa08801c6624be771df09ae7b43", size = 164519, upload-time = "2025-10-05T04:12:15.808Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/e4/37/af0d2ef3967ac0d6113837b44a4f0bfe1328c2b9763bd5b1744520e5cfed/certifi-2025.10.5-py3-none-any.whl", hash = "sha256:0f212c2744a9bb6de0c56639a6f68afe01ecd92d91f14ae897c4fe7bbeeef0de", size = 163286, upload-time = "2025-10-05T04:12:14.03Z" },
+]
+
+[[package]]
+name = "cfgv"
+version = "3.4.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/11/74/539e56497d9bd1d484fd863dd69cbbfa653cd2aa27abfe35653494d85e94/cfgv-3.4.0.tar.gz", hash = "sha256:e52591d4c5f5dead8e0f673fb16db7949d2cfb3f7da4582893288f0ded8fe560", size = 7114, upload-time = "2023-08-12T20:38:17.776Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/c5/55/51844dd50c4fc7a33b653bfaba4c2456f06955289ca770a5dbd5fd267374/cfgv-3.4.0-py2.py3-none-any.whl", hash = "sha256:b7265b1f29fd3316bfcd2b330d63d024f2bfd8bcb8b0272f8e19a504856c48f9", size = 7249, upload-time = "2023-08-12T20:38:16.269Z" },
+]
+
+[[package]]
+name = "charset-normalizer"
+version = "3.4.4"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/13/69/33ddede1939fdd074bce5434295f38fae7136463422fe4fd3e0e89b98062/charset_normalizer-3.4.4.tar.gz", hash = "sha256:94537985111c35f28720e43603b8e7b43a6ecfb2ce1d3058bbe955b73404e21a", size = 129418, upload-time = "2025-10-14T04:42:32.879Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/ed/27/c6491ff4954e58a10f69ad90aca8a1b6fe9c5d3c6f380907af3c37435b59/charset_normalizer-3.4.4-cp311-cp311-macosx_10_9_universal2.whl", hash = "sha256:6e1fcf0720908f200cd21aa4e6750a48ff6ce4afe7ff5a79a90d5ed8a08296f8", size = 206988, upload-time = "2025-10-14T04:40:33.79Z" },
+    { url = "https://files.pythonhosted.org/packages/94/59/2e87300fe67ab820b5428580a53cad894272dbb97f38a7a814a2a1ac1011/charset_normalizer-3.4.4-cp311-cp311-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:5f819d5fe9234f9f82d75bdfa9aef3a3d72c4d24a6e57aeaebba32a704553aa0", size = 147324, upload-time = "2025-10-14T04:40:34.961Z" },
+    { url = "https://files.pythonhosted.org/packages/07/fb/0cf61dc84b2b088391830f6274cb57c82e4da8bbc2efeac8c025edb88772/charset_normalizer-3.4.4-cp311-cp311-manylinux2014_armv7l.manylinux_2_17_armv7l.manylinux_2_31_armv7l.whl", hash = "sha256:a59cb51917aa591b1c4e6a43c132f0cdc3c76dbad6155df4e28ee626cc77a0a3", size = 142742, upload-time = "2025-10-14T04:40:36.105Z" },
+    { url = "https://files.pythonhosted.org/packages/62/8b/171935adf2312cd745d290ed93cf16cf0dfe320863ab7cbeeae1dcd6535f/charset_normalizer-3.4.4-cp311-cp311-manylinux2014_ppc64le.manylinux_2_17_ppc64le.manylinux_2_28_ppc64le.whl", hash = "sha256:8ef3c867360f88ac904fd3f5e1f902f13307af9052646963ee08ff4f131adafc", size = 160863, upload-time = "2025-10-14T04:40:37.188Z" },
+    { url = "https://files.pythonhosted.org/packages/09/73/ad875b192bda14f2173bfc1bc9a55e009808484a4b256748d931b6948442/charset_normalizer-3.4.4-cp311-cp311-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:d9e45d7faa48ee908174d8fe84854479ef838fc6a705c9315372eacbc2f02897", size = 157837, upload-time = "2025-10-14T04:40:38.435Z" },
+    { url = "https://files.pythonhosted.org/packages/6d/fc/de9cce525b2c5b94b47c70a4b4fb19f871b24995c728e957ee68ab1671ea/charset_normalizer-3.4.4-cp311-cp311-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:840c25fb618a231545cbab0564a799f101b63b9901f2569faecd6b222ac72381", size = 151550, upload-time = "2025-10-14T04:40:40.053Z" },
+    { url = "https://files.pythonhosted.org/packages/55/c2/43edd615fdfba8c6f2dfbd459b25a6b3b551f24ea21981e23fb768503ce1/charset_normalizer-3.4.4-cp311-cp311-manylinux_2_31_riscv64.manylinux_2_39_riscv64.whl", hash = "sha256:ca5862d5b3928c4940729dacc329aa9102900382fea192fc5e52eb69d6093815", size = 149162, upload-time = "2025-10-14T04:40:41.163Z" },
+    { url = "https://files.pythonhosted.org/packages/03/86/bde4ad8b4d0e9429a4e82c1e8f5c659993a9a863ad62c7df05cf7b678d75/charset_normalizer-3.4.4-cp311-cp311-musllinux_1_2_aarch64.whl", hash = "sha256:d9c7f57c3d666a53421049053eaacdd14bbd0a528e2186fcb2e672effd053bb0", size = 150019, upload-time = "2025-10-14T04:40:42.276Z" },
+    { url = "https://files.pythonhosted.org/packages/1f/86/a151eb2af293a7e7bac3a739b81072585ce36ccfb4493039f49f1d3cae8c/charset_normalizer-3.4.4-cp311-cp311-musllinux_1_2_armv7l.whl", hash = "sha256:277e970e750505ed74c832b4bf75dac7476262ee2a013f5574dd49075879e161", size = 143310, upload-time = "2025-10-14T04:40:43.439Z" },
+    { url = "https://files.pythonhosted.org/packages/b5/fe/43dae6144a7e07b87478fdfc4dbe9efd5defb0e7ec29f5f58a55aeef7bf7/charset_normalizer-3.4.4-cp311-cp311-musllinux_1_2_ppc64le.whl", hash = "sha256:31fd66405eaf47bb62e8cd575dc621c56c668f27d46a61d975a249930dd5e2a4", size = 162022, upload-time = "2025-10-14T04:40:44.547Z" },
+    { url = "https://files.pythonhosted.org/packages/80/e6/7aab83774f5d2bca81f42ac58d04caf44f0cc2b65fc6db2b3b2e8a05f3b3/charset_normalizer-3.4.4-cp311-cp311-musllinux_1_2_riscv64.whl", hash = "sha256:0d3d8f15c07f86e9ff82319b3d9ef6f4bf907608f53fe9d92b28ea9ae3d1fd89", size = 149383, upload-time = "2025-10-14T04:40:46.018Z" },
+    { url = "https://files.pythonhosted.org/packages/4f/e8/b289173b4edae05c0dde07f69f8db476a0b511eac556dfe0d6bda3c43384/charset_normalizer-3.4.4-cp311-cp311-musllinux_1_2_s390x.whl", hash = "sha256:9f7fcd74d410a36883701fafa2482a6af2ff5ba96b9a620e9e0721e28ead5569", size = 159098, upload-time = "2025-10-14T04:40:47.081Z" },
+    { url = "https://files.pythonhosted.org/packages/d8/df/fe699727754cae3f8478493c7f45f777b17c3ef0600e28abfec8619eb49c/charset_normalizer-3.4.4-cp311-cp311-musllinux_1_2_x86_64.whl", hash = "sha256:ebf3e58c7ec8a8bed6d66a75d7fb37b55e5015b03ceae72a8e7c74495551e224", size = 152991, upload-time = "2025-10-14T04:40:48.246Z" },
+    { url = "https://files.pythonhosted.org/packages/1a/86/584869fe4ddb6ffa3bd9f491b87a01568797fb9bd8933f557dba9771beaf/charset_normalizer-3.4.4-cp311-cp311-win32.whl", hash = "sha256:eecbc200c7fd5ddb9a7f16c7decb07b566c29fa2161a16cf67b8d068bd21690a", size = 99456, upload-time = "2025-10-14T04:40:49.376Z" },
+    { url = "https://files.pythonhosted.org/packages/65/f6/62fdd5feb60530f50f7e38b4f6a1d5203f4d16ff4f9f0952962c044e919a/charset_normalizer-3.4.4-cp311-cp311-win_amd64.whl", hash = "sha256:5ae497466c7901d54b639cf42d5b8c1b6a4fead55215500d2f486d34db48d016", size = 106978, upload-time = "2025-10-14T04:40:50.844Z" },
+    { url = "https://files.pythonhosted.org/packages/7a/9d/0710916e6c82948b3be62d9d398cb4fcf4e97b56d6a6aeccd66c4b2f2bd5/charset_normalizer-3.4.4-cp311-cp311-win_arm64.whl", hash = "sha256:65e2befcd84bc6f37095f5961e68a6f077bf44946771354a28ad434c2cce0ae1", size = 99969, upload-time = "2025-10-14T04:40:52.272Z" },
+    { url = "https://files.pythonhosted.org/packages/f3/85/1637cd4af66fa687396e757dec650f28025f2a2f5a5531a3208dc0ec43f2/charset_normalizer-3.4.4-cp312-cp312-macosx_10_13_universal2.whl", hash = "sha256:0a98e6759f854bd25a58a73fa88833fba3b7c491169f86ce1180c948ab3fd394", size = 208425, upload-time = "2025-10-14T04:40:53.353Z" },
+    { url = "https://files.pythonhosted.org/packages/9d/6a/04130023fef2a0d9c62d0bae2649b69f7b7d8d24ea5536feef50551029df/charset_normalizer-3.4.4-cp312-cp312-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:b5b290ccc2a263e8d185130284f8501e3e36c5e02750fc6b6bdeb2e9e96f1e25", size = 148162, upload-time = "2025-10-14T04:40:54.558Z" },
+    { url = "https://files.pythonhosted.org/packages/78/29/62328d79aa60da22c9e0b9a66539feae06ca0f5a4171ac4f7dc285b83688/charset_normalizer-3.4.4-cp312-cp312-manylinux2014_armv7l.manylinux_2_17_armv7l.manylinux_2_31_armv7l.whl", hash = "sha256:74bb723680f9f7a6234dcf67aea57e708ec1fbdf5699fb91dfd6f511b0a320ef", size = 144558, upload-time = "2025-10-14T04:40:55.677Z" },
+    { url = "https://files.pythonhosted.org/packages/86/bb/b32194a4bf15b88403537c2e120b817c61cd4ecffa9b6876e941c3ee38fe/charset_normalizer-3.4.4-cp312-cp312-manylinux2014_ppc64le.manylinux_2_17_ppc64le.manylinux_2_28_ppc64le.whl", hash = "sha256:f1e34719c6ed0b92f418c7c780480b26b5d9c50349e9a9af7d76bf757530350d", size = 161497, upload-time = "2025-10-14T04:40:57.217Z" },
+    { url = "https://files.pythonhosted.org/packages/19/89/a54c82b253d5b9b111dc74aca196ba5ccfcca8242d0fb64146d4d3183ff1/charset_normalizer-3.4.4-cp312-cp312-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:2437418e20515acec67d86e12bf70056a33abdacb5cb1655042f6538d6b085a8", size = 159240, upload-time = "2025-10-14T04:40:58.358Z" },
+    { url = "https://files.pythonhosted.org/packages/c0/10/d20b513afe03acc89ec33948320a5544d31f21b05368436d580dec4e234d/charset_normalizer-3.4.4-cp312-cp312-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:11d694519d7f29d6cd09f6ac70028dba10f92f6cdd059096db198c283794ac86", size = 153471, upload-time = "2025-10-14T04:40:59.468Z" },
+    { url = "https://files.pythonhosted.org/packages/61/fa/fbf177b55bdd727010f9c0a3c49eefa1d10f960e5f09d1d887bf93c2e698/charset_normalizer-3.4.4-cp312-cp312-manylinux_2_31_riscv64.manylinux_2_39_riscv64.whl", hash = "sha256:ac1c4a689edcc530fc9d9aa11f5774b9e2f33f9a0c6a57864e90908f5208d30a", size = 150864, upload-time = "2025-10-14T04:41:00.623Z" },
+    { url = "https://files.pythonhosted.org/packages/05/12/9fbc6a4d39c0198adeebbde20b619790e9236557ca59fc40e0e3cebe6f40/charset_normalizer-3.4.4-cp312-cp312-musllinux_1_2_aarch64.whl", hash = "sha256:21d142cc6c0ec30d2efee5068ca36c128a30b0f2c53c1c07bd78cb6bc1d3be5f", size = 150647, upload-time = "2025-10-14T04:41:01.754Z" },
+    { url = "https://files.pythonhosted.org/packages/ad/1f/6a9a593d52e3e8c5d2b167daf8c6b968808efb57ef4c210acb907c365bc4/charset_normalizer-3.4.4-cp312-cp312-musllinux_1_2_armv7l.whl", hash = "sha256:5dbe56a36425d26d6cfb40ce79c314a2e4dd6211d51d6d2191c00bed34f354cc", size = 145110, upload-time = "2025-10-14T04:41:03.231Z" },
+    { url = "https://files.pythonhosted.org/packages/30/42/9a52c609e72471b0fc54386dc63c3781a387bb4fe61c20231a4ebcd58bdd/charset_normalizer-3.4.4-cp312-cp312-musllinux_1_2_ppc64le.whl", hash = "sha256:5bfbb1b9acf3334612667b61bd3002196fe2a1eb4dd74d247e0f2a4d50ec9bbf", size = 162839, upload-time = "2025-10-14T04:41:04.715Z" },
+    { url = "https://files.pythonhosted.org/packages/c4/5b/c0682bbf9f11597073052628ddd38344a3d673fda35a36773f7d19344b23/charset_normalizer-3.4.4-cp312-cp312-musllinux_1_2_riscv64.whl", hash = "sha256:d055ec1e26e441f6187acf818b73564e6e6282709e9bcb5b63f5b23068356a15", size = 150667, upload-time = "2025-10-14T04:41:05.827Z" },
+    { url = "https://files.pythonhosted.org/packages/e4/24/a41afeab6f990cf2daf6cb8c67419b63b48cf518e4f56022230840c9bfb2/charset_normalizer-3.4.4-cp312-cp312-musllinux_1_2_s390x.whl", hash = "sha256:af2d8c67d8e573d6de5bc30cdb27e9b95e49115cd9baad5ddbd1a6207aaa82a9", size = 160535, upload-time = "2025-10-14T04:41:06.938Z" },
+    { url = "https://files.pythonhosted.org/packages/2a/e5/6a4ce77ed243c4a50a1fecca6aaaab419628c818a49434be428fe24c9957/charset_normalizer-3.4.4-cp312-cp312-musllinux_1_2_x86_64.whl", hash = "sha256:780236ac706e66881f3b7f2f32dfe90507a09e67d1d454c762cf642e6e1586e0", size = 154816, upload-time = "2025-10-14T04:41:08.101Z" },
+    { url = "https://files.pythonhosted.org/packages/a8/ef/89297262b8092b312d29cdb2517cb1237e51db8ecef2e9af5edbe7b683b1/charset_normalizer-3.4.4-cp312-cp312-win32.whl", hash = "sha256:5833d2c39d8896e4e19b689ffc198f08ea58116bee26dea51e362ecc7cd3ed26", size = 99694, upload-time = "2025-10-14T04:41:09.23Z" },
+    { url = "https://files.pythonhosted.org/packages/3d/2d/1e5ed9dd3b3803994c155cd9aacb60c82c331bad84daf75bcb9c91b3295e/charset_normalizer-3.4.4-cp312-cp312-win_amd64.whl", hash = "sha256:a79cfe37875f822425b89a82333404539ae63dbdddf97f84dcbc3d339aae9525", size = 107131, upload-time = "2025-10-14T04:41:10.467Z" },
+    { url = "https://files.pythonhosted.org/packages/d0/d9/0ed4c7098a861482a7b6a95603edce4c0d9db2311af23da1fb2b75ec26fc/charset_normalizer-3.4.4-cp312-cp312-win_arm64.whl", hash = "sha256:376bec83a63b8021bb5c8ea75e21c4ccb86e7e45ca4eb81146091b56599b80c3", size = 100390, upload-time = "2025-10-14T04:41:11.915Z" },
+    { url = "https://files.pythonhosted.org/packages/97/45/4b3a1239bbacd321068ea6e7ac28875b03ab8bc0aa0966452db17cd36714/charset_normalizer-3.4.4-cp313-cp313-macosx_10_13_universal2.whl", hash = "sha256:e1f185f86a6f3403aa2420e815904c67b2f9ebc443f045edd0de921108345794", size = 208091, upload-time = "2025-10-14T04:41:13.346Z" },
+    { url = "https://files.pythonhosted.org/packages/7d/62/73a6d7450829655a35bb88a88fca7d736f9882a27eacdca2c6d505b57e2e/charset_normalizer-3.4.4-cp313-cp313-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:6b39f987ae8ccdf0d2642338faf2abb1862340facc796048b604ef14919e55ed", size = 147936, upload-time = "2025-10-14T04:41:14.461Z" },
+    { url = "https://files.pythonhosted.org/packages/89/c5/adb8c8b3d6625bef6d88b251bbb0d95f8205831b987631ab0c8bb5d937c2/charset_normalizer-3.4.4-cp313-cp313-manylinux2014_armv7l.manylinux_2_17_armv7l.manylinux_2_31_armv7l.whl", hash = "sha256:3162d5d8ce1bb98dd51af660f2121c55d0fa541b46dff7bb9b9f86ea1d87de72", size = 144180, upload-time = "2025-10-14T04:41:15.588Z" },
+    { url = "https://files.pythonhosted.org/packages/91/ed/9706e4070682d1cc219050b6048bfd293ccf67b3d4f5a4f39207453d4b99/charset_normalizer-3.4.4-cp313-cp313-manylinux2014_ppc64le.manylinux_2_17_ppc64le.manylinux_2_28_ppc64le.whl", hash = "sha256:81d5eb2a312700f4ecaa977a8235b634ce853200e828fbadf3a9c50bab278328", size = 161346, upload-time = "2025-10-14T04:41:16.738Z" },
+    { url = "https://files.pythonhosted.org/packages/d5/0d/031f0d95e4972901a2f6f09ef055751805ff541511dc1252ba3ca1f80cf5/charset_normalizer-3.4.4-cp313-cp313-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:5bd2293095d766545ec1a8f612559f6b40abc0eb18bb2f5d1171872d34036ede", size = 158874, upload-time = "2025-10-14T04:41:17.923Z" },
+    { url = "https://files.pythonhosted.org/packages/f5/83/6ab5883f57c9c801ce5e5677242328aa45592be8a00644310a008d04f922/charset_normalizer-3.4.4-cp313-cp313-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:a8a8b89589086a25749f471e6a900d3f662d1d3b6e2e59dcecf787b1cc3a1894", size = 153076, upload-time = "2025-10-14T04:41:19.106Z" },
+    { url = "https://files.pythonhosted.org/packages/75/1e/5ff781ddf5260e387d6419959ee89ef13878229732732ee73cdae01800f2/charset_normalizer-3.4.4-cp313-cp313-manylinux_2_31_riscv64.manylinux_2_39_riscv64.whl", hash = "sha256:bc7637e2f80d8530ee4a78e878bce464f70087ce73cf7c1caf142416923b98f1", size = 150601, upload-time = "2025-10-14T04:41:20.245Z" },
+    { url = "https://files.pythonhosted.org/packages/d7/57/71be810965493d3510a6ca79b90c19e48696fb1ff964da319334b12677f0/charset_normalizer-3.4.4-cp313-cp313-musllinux_1_2_aarch64.whl", hash = "sha256:f8bf04158c6b607d747e93949aa60618b61312fe647a6369f88ce2ff16043490", size = 150376, upload-time = "2025-10-14T04:41:21.398Z" },
+    { url = "https://files.pythonhosted.org/packages/e5/d5/c3d057a78c181d007014feb7e9f2e65905a6c4ef182c0ddf0de2924edd65/charset_normalizer-3.4.4-cp313-cp313-musllinux_1_2_armv7l.whl", hash = "sha256:554af85e960429cf30784dd47447d5125aaa3b99a6f0683589dbd27e2f45da44", size = 144825, upload-time = "2025-10-14T04:41:22.583Z" },
+    { url = "https://files.pythonhosted.org/packages/e6/8c/d0406294828d4976f275ffbe66f00266c4b3136b7506941d87c00cab5272/charset_normalizer-3.4.4-cp313-cp313-musllinux_1_2_ppc64le.whl", hash = "sha256:74018750915ee7ad843a774364e13a3db91682f26142baddf775342c3f5b1133", size = 162583, upload-time = "2025-10-14T04:41:23.754Z" },
+    { url = "https://files.pythonhosted.org/packages/d7/24/e2aa1f18c8f15c4c0e932d9287b8609dd30ad56dbe41d926bd846e22fb8d/charset_normalizer-3.4.4-cp313-cp313-musllinux_1_2_riscv64.whl", hash = "sha256:c0463276121fdee9c49b98908b3a89c39be45d86d1dbaa22957e38f6321d4ce3", size = 150366, upload-time = "2025-10-14T04:41:25.27Z" },
+    { url = "https://files.pythonhosted.org/packages/e4/5b/1e6160c7739aad1e2df054300cc618b06bf784a7a164b0f238360721ab86/charset_normalizer-3.4.4-cp313-cp313-musllinux_1_2_s390x.whl", hash = "sha256:362d61fd13843997c1c446760ef36f240cf81d3ebf74ac62652aebaf7838561e", size = 160300, upload-time = "2025-10-14T04:41:26.725Z" },
+    { url = "https://files.pythonhosted.org/packages/7a/10/f882167cd207fbdd743e55534d5d9620e095089d176d55cb22d5322f2afd/charset_normalizer-3.4.4-cp313-cp313-musllinux_1_2_x86_64.whl", hash = "sha256:9a26f18905b8dd5d685d6d07b0cdf98a79f3c7a918906af7cc143ea2e164c8bc", size = 154465, upload-time = "2025-10-14T04:41:28.322Z" },
+    { url = "https://files.pythonhosted.org/packages/89/66/c7a9e1b7429be72123441bfdbaf2bc13faab3f90b933f664db506dea5915/charset_normalizer-3.4.4-cp313-cp313-win32.whl", hash = "sha256:9b35f4c90079ff2e2edc5b26c0c77925e5d2d255c42c74fdb70fb49b172726ac", size = 99404, upload-time = "2025-10-14T04:41:29.95Z" },
+    { url = "https://files.pythonhosted.org/packages/c4/26/b9924fa27db384bdcd97ab83b4f0a8058d96ad9626ead570674d5e737d90/charset_normalizer-3.4.4-cp313-cp313-win_amd64.whl", hash = "sha256:b435cba5f4f750aa6c0a0d92c541fb79f69a387c91e61f1795227e4ed9cece14", size = 107092, upload-time = "2025-10-14T04:41:31.188Z" },
+    { url = "https://files.pythonhosted.org/packages/af/8f/3ed4bfa0c0c72a7ca17f0380cd9e4dd842b09f664e780c13cff1dcf2ef1b/charset_normalizer-3.4.4-cp313-cp313-win_arm64.whl", hash = "sha256:542d2cee80be6f80247095cc36c418f7bddd14f4a6de45af91dfad36d817bba2", size = 100408, upload-time = "2025-10-14T04:41:32.624Z" },
+    { url = "https://files.pythonhosted.org/packages/2a/35/7051599bd493e62411d6ede36fd5af83a38f37c4767b92884df7301db25d/charset_normalizer-3.4.4-cp314-cp314-macosx_10_13_universal2.whl", hash = "sha256:da3326d9e65ef63a817ecbcc0df6e94463713b754fe293eaa03da99befb9a5bd", size = 207746, upload-time = "2025-10-14T04:41:33.773Z" },
+    { url = "https://files.pythonhosted.org/packages/10/9a/97c8d48ef10d6cd4fcead2415523221624bf58bcf68a802721a6bc807c8f/charset_normalizer-3.4.4-cp314-cp314-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:8af65f14dc14a79b924524b1e7fffe304517b2bff5a58bf64f30b98bbc5079eb", size = 147889, upload-time = "2025-10-14T04:41:34.897Z" },
+    { url = "https://files.pythonhosted.org/packages/10/bf/979224a919a1b606c82bd2c5fa49b5c6d5727aa47b4312bb27b1734f53cd/charset_normalizer-3.4.4-cp314-cp314-manylinux2014_armv7l.manylinux_2_17_armv7l.manylinux_2_31_armv7l.whl", hash = "sha256:74664978bb272435107de04e36db5a9735e78232b85b77d45cfb38f758efd33e", size = 143641, upload-time = "2025-10-14T04:41:36.116Z" },
+    { url = "https://files.pythonhosted.org/packages/ba/33/0ad65587441fc730dc7bd90e9716b30b4702dc7b617e6ba4997dc8651495/charset_normalizer-3.4.4-cp314-cp314-manylinux2014_ppc64le.manylinux_2_17_ppc64le.manylinux_2_28_ppc64le.whl", hash = "sha256:752944c7ffbfdd10c074dc58ec2d5a8a4cd9493b314d367c14d24c17684ddd14", size = 160779, upload-time = "2025-10-14T04:41:37.229Z" },
+    { url = "https://files.pythonhosted.org/packages/67/ed/331d6b249259ee71ddea93f6f2f0a56cfebd46938bde6fcc6f7b9a3d0e09/charset_normalizer-3.4.4-cp314-cp314-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:d1f13550535ad8cff21b8d757a3257963e951d96e20ec82ab44bc64aeb62a191", size = 159035, upload-time = "2025-10-14T04:41:38.368Z" },
+    { url = "https://files.pythonhosted.org/packages/67/ff/f6b948ca32e4f2a4576aa129d8bed61f2e0543bf9f5f2b7fc3758ed005c9/charset_normalizer-3.4.4-cp314-cp314-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:ecaae4149d99b1c9e7b88bb03e3221956f68fd6d50be2ef061b2381b61d20838", size = 152542, upload-time = "2025-10-14T04:41:39.862Z" },
+    { url = "https://files.pythonhosted.org/packages/16/85/276033dcbcc369eb176594de22728541a925b2632f9716428c851b149e83/charset_normalizer-3.4.4-cp314-cp314-manylinux_2_31_riscv64.manylinux_2_39_riscv64.whl", hash = "sha256:cb6254dc36b47a990e59e1068afacdcd02958bdcce30bb50cc1700a8b9d624a6", size = 149524, upload-time = "2025-10-14T04:41:41.319Z" },
+    { url = "https://files.pythonhosted.org/packages/9e/f2/6a2a1f722b6aba37050e626530a46a68f74e63683947a8acff92569f979a/charset_normalizer-3.4.4-cp314-cp314-musllinux_1_2_aarch64.whl", hash = "sha256:c8ae8a0f02f57a6e61203a31428fa1d677cbe50c93622b4149d5c0f319c1d19e", size = 150395, upload-time = "2025-10-14T04:41:42.539Z" },
+    { url = "https://files.pythonhosted.org/packages/60/bb/2186cb2f2bbaea6338cad15ce23a67f9b0672929744381e28b0592676824/charset_normalizer-3.4.4-cp314-cp314-musllinux_1_2_armv7l.whl", hash = "sha256:47cc91b2f4dd2833fddaedd2893006b0106129d4b94fdb6af1f4ce5a9965577c", size = 143680, upload-time = "2025-10-14T04:41:43.661Z" },
+    { url = "https://files.pythonhosted.org/packages/7d/a5/bf6f13b772fbb2a90360eb620d52ed8f796f3c5caee8398c3b2eb7b1c60d/charset_normalizer-3.4.4-cp314-cp314-musllinux_1_2_ppc64le.whl", hash = "sha256:82004af6c302b5d3ab2cfc4cc5f29db16123b1a8417f2e25f9066f91d4411090", size = 162045, upload-time = "2025-10-14T04:41:44.821Z" },
+    { url = "https://files.pythonhosted.org/packages/df/c5/d1be898bf0dc3ef9030c3825e5d3b83f2c528d207d246cbabe245966808d/charset_normalizer-3.4.4-cp314-cp314-musllinux_1_2_riscv64.whl", hash = "sha256:2b7d8f6c26245217bd2ad053761201e9f9680f8ce52f0fcd8d0755aeae5b2152", size = 149687, upload-time = "2025-10-14T04:41:46.442Z" },
+    { url = "https://files.pythonhosted.org/packages/a5/42/90c1f7b9341eef50c8a1cb3f098ac43b0508413f33affd762855f67a410e/charset_normalizer-3.4.4-cp314-cp314-musllinux_1_2_s390x.whl", hash = "sha256:799a7a5e4fb2d5898c60b640fd4981d6a25f1c11790935a44ce38c54e985f828", size = 160014, upload-time = "2025-10-14T04:41:47.631Z" },
+    { url = "https://files.pythonhosted.org/packages/76/be/4d3ee471e8145d12795ab655ece37baed0929462a86e72372fd25859047c/charset_normalizer-3.4.4-cp314-cp314-musllinux_1_2_x86_64.whl", hash = "sha256:99ae2cffebb06e6c22bdc25801d7b30f503cc87dbd283479e7b606f70aff57ec", size = 154044, upload-time = "2025-10-14T04:41:48.81Z" },
+    { url = "https://files.pythonhosted.org/packages/b0/6f/8f7af07237c34a1defe7defc565a9bc1807762f672c0fde711a4b22bf9c0/charset_normalizer-3.4.4-cp314-cp314-win32.whl", hash = "sha256:f9d332f8c2a2fcbffe1378594431458ddbef721c1769d78e2cbc06280d8155f9", size = 99940, upload-time = "2025-10-14T04:41:49.946Z" },
+    { url = "https://files.pythonhosted.org/packages/4b/51/8ade005e5ca5b0d80fb4aff72a3775b325bdc3d27408c8113811a7cbe640/charset_normalizer-3.4.4-cp314-cp314-win_amd64.whl", hash = "sha256:8a6562c3700cce886c5be75ade4a5db4214fda19fede41d9792d100288d8f94c", size = 107104, upload-time = "2025-10-14T04:41:51.051Z" },
+    { url = "https://files.pythonhosted.org/packages/da/5f/6b8f83a55bb8278772c5ae54a577f3099025f9ade59d0136ac24a0df4bde/charset_normalizer-3.4.4-cp314-cp314-win_arm64.whl", hash = "sha256:de00632ca48df9daf77a2c65a484531649261ec9f25489917f09e455cb09ddb2", size = 100743, upload-time = "2025-10-14T04:41:52.122Z" },
+    { url = "https://files.pythonhosted.org/packages/0a/4c/925909008ed5a988ccbb72dcc897407e5d6d3bd72410d69e051fc0c14647/charset_normalizer-3.4.4-py3-none-any.whl", hash = "sha256:7a32c560861a02ff789ad905a2fe94e3f840803362c84fecf1851cb4cf3dc37f", size = 53402, upload-time = "2025-10-14T04:42:31.76Z" },
+]
+
+[[package]]
+name = "click"
+version = "8.3.0"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "colorama", marker = "sys_platform == 'win32'" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/46/61/de6cd827efad202d7057d93e0fed9294b96952e188f7384832791c7b2254/click-8.3.0.tar.gz", hash = "sha256:e7b8232224eba16f4ebe410c25ced9f7875cb5f3263ffc93cc3e8da705e229c4", size = 276943, upload-time = "2025-09-18T17:32:23.696Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/db/d3/9dcc0f5797f070ec8edf30fbadfb200e71d9db6b84d211e3b2085a7589a0/click-8.3.0-py3-none-any.whl", hash = "sha256:9b9f285302c6e3064f4330c05f05b81945b2a39544279343e6e7c5f27a9baddc", size = 107295, upload-time = "2025-09-18T17:32:22.42Z" },
+]
+
+[[package]]
+name = "colorama"
+version = "0.4.6"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/d8/53/6f443c9a4a8358a93a6792e2acffb9d9d5cb0a5cfd8802644b7b1c9a02e4/colorama-0.4.6.tar.gz", hash = "sha256:08695f5cb7ed6e0531a20572697297273c47b8cae5a63ffc6d6ed5c201be6e44", size = 27697, upload-time = "2022-10-25T02:36:22.414Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/d1/d6/3965ed04c63042e047cb6a3e6ed1a63a35087b6a609aa3a15ed8ac56c221/colorama-0.4.6-py2.py3-none-any.whl", hash = "sha256:4f1d9991f5acc0ca119f9d443620b77f9d6b33703e51011c16baf57afb285fc6", size = 25335, upload-time = "2022-10-25T02:36:20.889Z" },
+]
+
+[[package]]
+name = "coverage"
+version = "7.11.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/1c/38/ee22495420457259d2f3390309505ea98f98a5eed40901cf62196abad006/coverage-7.11.0.tar.gz", hash = "sha256:167bd504ac1ca2af7ff3b81d245dfea0292c5032ebef9d66cc08a7d28c1b8050", size = 811905, upload-time = "2025-10-15T15:15:08.542Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/49/3a/ee1074c15c408ddddddb1db7dd904f6b81bc524e01f5a1c5920e13dbde23/coverage-7.11.0-cp311-cp311-macosx_10_9_x86_64.whl", hash = "sha256:3d58ecaa865c5b9fa56e35efc51d1014d4c0d22838815b9fce57a27dd9576847", size = 215912, upload-time = "2025-10-15T15:12:40.665Z" },
+    { url = "https://files.pythonhosted.org/packages/70/c4/9f44bebe5cb15f31608597b037d78799cc5f450044465bcd1ae8cb222fe1/coverage-7.11.0-cp311-cp311-macosx_11_0_arm64.whl", hash = "sha256:b679e171f1c104a5668550ada700e3c4937110dbdd153b7ef9055c4f1a1ee3cc", size = 216310, upload-time = "2025-10-15T15:12:42.461Z" },
+    { url = "https://files.pythonhosted.org/packages/42/01/5e06077cfef92d8af926bdd86b84fb28bf9bc6ad27343d68be9b501d89f2/coverage-7.11.0-cp311-cp311-manylinux1_i686.manylinux_2_28_i686.manylinux_2_5_i686.whl", hash = "sha256:ca61691ba8c5b6797deb221a0d09d7470364733ea9c69425a640f1f01b7c5bf0", size = 246706, upload-time = "2025-10-15T15:12:44.001Z" },
+    { url = "https://files.pythonhosted.org/packages/40/b8/7a3f1f33b35cc4a6c37e759137533119560d06c0cc14753d1a803be0cd4a/coverage-7.11.0-cp311-cp311-manylinux1_x86_64.manylinux_2_28_x86_64.manylinux_2_5_x86_64.whl", hash = "sha256:aef1747ede4bd8ca9cfc04cc3011516500c6891f1b33a94add3253f6f876b7b7", size = 248634, upload-time = "2025-10-15T15:12:45.768Z" },
+    { url = "https://files.pythonhosted.org/packages/7a/41/7f987eb33de386bc4c665ab0bf98d15fcf203369d6aacae74f5dd8ec489a/coverage-7.11.0-cp311-cp311-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:a1839d08406e4cba2953dcc0ffb312252f14d7c4c96919f70167611f4dee2623", size = 250741, upload-time = "2025-10-15T15:12:47.222Z" },
+    { url = "https://files.pythonhosted.org/packages/23/c1/a4e0ca6a4e83069fb8216b49b30a7352061ca0cb38654bd2dc96b7b3b7da/coverage-7.11.0-cp311-cp311-manylinux_2_31_riscv64.manylinux_2_39_riscv64.whl", hash = "sha256:e0eb0a2dcc62478eb5b4cbb80b97bdee852d7e280b90e81f11b407d0b81c4287", size = 246837, upload-time = "2025-10-15T15:12:48.904Z" },
+    { url = "https://files.pythonhosted.org/packages/5d/03/ced062a17f7c38b4728ff76c3acb40d8465634b20b4833cdb3cc3a74e115/coverage-7.11.0-cp311-cp311-musllinux_1_2_aarch64.whl", hash = "sha256:bc1fbea96343b53f65d5351d8fd3b34fd415a2670d7c300b06d3e14a5af4f552", size = 248429, upload-time = "2025-10-15T15:12:50.73Z" },
+    { url = "https://files.pythonhosted.org/packages/97/af/a7c6f194bb8c5a2705ae019036b8fe7f49ea818d638eedb15fdb7bed227c/coverage-7.11.0-cp311-cp311-musllinux_1_2_i686.whl", hash = "sha256:214b622259dd0cf435f10241f1333d32caa64dbc27f8790ab693428a141723de", size = 246490, upload-time = "2025-10-15T15:12:52.646Z" },
+    { url = "https://files.pythonhosted.org/packages/ab/c3/aab4df02b04a8fde79068c3c41ad7a622b0ef2b12e1ed154da986a727c3f/coverage-7.11.0-cp311-cp311-musllinux_1_2_riscv64.whl", hash = "sha256:258d9967520cca899695d4eb7ea38be03f06951d6ca2f21fb48b1235f791e601", size = 246208, upload-time = "2025-10-15T15:12:54.586Z" },
+    { url = "https://files.pythonhosted.org/packages/30/d8/e282ec19cd658238d60ed404f99ef2e45eed52e81b866ab1518c0d4163cf/coverage-7.11.0-cp311-cp311-musllinux_1_2_x86_64.whl", hash = "sha256:cf9e6ff4ca908ca15c157c409d608da77a56a09877b97c889b98fb2c32b6465e", size = 247126, upload-time = "2025-10-15T15:12:56.485Z" },
+    { url = "https://files.pythonhosted.org/packages/d1/17/a635fa07fac23adb1a5451ec756216768c2767efaed2e4331710342a3399/coverage-7.11.0-cp311-cp311-win32.whl", hash = "sha256:fcc15fc462707b0680cff6242c48625da7f9a16a28a41bb8fd7a4280920e676c", size = 218314, upload-time = "2025-10-15T15:12:58.365Z" },
+    { url = "https://files.pythonhosted.org/packages/2a/29/2ac1dfcdd4ab9a70026edc8d715ece9b4be9a1653075c658ee6f271f394d/coverage-7.11.0-cp311-cp311-win_amd64.whl", hash = "sha256:865965bf955d92790f1facd64fe7ff73551bd2c1e7e6b26443934e9701ba30b9", size = 219203, upload-time = "2025-10-15T15:12:59.902Z" },
+    { url = "https://files.pythonhosted.org/packages/03/21/5ce8b3a0133179115af4c041abf2ee652395837cb896614beb8ce8ddcfd9/coverage-7.11.0-cp311-cp311-win_arm64.whl", hash = "sha256:5693e57a065760dcbeb292d60cc4d0231a6d4b6b6f6a3191561e1d5e8820b745", size = 217879, upload-time = "2025-10-15T15:13:01.35Z" },
+    { url = "https://files.pythonhosted.org/packages/c4/db/86f6906a7c7edc1a52b2c6682d6dd9be775d73c0dfe2b84f8923dfea5784/coverage-7.11.0-cp312-cp312-macosx_10_13_x86_64.whl", hash = "sha256:9c49e77811cf9d024b95faf86c3f059b11c0c9be0b0d61bc598f453703bd6fd1", size = 216098, upload-time = "2025-10-15T15:13:02.916Z" },
+    { url = "https://files.pythonhosted.org/packages/21/54/e7b26157048c7ba555596aad8569ff903d6cd67867d41b75287323678ede/coverage-7.11.0-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:a61e37a403a778e2cda2a6a39abcc895f1d984071942a41074b5c7ee31642007", size = 216331, upload-time = "2025-10-15T15:13:04.403Z" },
+    { url = "https://files.pythonhosted.org/packages/b9/19/1ce6bf444f858b83a733171306134a0544eaddf1ca8851ede6540a55b2ad/coverage-7.11.0-cp312-cp312-manylinux1_i686.manylinux_2_28_i686.manylinux_2_5_i686.whl", hash = "sha256:c79cae102bb3b1801e2ef1511fb50e91ec83a1ce466b2c7c25010d884336de46", size = 247825, upload-time = "2025-10-15T15:13:05.92Z" },
+    { url = "https://files.pythonhosted.org/packages/71/0b/d3bcbbc259fcced5fb67c5d78f6e7ee965f49760c14afd931e9e663a83b2/coverage-7.11.0-cp312-cp312-manylinux1_x86_64.manylinux_2_28_x86_64.manylinux_2_5_x86_64.whl", hash = "sha256:16ce17ceb5d211f320b62df002fa7016b7442ea0fd260c11cec8ce7730954893", size = 250573, upload-time = "2025-10-15T15:13:07.471Z" },
+    { url = "https://files.pythonhosted.org/packages/58/8d/b0ff3641a320abb047258d36ed1c21d16be33beed4152628331a1baf3365/coverage-7.11.0-cp312-cp312-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:80027673e9d0bd6aef86134b0771845e2da85755cf686e7c7c59566cf5a89115", size = 251706, upload-time = "2025-10-15T15:13:09.4Z" },
+    { url = "https://files.pythonhosted.org/packages/59/c8/5a586fe8c7b0458053d9c687f5cff515a74b66c85931f7fe17a1c958b4ac/coverage-7.11.0-cp312-cp312-manylinux_2_31_riscv64.manylinux_2_39_riscv64.whl", hash = "sha256:4d3ffa07a08657306cd2215b0da53761c4d73cb54d9143b9303a6481ec0cd415", size = 248221, upload-time = "2025-10-15T15:13:10.964Z" },
+    { url = "https://files.pythonhosted.org/packages/d0/ff/3a25e3132804ba44cfa9a778cdf2b73dbbe63ef4b0945e39602fc896ba52/coverage-7.11.0-cp312-cp312-musllinux_1_2_aarch64.whl", hash = "sha256:a3b6a5f8b2524fd6c1066bc85bfd97e78709bb5e37b5b94911a6506b65f47186", size = 249624, upload-time = "2025-10-15T15:13:12.5Z" },
+    { url = "https://files.pythonhosted.org/packages/c5/12/ff10c8ce3895e1b17a73485ea79ebc1896a9e466a9d0f4aef63e0d17b718/coverage-7.11.0-cp312-cp312-musllinux_1_2_i686.whl", hash = "sha256:fcc0a4aa589de34bc56e1a80a740ee0f8c47611bdfb28cd1849de60660f3799d", size = 247744, upload-time = "2025-10-15T15:13:14.554Z" },
+    { url = "https://files.pythonhosted.org/packages/16/02/d500b91f5471b2975947e0629b8980e5e90786fe316b6d7299852c1d793d/coverage-7.11.0-cp312-cp312-musllinux_1_2_riscv64.whl", hash = "sha256:dba82204769d78c3fd31b35c3d5f46e06511936c5019c39f98320e05b08f794d", size = 247325, upload-time = "2025-10-15T15:13:16.438Z" },
+    { url = "https://files.pythonhosted.org/packages/77/11/dee0284fbbd9cd64cfce806b827452c6df3f100d9e66188e82dfe771d4af/coverage-7.11.0-cp312-cp312-musllinux_1_2_x86_64.whl", hash = "sha256:81b335f03ba67309a95210caf3eb43bd6fe75a4e22ba653ef97b4696c56c7ec2", size = 249180, upload-time = "2025-10-15T15:13:17.959Z" },
+    { url = "https://files.pythonhosted.org/packages/59/1b/cdf1def928f0a150a057cab03286774e73e29c2395f0d30ce3d9e9f8e697/coverage-7.11.0-cp312-cp312-win32.whl", hash = "sha256:037b2d064c2f8cc8716fe4d39cb705779af3fbf1ba318dc96a1af858888c7bb5", size = 218479, upload-time = "2025-10-15T15:13:19.608Z" },
+    { url = "https://files.pythonhosted.org/packages/ff/55/e5884d55e031da9c15b94b90a23beccc9d6beee65e9835cd6da0a79e4f3a/coverage-7.11.0-cp312-cp312-win_amd64.whl", hash = "sha256:d66c0104aec3b75e5fd897e7940188ea1892ca1d0235316bf89286d6a22568c0", size = 219290, upload-time = "2025-10-15T15:13:21.593Z" },
+    { url = "https://files.pythonhosted.org/packages/23/a8/faa930cfc71c1d16bc78f9a19bb73700464f9c331d9e547bfbc1dbd3a108/coverage-7.11.0-cp312-cp312-win_arm64.whl", hash = "sha256:d91ebeac603812a09cf6a886ba6e464f3bbb367411904ae3790dfe28311b15ad", size = 217924, upload-time = "2025-10-15T15:13:23.39Z" },
+    { url = "https://files.pythonhosted.org/packages/60/7f/85e4dfe65e400645464b25c036a26ac226cf3a69d4a50c3934c532491cdd/coverage-7.11.0-cp313-cp313-macosx_10_13_x86_64.whl", hash = "sha256:cc3f49e65ea6e0d5d9bd60368684fe52a704d46f9e7fc413918f18d046ec40e1", size = 216129, upload-time = "2025-10-15T15:13:25.371Z" },
+    { url = "https://files.pythonhosted.org/packages/96/5d/dc5fa98fea3c175caf9d360649cb1aa3715e391ab00dc78c4c66fabd7356/coverage-7.11.0-cp313-cp313-macosx_11_0_arm64.whl", hash = "sha256:f39ae2f63f37472c17b4990f794035c9890418b1b8cca75c01193f3c8d3e01be", size = 216380, upload-time = "2025-10-15T15:13:26.976Z" },
+    { url = "https://files.pythonhosted.org/packages/b2/f5/3da9cc9596708273385189289c0e4d8197d37a386bdf17619013554b3447/coverage-7.11.0-cp313-cp313-manylinux1_i686.manylinux_2_28_i686.manylinux_2_5_i686.whl", hash = "sha256:7db53b5cdd2917b6eaadd0b1251cf4e7d96f4a8d24e174bdbdf2f65b5ea7994d", size = 247375, upload-time = "2025-10-15T15:13:28.923Z" },
+    { url = "https://files.pythonhosted.org/packages/65/6c/f7f59c342359a235559d2bc76b0c73cfc4bac7d61bb0df210965cb1ecffd/coverage-7.11.0-cp313-cp313-manylinux1_x86_64.manylinux_2_28_x86_64.manylinux_2_5_x86_64.whl", hash = "sha256:10ad04ac3a122048688387828b4537bc9cf60c0bf4869c1e9989c46e45690b82", size = 249978, upload-time = "2025-10-15T15:13:30.525Z" },
+    { url = "https://files.pythonhosted.org/packages/e7/8c/042dede2e23525e863bf1ccd2b92689692a148d8b5fd37c37899ba882645/coverage-7.11.0-cp313-cp313-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:4036cc9c7983a2b1f2556d574d2eb2154ac6ed55114761685657e38782b23f52", size = 251253, upload-time = "2025-10-15T15:13:32.174Z" },
+    { url = "https://files.pythonhosted.org/packages/7b/a9/3c58df67bfa809a7bddd786356d9c5283e45d693edb5f3f55d0986dd905a/coverage-7.11.0-cp313-cp313-manylinux_2_31_riscv64.manylinux_2_39_riscv64.whl", hash = "sha256:7ab934dd13b1c5e94b692b1e01bd87e4488cb746e3a50f798cb9464fd128374b", size = 247591, upload-time = "2025-10-15T15:13:34.147Z" },
+    { url = "https://files.pythonhosted.org/packages/26/5b/c7f32efd862ee0477a18c41e4761305de6ddd2d49cdeda0c1116227570fd/coverage-7.11.0-cp313-cp313-musllinux_1_2_aarch64.whl", hash = "sha256:59a6e5a265f7cfc05f76e3bb53eca2e0dfe90f05e07e849930fecd6abb8f40b4", size = 249411, upload-time = "2025-10-15T15:13:38.425Z" },
+    { url = "https://files.pythonhosted.org/packages/76/b5/78cb4f1e86c1611431c990423ec0768122905b03837e1b4c6a6f388a858b/coverage-7.11.0-cp313-cp313-musllinux_1_2_i686.whl", hash = "sha256:df01d6c4c81e15a7c88337b795bb7595a8596e92310266b5072c7e301168efbd", size = 247303, upload-time = "2025-10-15T15:13:40.464Z" },
+    { url = "https://files.pythonhosted.org/packages/87/c9/23c753a8641a330f45f221286e707c427e46d0ffd1719b080cedc984ec40/coverage-7.11.0-cp313-cp313-musllinux_1_2_riscv64.whl", hash = "sha256:8c934bd088eed6174210942761e38ee81d28c46de0132ebb1801dbe36a390dcc", size = 247157, upload-time = "2025-10-15T15:13:42.087Z" },
+    { url = "https://files.pythonhosted.org/packages/c5/42/6e0cc71dc8a464486e944a4fa0d85bdec031cc2969e98ed41532a98336b9/coverage-7.11.0-cp313-cp313-musllinux_1_2_x86_64.whl", hash = "sha256:5a03eaf7ec24078ad64a07f02e30060aaf22b91dedf31a6b24d0d98d2bba7f48", size = 248921, upload-time = "2025-10-15T15:13:43.715Z" },
+    { url = "https://files.pythonhosted.org/packages/e8/1c/743c2ef665e6858cccb0f84377dfe3a4c25add51e8c7ef19249be92465b6/coverage-7.11.0-cp313-cp313-win32.whl", hash = "sha256:695340f698a5f56f795b2836abe6fb576e7c53d48cd155ad2f80fd24bc63a040", size = 218526, upload-time = "2025-10-15T15:13:45.336Z" },
+    { url = "https://files.pythonhosted.org/packages/ff/d5/226daadfd1bf8ddbccefbd3aa3547d7b960fb48e1bdac124e2dd13a2b71a/coverage-7.11.0-cp313-cp313-win_amd64.whl", hash = "sha256:2727d47fce3ee2bac648528e41455d1b0c46395a087a229deac75e9f88ba5a05", size = 219317, upload-time = "2025-10-15T15:13:47.401Z" },
+    { url = "https://files.pythonhosted.org/packages/97/54/47db81dcbe571a48a298f206183ba8a7ba79200a37cd0d9f4788fcd2af4a/coverage-7.11.0-cp313-cp313-win_arm64.whl", hash = "sha256:0efa742f431529699712b92ecdf22de8ff198df41e43aeaaadf69973eb93f17a", size = 217948, upload-time = "2025-10-15T15:13:49.096Z" },
+    { url = "https://files.pythonhosted.org/packages/e5/8b/cb68425420154e7e2a82fd779a8cc01549b6fa83c2ad3679cd6c088ebd07/coverage-7.11.0-cp313-cp313t-macosx_10_13_x86_64.whl", hash = "sha256:587c38849b853b157706407e9ebdca8fd12f45869edb56defbef2daa5fb0812b", size = 216837, upload-time = "2025-10-15T15:13:51.09Z" },
+    { url = "https://files.pythonhosted.org/packages/33/55/9d61b5765a025685e14659c8d07037247de6383c0385757544ffe4606475/coverage-7.11.0-cp313-cp313t-macosx_11_0_arm64.whl", hash = "sha256:b971bdefdd75096163dd4261c74be813c4508477e39ff7b92191dea19f24cd37", size = 217061, upload-time = "2025-10-15T15:13:52.747Z" },
+    { url = "https://files.pythonhosted.org/packages/52/85/292459c9186d70dcec6538f06ea251bc968046922497377bf4a1dc9a71de/coverage-7.11.0-cp313-cp313t-manylinux1_i686.manylinux_2_28_i686.manylinux_2_5_i686.whl", hash = "sha256:269bfe913b7d5be12ab13a95f3a76da23cf147be7fa043933320ba5625f0a8de", size = 258398, upload-time = "2025-10-15T15:13:54.45Z" },
+    { url = "https://files.pythonhosted.org/packages/1f/e2/46edd73fb8bf51446c41148d81944c54ed224854812b6ca549be25113ee0/coverage-7.11.0-cp313-cp313t-manylinux1_x86_64.manylinux_2_28_x86_64.manylinux_2_5_x86_64.whl", hash = "sha256:dadbcce51a10c07b7c72b0ce4a25e4b6dcb0c0372846afb8e5b6307a121eb99f", size = 260574, upload-time = "2025-10-15T15:13:56.145Z" },
+    { url = "https://files.pythonhosted.org/packages/07/5e/1df469a19007ff82e2ca8fe509822820a31e251f80ee7344c34f6cd2ec43/coverage-7.11.0-cp313-cp313t-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:9ed43fa22c6436f7957df036331f8fe4efa7af132054e1844918866cd228af6c", size = 262797, upload-time = "2025-10-15T15:13:58.635Z" },
+    { url = "https://files.pythonhosted.org/packages/f9/50/de216b31a1434b94d9b34a964c09943c6be45069ec704bfc379d8d89a649/coverage-7.11.0-cp313-cp313t-manylinux_2_31_riscv64.manylinux_2_39_riscv64.whl", hash = "sha256:9516add7256b6713ec08359b7b05aeff8850c98d357784c7205b2e60aa2513fa", size = 257361, upload-time = "2025-10-15T15:14:00.409Z" },
+    { url = "https://files.pythonhosted.org/packages/82/1e/3f9f8344a48111e152e0fd495b6fff13cc743e771a6050abf1627a7ba918/coverage-7.11.0-cp313-cp313t-musllinux_1_2_aarch64.whl", hash = "sha256:eb92e47c92fcbcdc692f428da67db33337fa213756f7adb6a011f7b5a7a20740", size = 260349, upload-time = "2025-10-15T15:14:02.188Z" },
+    { url = "https://files.pythonhosted.org/packages/65/9b/3f52741f9e7d82124272f3070bbe316006a7de1bad1093f88d59bfc6c548/coverage-7.11.0-cp313-cp313t-musllinux_1_2_i686.whl", hash = "sha256:d06f4fc7acf3cabd6d74941d53329e06bab00a8fe10e4df2714f0b134bfc64ef", size = 258114, upload-time = "2025-10-15T15:14:03.907Z" },
+    { url = "https://files.pythonhosted.org/packages/0b/8b/918f0e15f0365d50d3986bbd3338ca01178717ac5678301f3f547b6619e6/coverage-7.11.0-cp313-cp313t-musllinux_1_2_riscv64.whl", hash = "sha256:6fbcee1a8f056af07ecd344482f711f563a9eb1c2cad192e87df00338ec3cdb0", size = 256723, upload-time = "2025-10-15T15:14:06.324Z" },
+    { url = "https://files.pythonhosted.org/packages/44/9e/7776829f82d3cf630878a7965a7d70cc6ca94f22c7d20ec4944f7148cb46/coverage-7.11.0-cp313-cp313t-musllinux_1_2_x86_64.whl", hash = "sha256:dbbf012be5f32533a490709ad597ad8a8ff80c582a95adc8d62af664e532f9ca", size = 259238, upload-time = "2025-10-15T15:14:08.002Z" },
+    { url = "https://files.pythonhosted.org/packages/9a/b8/49cf253e1e7a3bedb85199b201862dd7ca4859f75b6cf25ffa7298aa0760/coverage-7.11.0-cp313-cp313t-win32.whl", hash = "sha256:cee6291bb4fed184f1c2b663606a115c743df98a537c969c3c64b49989da96c2", size = 219180, upload-time = "2025-10-15T15:14:09.786Z" },
+    { url = "https://files.pythonhosted.org/packages/ac/e1/1a541703826be7ae2125a0fb7f821af5729d56bb71e946e7b933cc7a89a4/coverage-7.11.0-cp313-cp313t-win_amd64.whl", hash = "sha256:a386c1061bf98e7ea4758e4313c0ab5ecf57af341ef0f43a0bf26c2477b5c268", size = 220241, upload-time = "2025-10-15T15:14:11.471Z" },
+    { url = "https://files.pythonhosted.org/packages/d5/d1/5ee0e0a08621140fd418ec4020f595b4d52d7eb429ae6a0c6542b4ba6f14/coverage-7.11.0-cp313-cp313t-win_arm64.whl", hash = "sha256:f9ea02ef40bb83823b2b04964459d281688fe173e20643870bb5d2edf68bc836", size = 218510, upload-time = "2025-10-15T15:14:13.46Z" },
+    { url = "https://files.pythonhosted.org/packages/f4/06/e923830c1985ce808e40a3fa3eb46c13350b3224b7da59757d37b6ce12b8/coverage-7.11.0-cp314-cp314-macosx_10_13_x86_64.whl", hash = "sha256:c770885b28fb399aaf2a65bbd1c12bf6f307ffd112d6a76c5231a94276f0c497", size = 216110, upload-time = "2025-10-15T15:14:15.157Z" },
+    { url = "https://files.pythonhosted.org/packages/42/82/cdeed03bfead45203fb651ed756dfb5266028f5f939e7f06efac4041dad5/coverage-7.11.0-cp314-cp314-macosx_11_0_arm64.whl", hash = "sha256:a3d0e2087dba64c86a6b254f43e12d264b636a39e88c5cc0a01a7c71bcfdab7e", size = 216395, upload-time = "2025-10-15T15:14:16.863Z" },
+    { url = "https://files.pythonhosted.org/packages/fc/ba/e1c80caffc3199aa699813f73ff097bc2df7b31642bdbc7493600a8f1de5/coverage-7.11.0-cp314-cp314-manylinux1_i686.manylinux_2_28_i686.manylinux_2_5_i686.whl", hash = "sha256:73feb83bb41c32811973b8565f3705caf01d928d972b72042b44e97c71fd70d1", size = 247433, upload-time = "2025-10-15T15:14:18.589Z" },
+    { url = "https://files.pythonhosted.org/packages/80/c0/5b259b029694ce0a5bbc1548834c7ba3db41d3efd3474489d7efce4ceb18/coverage-7.11.0-cp314-cp314-manylinux1_x86_64.manylinux_2_28_x86_64.manylinux_2_5_x86_64.whl", hash = "sha256:c6f31f281012235ad08f9a560976cc2fc9c95c17604ff3ab20120fe480169bca", size = 249970, upload-time = "2025-10-15T15:14:20.307Z" },
+    { url = "https://files.pythonhosted.org/packages/8c/86/171b2b5e1aac7e2fd9b43f7158b987dbeb95f06d1fbecad54ad8163ae3e8/coverage-7.11.0-cp314-cp314-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:e9570ad567f880ef675673992222746a124b9595506826b210fbe0ce3f0499cd", size = 251324, upload-time = "2025-10-15T15:14:22.419Z" },
+    { url = "https://files.pythonhosted.org/packages/1a/7e/7e10414d343385b92024af3932a27a1caf75c6e27ee88ba211221ff1a145/coverage-7.11.0-cp314-cp314-manylinux_2_31_riscv64.manylinux_2_39_riscv64.whl", hash = "sha256:8badf70446042553a773547a61fecaa734b55dc738cacf20c56ab04b77425e43", size = 247445, upload-time = "2025-10-15T15:14:24.205Z" },
+    { url = "https://files.pythonhosted.org/packages/c4/3b/e4f966b21f5be8c4bf86ad75ae94efa0de4c99c7bbb8114476323102e345/coverage-7.11.0-cp314-cp314-musllinux_1_2_aarch64.whl", hash = "sha256:a09c1211959903a479e389685b7feb8a17f59ec5a4ef9afde7650bd5eabc2777", size = 249324, upload-time = "2025-10-15T15:14:26.234Z" },
+    { url = "https://files.pythonhosted.org/packages/00/a2/8479325576dfcd909244d0df215f077f47437ab852ab778cfa2f8bf4d954/coverage-7.11.0-cp314-cp314-musllinux_1_2_i686.whl", hash = "sha256:5ef83b107f50db3f9ae40f69e34b3bd9337456c5a7fe3461c7abf8b75dd666a2", size = 247261, upload-time = "2025-10-15T15:14:28.42Z" },
+    { url = "https://files.pythonhosted.org/packages/7b/d8/3a9e2db19d94d65771d0f2e21a9ea587d11b831332a73622f901157cc24b/coverage-7.11.0-cp314-cp314-musllinux_1_2_riscv64.whl", hash = "sha256:f91f927a3215b8907e214af77200250bb6aae36eca3f760f89780d13e495388d", size = 247092, upload-time = "2025-10-15T15:14:30.784Z" },
+    { url = "https://files.pythonhosted.org/packages/b3/b1/bbca3c472544f9e2ad2d5116b2379732957048be4b93a9c543fcd0207e5f/coverage-7.11.0-cp314-cp314-musllinux_1_2_x86_64.whl", hash = "sha256:cdbcd376716d6b7fbfeedd687a6c4be019c5a5671b35f804ba76a4c0a778cba4", size = 248755, upload-time = "2025-10-15T15:14:32.585Z" },
+    { url = "https://files.pythonhosted.org/packages/89/49/638d5a45a6a0f00af53d6b637c87007eb2297042186334e9923a61aa8854/coverage-7.11.0-cp314-cp314-win32.whl", hash = "sha256:bab7ec4bb501743edc63609320aaec8cd9188b396354f482f4de4d40a9d10721", size = 218793, upload-time = "2025-10-15T15:14:34.972Z" },
+    { url = "https://files.pythonhosted.org/packages/30/cc/b675a51f2d068adb3cdf3799212c662239b0ca27f4691d1fff81b92ea850/coverage-7.11.0-cp314-cp314-win_amd64.whl", hash = "sha256:3d4ba9a449e9364a936a27322b20d32d8b166553bfe63059bd21527e681e2fad", size = 219587, upload-time = "2025-10-15T15:14:37.047Z" },
+    { url = "https://files.pythonhosted.org/packages/93/98/5ac886876026de04f00820e5094fe22166b98dcb8b426bf6827aaf67048c/coverage-7.11.0-cp314-cp314-win_arm64.whl", hash = "sha256:ce37f215223af94ef0f75ac68ea096f9f8e8c8ec7d6e8c346ee45c0d363f0479", size = 218168, upload-time = "2025-10-15T15:14:38.861Z" },
+    { url = "https://files.pythonhosted.org/packages/14/d1/b4145d35b3e3ecf4d917e97fc8895bcf027d854879ba401d9ff0f533f997/coverage-7.11.0-cp314-cp314t-macosx_10_13_x86_64.whl", hash = "sha256:f413ce6e07e0d0dc9c433228727b619871532674b45165abafe201f200cc215f", size = 216850, upload-time = "2025-10-15T15:14:40.651Z" },
+    { url = "https://files.pythonhosted.org/packages/ca/d1/7f645fc2eccd318369a8a9948acc447bb7c1ade2911e31d3c5620544c22b/coverage-7.11.0-cp314-cp314t-macosx_11_0_arm64.whl", hash = "sha256:05791e528a18f7072bf5998ba772fe29db4da1234c45c2087866b5ba4dea710e", size = 217071, upload-time = "2025-10-15T15:14:42.755Z" },
+    { url = "https://files.pythonhosted.org/packages/54/7d/64d124649db2737ceced1dfcbdcb79898d5868d311730f622f8ecae84250/coverage-7.11.0-cp314-cp314t-manylinux1_i686.manylinux_2_28_i686.manylinux_2_5_i686.whl", hash = "sha256:cacb29f420cfeb9283b803263c3b9a068924474ff19ca126ba9103e1278dfa44", size = 258570, upload-time = "2025-10-15T15:14:44.542Z" },
+    { url = "https://files.pythonhosted.org/packages/6c/3f/6f5922f80dc6f2d8b2c6f974835c43f53eb4257a7797727e6ca5b7b2ec1f/coverage-7.11.0-cp314-cp314t-manylinux1_x86_64.manylinux_2_28_x86_64.manylinux_2_5_x86_64.whl", hash = "sha256:314c24e700d7027ae3ab0d95fbf8d53544fca1f20345fd30cd219b737c6e58d3", size = 260738, upload-time = "2025-10-15T15:14:46.436Z" },
+    { url = "https://files.pythonhosted.org/packages/0e/5f/9e883523c4647c860b3812b417a2017e361eca5b635ee658387dc11b13c1/coverage-7.11.0-cp314-cp314t-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:630d0bd7a293ad2fc8b4b94e5758c8b2536fdf36c05f1681270203e463cbfa9b", size = 262994, upload-time = "2025-10-15T15:14:48.3Z" },
+    { url = "https://files.pythonhosted.org/packages/07/bb/43b5a8e94c09c8bf51743ffc65c4c841a4ca5d3ed191d0a6919c379a1b83/coverage-7.11.0-cp314-cp314t-manylinux_2_31_riscv64.manylinux_2_39_riscv64.whl", hash = "sha256:e89641f5175d65e2dbb44db15fe4ea48fade5d5bbb9868fdc2b4fce22f4a469d", size = 257282, upload-time = "2025-10-15T15:14:50.236Z" },
+    { url = "https://files.pythonhosted.org/packages/aa/e5/0ead8af411411330b928733e1d201384b39251a5f043c1612970310e8283/coverage-7.11.0-cp314-cp314t-musllinux_1_2_aarch64.whl", hash = "sha256:c9f08ea03114a637dab06cedb2e914da9dc67fa52c6015c018ff43fdde25b9c2", size = 260430, upload-time = "2025-10-15T15:14:52.413Z" },
+    { url = "https://files.pythonhosted.org/packages/ae/66/03dd8bb0ba5b971620dcaac145461950f6d8204953e535d2b20c6b65d729/coverage-7.11.0-cp314-cp314t-musllinux_1_2_i686.whl", hash = "sha256:ce9f3bde4e9b031eaf1eb61df95c1401427029ea1bfddb8621c1161dcb0fa02e", size = 258190, upload-time = "2025-10-15T15:14:54.268Z" },
+    { url = "https://files.pythonhosted.org/packages/45/ae/28a9cce40bf3174426cb2f7e71ee172d98e7f6446dff936a7ccecee34b14/coverage-7.11.0-cp314-cp314t-musllinux_1_2_riscv64.whl", hash = "sha256:e4dc07e95495923d6fd4d6c27bf70769425b71c89053083843fd78f378558996", size = 256658, upload-time = "2025-10-15T15:14:56.436Z" },
+    { url = "https://files.pythonhosted.org/packages/5c/7c/3a44234a8599513684bfc8684878fd7b126c2760f79712bb78c56f19efc4/coverage-7.11.0-cp314-cp314t-musllinux_1_2_x86_64.whl", hash = "sha256:424538266794db2861db4922b05d729ade0940ee69dcf0591ce8f69784db0e11", size = 259342, upload-time = "2025-10-15T15:14:58.538Z" },
+    { url = "https://files.pythonhosted.org/packages/e1/e6/0108519cba871af0351725ebdb8660fd7a0fe2ba3850d56d32490c7d9b4b/coverage-7.11.0-cp314-cp314t-win32.whl", hash = "sha256:4c1eeb3fb8eb9e0190bebafd0462936f75717687117339f708f395fe455acc73", size = 219568, upload-time = "2025-10-15T15:15:00.382Z" },
+    { url = "https://files.pythonhosted.org/packages/c9/76/44ba876e0942b4e62fdde23ccb029ddb16d19ba1bef081edd00857ba0b16/coverage-7.11.0-cp314-cp314t-win_amd64.whl", hash = "sha256:b56efee146c98dbf2cf5cffc61b9829d1e94442df4d7398b26892a53992d3547", size = 220687, upload-time = "2025-10-15T15:15:02.322Z" },
+    { url = "https://files.pythonhosted.org/packages/b9/0c/0df55ecb20d0d0ed5c322e10a441775e1a3a5d78c60f0c4e1abfe6fcf949/coverage-7.11.0-cp314-cp314t-win_arm64.whl", hash = "sha256:b5c2705afa83f49bd91962a4094b6b082f94aef7626365ab3f8f4bd159c5acf3", size = 218711, upload-time = "2025-10-15T15:15:04.575Z" },
+    { url = "https://files.pythonhosted.org/packages/5f/04/642c1d8a448ae5ea1369eac8495740a79eb4e581a9fb0cbdce56bbf56da1/coverage-7.11.0-py3-none-any.whl", hash = "sha256:4b7589765348d78fb4e5fb6ea35d07564e387da2fc5efff62e0222971f155f68", size = 207761, upload-time = "2025-10-15T15:15:06.439Z" },
+]
+
+[package.optional-dependencies]
+toml = [
+    { name = "tomli", marker = "python_full_version <= '3.11'" },
+]
+
+[[package]]
+name = "distlib"
+version = "0.4.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/96/8e/709914eb2b5749865801041647dc7f4e6d00b549cfe88b65ca192995f07c/distlib-0.4.0.tar.gz", hash = "sha256:feec40075be03a04501a973d81f633735b4b69f98b05450592310c0f401a4e0d", size = 614605, upload-time = "2025-07-17T16:52:00.465Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/33/6b/e0547afaf41bf2c42e52430072fa5658766e3d65bd4b03a563d1b6336f57/distlib-0.4.0-py2.py3-none-any.whl", hash = "sha256:9659f7d87e46584a30b5780e43ac7a2143098441670ff0a49d5f9034c54a6c16", size = 469047, upload-time = "2025-07-17T16:51:58.613Z" },
+]
+
+[[package]]
+name = "duckdb"
+version = "1.4.1"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/ea/e7/21cf50a3d52ffceee1f0bcc3997fa96a5062e6bab705baee4f6c4e33cce5/duckdb-1.4.1.tar.gz", hash = "sha256:f903882f045d057ebccad12ac69975952832edfe133697694854bb784b8d6c76", size = 18461687, upload-time = "2025-10-07T10:37:28.605Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/d9/52/606f13fa9669a24166d2fe523e28982d8ef9039874b4de774255c7806d1f/duckdb-1.4.1-cp311-cp311-macosx_10_9_universal2.whl", hash = "sha256:605d563c1d5203ca992497cd33fb386ac3d533deca970f9dcf539f62a34e22a9", size = 29065894, upload-time = "2025-10-07T10:36:29.837Z" },
+    { url = "https://files.pythonhosted.org/packages/84/57/138241952ece868b9577e607858466315bed1739e1fbb47205df4dfdfd88/duckdb-1.4.1-cp311-cp311-macosx_10_9_x86_64.whl", hash = "sha256:d3305c7c4b70336171de7adfdb50431f23671c000f11839b580c4201d9ce6ef5", size = 16163720, upload-time = "2025-10-07T10:36:32.241Z" },
+    { url = "https://files.pythonhosted.org/packages/a3/81/afa3a0a78498a6f4acfea75c48a70c5082032d9ac87822713d7c2d164af1/duckdb-1.4.1-cp311-cp311-macosx_11_0_arm64.whl", hash = "sha256:a063d6febbe34b32f1ad2e68822db4d0e4b1102036f49aaeeb22b844427a75df", size = 13756223, upload-time = "2025-10-07T10:36:34.673Z" },
+    { url = "https://files.pythonhosted.org/packages/47/dd/5f6064fbd9248e37a3e806a244f81e0390ab8f989d231b584fb954f257fc/duckdb-1.4.1-cp311-cp311-manylinux_2_27_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:d1ffcaaf74f7d1df3684b54685cbf8d3ce732781c541def8e1ced304859733ae", size = 18487022, upload-time = "2025-10-07T10:36:36.759Z" },
+    { url = "https://files.pythonhosted.org/packages/a1/10/b54969a1c42fd9344ad39228d671faceb8aa9f144b67cd9531a63551757f/duckdb-1.4.1-cp311-cp311-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:685d3d1599dc08160e0fa0cf09e93ac4ff8b8ed399cb69f8b5391cd46b5b207c", size = 20491004, upload-time = "2025-10-07T10:36:39.318Z" },
+    { url = "https://files.pythonhosted.org/packages/ed/d5/7332ae8f804869a4e895937821b776199a283f8d9fc775fd3ae5a0558099/duckdb-1.4.1-cp311-cp311-win_amd64.whl", hash = "sha256:78f1d28a15ae73bd449c43f80233732adffa49be1840a32de8f1a6bb5b286764", size = 12327619, upload-time = "2025-10-07T10:36:41.509Z" },
+    { url = "https://files.pythonhosted.org/packages/0e/6c/906a3fe41cd247b5638866fc1245226b528de196588802d4df4df1e6e819/duckdb-1.4.1-cp312-cp312-macosx_10_13_universal2.whl", hash = "sha256:cd1765a7d180b7482874586859fc23bc9969d7d6c96ced83b245e6c6f49cde7f", size = 29076820, upload-time = "2025-10-07T10:36:43.782Z" },
+    { url = "https://files.pythonhosted.org/packages/66/c7/01dd33083f01f618c2a29f6dd068baf16945b8cbdb132929d3766610bbbb/duckdb-1.4.1-cp312-cp312-macosx_10_13_x86_64.whl", hash = "sha256:8ed7a86725185470953410823762956606693c0813bb64e09c7d44dbd9253a64", size = 16167558, upload-time = "2025-10-07T10:36:46.003Z" },
+    { url = "https://files.pythonhosted.org/packages/81/e2/f983b4b7ae1dfbdd2792dd31dee9a0d35f88554452cbfc6c9d65e22fdfa9/duckdb-1.4.1-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:8a189bdfc64cfb9cc1adfbe4f2dcfde0a4992ec08505ad8ce33c886e4813f0bf", size = 13762226, upload-time = "2025-10-07T10:36:48.55Z" },
+    { url = "https://files.pythonhosted.org/packages/ed/34/fb69a7be19b90f573b3cc890961be7b11870b77514769655657514f10a98/duckdb-1.4.1-cp312-cp312-manylinux_2_27_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:a9090089b6486f7319c92acdeed8acda022d4374032d78a465956f50fc52fabf", size = 18500901, upload-time = "2025-10-07T10:36:52.445Z" },
+    { url = "https://files.pythonhosted.org/packages/e4/a5/1395d7b49d5589e85da9a9d7ffd8b50364c9d159c2807bef72d547f0ad1e/duckdb-1.4.1-cp312-cp312-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:142552ea3e768048e0e8c832077a545ca07792631c59edaee925e3e67401c2a0", size = 20514177, upload-time = "2025-10-07T10:36:55.358Z" },
+    { url = "https://files.pythonhosted.org/packages/c0/21/08f10706d30252753349ec545833fc0cea67c11abd0b5223acf2827f1056/duckdb-1.4.1-cp312-cp312-win_amd64.whl", hash = "sha256:567f3b3a785a9e8650612461893c49ca799661d2345a6024dda48324ece89ded", size = 12336422, upload-time = "2025-10-07T10:36:57.521Z" },
+    { url = "https://files.pythonhosted.org/packages/d7/08/705988c33e38665c969f7876b3ca4328be578554aa7e3dc0f34158da3e64/duckdb-1.4.1-cp313-cp313-macosx_10_13_universal2.whl", hash = "sha256:46496a2518752ae0c6c5d75d4cdecf56ea23dd098746391176dd8e42cf157791", size = 29077070, upload-time = "2025-10-07T10:36:59.83Z" },
+    { url = "https://files.pythonhosted.org/packages/99/c5/7c9165f1e6b9069441bcda4da1e19382d4a2357783d37ff9ae238c5c41ac/duckdb-1.4.1-cp313-cp313-macosx_10_13_x86_64.whl", hash = "sha256:1c65ae7e9b541cea07d8075343bcfebdecc29a3c0481aa6078ee63d51951cfcd", size = 16167506, upload-time = "2025-10-07T10:37:02.24Z" },
+    { url = "https://files.pythonhosted.org/packages/38/46/267f4a570a0ee3ae6871ddc03435f9942884284e22a7ba9b7cb252ee69b6/duckdb-1.4.1-cp313-cp313-macosx_11_0_arm64.whl", hash = "sha256:598d1a314e34b65d9399ddd066ccce1eeab6a60a2ef5885a84ce5ed62dbaf729", size = 13762330, upload-time = "2025-10-07T10:37:04.581Z" },
+    { url = "https://files.pythonhosted.org/packages/15/7b/c4f272a40c36d82df20937d93a1780eb39ab0107fe42b62cba889151eab9/duckdb-1.4.1-cp313-cp313-manylinux_2_27_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:e2f16b8def782d484a9f035fc422bb6f06941ed0054b4511ddcdc514a7fb6a75", size = 18504687, upload-time = "2025-10-07T10:37:06.991Z" },
+    { url = "https://files.pythonhosted.org/packages/17/fc/9b958751f0116d7b0406406b07fa6f5a10c22d699be27826d0b896f9bf51/duckdb-1.4.1-cp313-cp313-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:a5a7d0aed068a5c33622a8848857947cab5cfb3f2a315b1251849bac2c74c492", size = 20513823, upload-time = "2025-10-07T10:37:09.349Z" },
+    { url = "https://files.pythonhosted.org/packages/30/79/4f544d73fcc0513b71296cb3ebb28a227d22e80dec27204977039b9fa875/duckdb-1.4.1-cp313-cp313-win_amd64.whl", hash = "sha256:280fd663dacdd12bb3c3bf41f3e5b2e5b95e00b88120afabb8b8befa5f335c6f", size = 12336460, upload-time = "2025-10-07T10:37:12.154Z" },
+]
+
+[[package]]
+name = "et-xmlfile"
+version = "2.0.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/d3/38/af70d7ab1ae9d4da450eeec1fa3918940a5fafb9055e934af8d6eb0c2313/et_xmlfile-2.0.0.tar.gz", hash = "sha256:dab3f4764309081ce75662649be815c4c9081e88f0837825f90fd28317d4da54", size = 17234, upload-time = "2024-10-25T17:25:40.039Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/c1/8b/5fe2cc11fee489817272089c4203e679c63b570a5aaeb18d852ae3cbba6a/et_xmlfile-2.0.0-py3-none-any.whl", hash = "sha256:7a91720bc756843502c3b7504c77b8fe44217c85c537d85037f0f536151b2caa", size = 18059, upload-time = "2024-10-25T17:25:39.051Z" },
+]
+
+[[package]]
+name = "fastexcel"
+version = "0.16.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/b0/7c/77fe2f25c4ff1c798b021cad7cddf00ff2a42118b9b59eec8ef5f0d5b5cf/fastexcel-0.16.0.tar.gz", hash = "sha256:7f6597ee86e0cda296bcc620d20fcf2de9903f8d3b99b365b7f45248d535556d", size = 59038, upload-time = "2025-09-22T12:34:40.041Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/cc/44/2dc31ec48d8f63f1d93e11ef19636a442c39775d49f1472f4123a6b38c34/fastexcel-0.16.0-cp39-abi3-macosx_10_12_x86_64.whl", hash = "sha256:48c56a501abc1cf0890294527dc924cb0d919fd5095f684ebcf52806135e9df8", size = 3061679, upload-time = "2025-09-22T12:34:35.542Z" },
+    { url = "https://files.pythonhosted.org/packages/e2/d8/ef4489cd00fe9fe52bef176ed32a8bb5837dd97518bb950bbd68f546ed1c/fastexcel-0.16.0-cp39-abi3-macosx_11_0_arm64.whl", hash = "sha256:bae61533745fae226ea19f6d198570d5c76a8de816e222ff717aff82d8d6e473", size = 2803453, upload-time = "2025-09-22T12:34:37.168Z" },
+    { url = "https://files.pythonhosted.org/packages/a1/cc/95cf27168d4b4fec3d2e404d70a0fb5d5b7a18872192c8cd8b3a272d31dc/fastexcel-0.16.0-cp39-abi3-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:ec1c56b9b3b7b7ff2bde64dbe0e378a707287aff9deeb71ff6d0f8c3b7d24e34", size = 3130831, upload-time = "2025-09-22T12:34:32.22Z" },
+    { url = "https://files.pythonhosted.org/packages/c8/23/02012e9c7e584e6f85e1e7078beff3dc56aaad2e51b0a33bbcaa1dc2aa6e/fastexcel-0.16.0-cp39-abi3-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:e1059eac593f4b92843ac9d10901677cccc2a8152c67e315c9dfbd7ce7c722e7", size = 3331124, upload-time = "2025-09-22T12:34:33.974Z" },
+    { url = "https://files.pythonhosted.org/packages/9c/2e/805c2d0e799710e4937d084d9c37821bafa129eda1de62c3279a042ca56d/fastexcel-0.16.0-cp39-abi3-win_amd64.whl", hash = "sha256:04c2b6fea7292e26d76a458f9095f4ec260c864c90be7a7161d20ca81cf77fd8", size = 2819876, upload-time = "2025-09-22T12:34:38.716Z" },
+]
+
+[[package]]
+name = "filelock"
+version = "3.20.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/58/46/0028a82567109b5ef6e4d2a1f04a583fb513e6cf9527fcdd09afd817deeb/filelock-3.20.0.tar.gz", hash = "sha256:711e943b4ec6be42e1d4e6690b48dc175c822967466bb31c0c293f34334c13f4", size = 18922, upload-time = "2025-10-08T18:03:50.056Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/76/91/7216b27286936c16f5b4d0c530087e4a54eead683e6b0b73dd0c64844af6/filelock-3.20.0-py3-none-any.whl", hash = "sha256:339b4732ffda5cd79b13f4e2711a31b0365ce445d95d243bb996273d072546a2", size = 16054, upload-time = "2025-10-08T18:03:48.35Z" },
+]
+
+[[package]]
+name = "google-api-core"
+version = "2.26.0"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "google-auth" },
+    { name = "googleapis-common-protos" },
+    { name = "proto-plus" },
+    { name = "protobuf" },
+    { name = "requests" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/32/ea/e7b6ac3c7b557b728c2d0181010548cbbdd338e9002513420c5a354fa8df/google_api_core-2.26.0.tar.gz", hash = "sha256:e6e6d78bd6cf757f4aee41dcc85b07f485fbb069d5daa3afb126defba1e91a62", size = 166369, upload-time = "2025-10-08T21:37:38.39Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/77/ad/f73cf9fe9bd95918502b270e3ddb8764e4c900b3bbd7782b90c56fac14bb/google_api_core-2.26.0-py3-none-any.whl", hash = "sha256:2b204bd0da2c81f918e3582c48458e24c11771f987f6258e6e227212af78f3ed", size = 162505, upload-time = "2025-10-08T21:37:36.651Z" },
+]
+
+[package.optional-dependencies]
+grpc = [
+    { name = "grpcio" },
+    { name = "grpcio-status" },
+]
+
+[[package]]
+name = "google-auth"
+version = "2.41.1"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "cachetools" },
+    { name = "pyasn1-modules" },
+    { name = "rsa" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/a8/af/5129ce5b2f9688d2fa49b463e544972a7c82b0fdb50980dafee92e121d9f/google_auth-2.41.1.tar.gz", hash = "sha256:b76b7b1f9e61f0cb7e88870d14f6a94aeef248959ef6992670efee37709cbfd2", size = 292284, upload-time = "2025-09-30T22:51:26.363Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/be/a4/7319a2a8add4cc352be9e3efeff5e2aacee917c85ca2fa1647e29089983c/google_auth-2.41.1-py2.py3-none-any.whl", hash = "sha256:754843be95575b9a19c604a848a41be03f7f2afd8c019f716dc1f51ee41c639d", size = 221302, upload-time = "2025-09-30T22:51:24.212Z" },
+]
+
+[[package]]
+name = "google-cloud-bigquery"
+version = "3.38.0"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "google-api-core", extra = ["grpc"] },
+    { name = "google-auth" },
+    { name = "google-cloud-core" },
+    { name = "google-resumable-media" },
+    { name = "packaging" },
+    { name = "python-dateutil" },
+    { name = "requests" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/07/b2/a17e40afcf9487e3d17db5e36728ffe75c8d5671c46f419d7b6528a5728a/google_cloud_bigquery-3.38.0.tar.gz", hash = "sha256:8afcb7116f5eac849097a344eb8bfda78b7cfaae128e60e019193dd483873520", size = 503666, upload-time = "2025-09-17T20:33:33.47Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/39/3c/c8cada9ec282b29232ed9aed5a0b5cca6cf5367cb2ffa8ad0d2583d743f1/google_cloud_bigquery-3.38.0-py3-none-any.whl", hash = "sha256:e06e93ff7b245b239945ef59cb59616057598d369edac457ebf292bd61984da6", size = 259257, upload-time = "2025-09-17T20:33:31.404Z" },
+]
+
+[[package]]
+name = "google-cloud-core"
+version = "2.4.3"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "google-api-core" },
+    { name = "google-auth" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/d6/b8/2b53838d2acd6ec6168fd284a990c76695e84c65deee79c9f3a4276f6b4f/google_cloud_core-2.4.3.tar.gz", hash = "sha256:1fab62d7102844b278fe6dead3af32408b1df3eb06f5c7e8634cbd40edc4da53", size = 35861, upload-time = "2025-03-10T21:05:38.948Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/40/86/bda7241a8da2d28a754aad2ba0f6776e35b67e37c36ae0c45d49370f1014/google_cloud_core-2.4.3-py2.py3-none-any.whl", hash = "sha256:5130f9f4c14b4fafdff75c79448f9495cfade0d8775facf1b09c3bf67e027f6e", size = 29348, upload-time = "2025-03-10T21:05:37.785Z" },
+]
+
+[[package]]
+name = "google-cloud-storage"
+version = "3.4.1"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "google-api-core" },
+    { name = "google-auth" },
+    { name = "google-cloud-core" },
+    { name = "google-crc32c" },
+    { name = "google-resumable-media" },
+    { name = "requests" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/bd/ef/7cefdca67a6c8b3af0ec38612f9e78e5a9f6179dd91352772ae1a9849246/google_cloud_storage-3.4.1.tar.gz", hash = "sha256:6f041a297e23a4b485fad8c305a7a6e6831855c208bcbe74d00332a909f82268", size = 17238203, upload-time = "2025-10-08T18:43:39.665Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/83/6e/b47d83d3a35231c6232566341b0355cce78fd4e6988a7343725408547b2c/google_cloud_storage-3.4.1-py3-none-any.whl", hash = "sha256:972764cc0392aa097be8f49a5354e22eb47c3f62370067fb1571ffff4a1c1189", size = 290142, upload-time = "2025-10-08T18:43:37.524Z" },
+]
+
+[[package]]
+name = "google-crc32c"
+version = "1.7.1"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/19/ae/87802e6d9f9d69adfaedfcfd599266bf386a54d0be058b532d04c794f76d/google_crc32c-1.7.1.tar.gz", hash = "sha256:2bff2305f98846f3e825dbeec9ee406f89da7962accdb29356e4eadc251bd472", size = 14495, upload-time = "2025-03-26T14:29:13.32Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/f7/94/220139ea87822b6fdfdab4fb9ba81b3fff7ea2c82e2af34adc726085bffc/google_crc32c-1.7.1-cp311-cp311-macosx_12_0_arm64.whl", hash = "sha256:6fbab4b935989e2c3610371963ba1b86afb09537fd0c633049be82afe153ac06", size = 30468, upload-time = "2025-03-26T14:32:52.215Z" },
+    { url = "https://files.pythonhosted.org/packages/94/97/789b23bdeeb9d15dc2904660463ad539d0318286d7633fe2760c10ed0c1c/google_crc32c-1.7.1-cp311-cp311-macosx_12_0_x86_64.whl", hash = "sha256:ed66cbe1ed9cbaaad9392b5259b3eba4a9e565420d734e6238813c428c3336c9", size = 30313, upload-time = "2025-03-26T14:57:38.758Z" },
+    { url = "https://files.pythonhosted.org/packages/81/b8/976a2b843610c211e7ccb3e248996a61e87dbb2c09b1499847e295080aec/google_crc32c-1.7.1-cp311-cp311-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:ee6547b657621b6cbed3562ea7826c3e11cab01cd33b74e1f677690652883e77", size = 33048, upload-time = "2025-03-26T14:41:30.679Z" },
+    { url = "https://files.pythonhosted.org/packages/c9/16/a3842c2cf591093b111d4a5e2bfb478ac6692d02f1b386d2a33283a19dc9/google_crc32c-1.7.1-cp311-cp311-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:d68e17bad8f7dd9a49181a1f5a8f4b251c6dbc8cc96fb79f1d321dfd57d66f53", size = 32669, upload-time = "2025-03-26T14:41:31.432Z" },
+    { url = "https://files.pythonhosted.org/packages/04/17/ed9aba495916fcf5fe4ecb2267ceb851fc5f273c4e4625ae453350cfd564/google_crc32c-1.7.1-cp311-cp311-win_amd64.whl", hash = "sha256:6335de12921f06e1f774d0dd1fbea6bf610abe0887a1638f64d694013138be5d", size = 33476, upload-time = "2025-03-26T14:29:10.211Z" },
+    { url = "https://files.pythonhosted.org/packages/dd/b7/787e2453cf8639c94b3d06c9d61f512234a82e1d12d13d18584bd3049904/google_crc32c-1.7.1-cp312-cp312-macosx_12_0_arm64.whl", hash = "sha256:2d73a68a653c57281401871dd4aeebbb6af3191dcac751a76ce430df4d403194", size = 30470, upload-time = "2025-03-26T14:34:31.655Z" },
+    { url = "https://files.pythonhosted.org/packages/ed/b4/6042c2b0cbac3ec3a69bb4c49b28d2f517b7a0f4a0232603c42c58e22b44/google_crc32c-1.7.1-cp312-cp312-macosx_12_0_x86_64.whl", hash = "sha256:22beacf83baaf59f9d3ab2bbb4db0fb018da8e5aebdce07ef9f09fce8220285e", size = 30315, upload-time = "2025-03-26T15:01:54.634Z" },
+    { url = "https://files.pythonhosted.org/packages/29/ad/01e7a61a5d059bc57b702d9ff6a18b2585ad97f720bd0a0dbe215df1ab0e/google_crc32c-1.7.1-cp312-cp312-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:19eafa0e4af11b0a4eb3974483d55d2d77ad1911e6cf6f832e1574f6781fd337", size = 33180, upload-time = "2025-03-26T14:41:32.168Z" },
+    { url = "https://files.pythonhosted.org/packages/3b/a5/7279055cf004561894ed3a7bfdf5bf90a53f28fadd01af7cd166e88ddf16/google_crc32c-1.7.1-cp312-cp312-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:b6d86616faaea68101195c6bdc40c494e4d76f41e07a37ffdef270879c15fb65", size = 32794, upload-time = "2025-03-26T14:41:33.264Z" },
+    { url = "https://files.pythonhosted.org/packages/0f/d6/77060dbd140c624e42ae3ece3df53b9d811000729a5c821b9fd671ceaac6/google_crc32c-1.7.1-cp312-cp312-win_amd64.whl", hash = "sha256:b7491bdc0c7564fcf48c0179d2048ab2f7c7ba36b84ccd3a3e1c3f7a72d3bba6", size = 33477, upload-time = "2025-03-26T14:29:10.94Z" },
+    { url = "https://files.pythonhosted.org/packages/8b/72/b8d785e9184ba6297a8620c8a37cf6e39b81a8ca01bb0796d7cbb28b3386/google_crc32c-1.7.1-cp313-cp313-macosx_12_0_arm64.whl", hash = "sha256:df8b38bdaf1629d62d51be8bdd04888f37c451564c2042d36e5812da9eff3c35", size = 30467, upload-time = "2025-03-26T14:36:06.909Z" },
+    { url = "https://files.pythonhosted.org/packages/34/25/5f18076968212067c4e8ea95bf3b69669f9fc698476e5f5eb97d5b37999f/google_crc32c-1.7.1-cp313-cp313-macosx_12_0_x86_64.whl", hash = "sha256:e42e20a83a29aa2709a0cf271c7f8aefaa23b7ab52e53b322585297bb94d4638", size = 30309, upload-time = "2025-03-26T15:06:15.318Z" },
+    { url = "https://files.pythonhosted.org/packages/92/83/9228fe65bf70e93e419f38bdf6c5ca5083fc6d32886ee79b450ceefd1dbd/google_crc32c-1.7.1-cp313-cp313-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:905a385140bf492ac300026717af339790921f411c0dfd9aa5a9e69a08ed32eb", size = 33133, upload-time = "2025-03-26T14:41:34.388Z" },
+    { url = "https://files.pythonhosted.org/packages/c3/ca/1ea2fd13ff9f8955b85e7956872fdb7050c4ace8a2306a6d177edb9cf7fe/google_crc32c-1.7.1-cp313-cp313-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:6b211ddaf20f7ebeec5c333448582c224a7c90a9d98826fbab82c0ddc11348e6", size = 32773, upload-time = "2025-03-26T14:41:35.19Z" },
+    { url = "https://files.pythonhosted.org/packages/89/32/a22a281806e3ef21b72db16f948cad22ec68e4bdd384139291e00ff82fe2/google_crc32c-1.7.1-cp313-cp313-win_amd64.whl", hash = "sha256:0f99eaa09a9a7e642a61e06742856eec8b19fc0037832e03f941fe7cf0c8e4db", size = 33475, upload-time = "2025-03-26T14:29:11.771Z" },
+    { url = "https://files.pythonhosted.org/packages/b8/c5/002975aff514e57fc084ba155697a049b3f9b52225ec3bc0f542871dd524/google_crc32c-1.7.1-cp313-cp313t-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:32d1da0d74ec5634a05f53ef7df18fc646666a25efaaca9fc7dcfd4caf1d98c3", size = 33243, upload-time = "2025-03-26T14:41:35.975Z" },
+    { url = "https://files.pythonhosted.org/packages/61/cb/c585282a03a0cea70fcaa1bf55d5d702d0f2351094d663ec3be1c6c67c52/google_crc32c-1.7.1-cp313-cp313t-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:e10554d4abc5238823112c2ad7e4560f96c7bf3820b202660373d769d9e6e4c9", size = 32870, upload-time = "2025-03-26T14:41:37.08Z" },
+    { url = "https://files.pythonhosted.org/packages/16/1b/1693372bf423ada422f80fd88260dbfd140754adb15cbc4d7e9a68b1cb8e/google_crc32c-1.7.1-pp311-pypy311_pp73-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:85fef7fae11494e747c9fd1359a527e5970fc9603c90764843caabd3a16a0a48", size = 28241, upload-time = "2025-03-26T14:41:45.898Z" },
+    { url = "https://files.pythonhosted.org/packages/fd/3c/2a19a60a473de48717b4efb19398c3f914795b64a96cf3fbe82588044f78/google_crc32c-1.7.1-pp311-pypy311_pp73-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:6efb97eb4369d52593ad6f75e7e10d053cf00c48983f7a973105bc70b0ac4d82", size = 28048, upload-time = "2025-03-26T14:41:46.696Z" },
+]
+
+[[package]]
+name = "google-resumable-media"
+version = "2.7.2"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "google-crc32c" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/58/5a/0efdc02665dca14e0837b62c8a1a93132c264bd02054a15abb2218afe0ae/google_resumable_media-2.7.2.tar.gz", hash = "sha256:5280aed4629f2b60b847b0d42f9857fd4935c11af266744df33d8074cae92fe0", size = 2163099, upload-time = "2024-08-07T22:20:38.555Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/82/35/b8d3baf8c46695858cb9d8835a53baa1eeb9906ddaf2f728a5f5b640fd1e/google_resumable_media-2.7.2-py2.py3-none-any.whl", hash = "sha256:3ce7551e9fe6d99e9a126101d2536612bb73486721951e9562fee0f90c6ababa", size = 81251, upload-time = "2024-08-07T22:20:36.409Z" },
+]
+
+[[package]]
+name = "googleapis-common-protos"
+version = "1.70.0"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "protobuf" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/39/24/33db22342cf4a2ea27c9955e6713140fedd51e8b141b5ce5260897020f1a/googleapis_common_protos-1.70.0.tar.gz", hash = "sha256:0e1b44e0ea153e6594f9f394fef15193a68aaaea2d843f83e2742717ca753257", size = 145903, upload-time = "2025-04-14T10:17:02.924Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/86/f1/62a193f0227cf15a920390abe675f386dec35f7ae3ffe6da582d3ade42c7/googleapis_common_protos-1.70.0-py3-none-any.whl", hash = "sha256:b8bfcca8c25a2bb253e0e0b0adaf8c00773e5e6af6fd92397576680b807e0fd8", size = 294530, upload-time = "2025-04-14T10:17:01.271Z" },
+]
+
+[[package]]
+name = "grpcio"
+version = "1.75.1"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "typing-extensions" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/9d/f7/8963848164c7604efb3a3e6ee457fdb3a469653e19002bd24742473254f8/grpcio-1.75.1.tar.gz", hash = "sha256:3e81d89ece99b9ace23a6916880baca613c03a799925afb2857887efa8b1b3d2", size = 12731327, upload-time = "2025-09-26T09:03:36.887Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/0c/3c/35ca9747473a306bfad0cee04504953f7098527cd112a4ab55c55af9e7bd/grpcio-1.75.1-cp311-cp311-linux_armv7l.whl", hash = "sha256:573855ca2e58e35032aff30bfbd1ee103fbcf4472e4b28d4010757700918e326", size = 5709761, upload-time = "2025-09-26T09:01:28.528Z" },
+    { url = "https://files.pythonhosted.org/packages/c9/2c/ecbcb4241e4edbe85ac2663f885726fea0e947767401288b50d8fdcb9200/grpcio-1.75.1-cp311-cp311-macosx_11_0_universal2.whl", hash = "sha256:6a4996a2c8accc37976dc142d5991adf60733e223e5c9a2219e157dc6a8fd3a2", size = 11496691, upload-time = "2025-09-26T09:01:31.214Z" },
+    { url = "https://files.pythonhosted.org/packages/81/40/bc07aee2911f0d426fa53fe636216100c31a8ea65a400894f280274cb023/grpcio-1.75.1-cp311-cp311-manylinux2014_aarch64.manylinux_2_17_aarch64.whl", hash = "sha256:b1ea1bbe77ecbc1be00af2769f4ae4a88ce93be57a4f3eebd91087898ed749f9", size = 6296084, upload-time = "2025-09-26T09:01:34.596Z" },
+    { url = "https://files.pythonhosted.org/packages/b8/d1/10c067f6c67396cbf46448b80f27583b5e8c4b46cdfbe18a2a02c2c2f290/grpcio-1.75.1-cp311-cp311-manylinux2014_i686.manylinux_2_17_i686.whl", hash = "sha256:e5b425aee54cc5e3e3c58f00731e8a33f5567965d478d516d35ef99fd648ab68", size = 6950403, upload-time = "2025-09-26T09:01:36.736Z" },
+    { url = "https://files.pythonhosted.org/packages/3f/42/5f628abe360b84dfe8dd8f32be6b0606dc31dc04d3358eef27db791ea4d5/grpcio-1.75.1-cp311-cp311-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:0049a7bf547dafaeeb1db17079ce79596c298bfe308fc084d023c8907a845b9a", size = 6470166, upload-time = "2025-09-26T09:01:39.474Z" },
+    { url = "https://files.pythonhosted.org/packages/c3/93/a24035080251324019882ee2265cfde642d6476c0cf8eb207fc693fcebdc/grpcio-1.75.1-cp311-cp311-musllinux_1_2_aarch64.whl", hash = "sha256:5b8ea230c7f77c0a1a3208a04a1eda164633fb0767b4cefd65a01079b65e5b1f", size = 7107828, upload-time = "2025-09-26T09:01:41.782Z" },
+    { url = "https://files.pythonhosted.org/packages/e4/f8/d18b984c1c9ba0318e3628dbbeb6af77a5007f02abc378c845070f2d3edd/grpcio-1.75.1-cp311-cp311-musllinux_1_2_i686.whl", hash = "sha256:36990d629c3c9fb41e546414e5af52d0a7af37ce7113d9682c46d7e2919e4cca", size = 8045421, upload-time = "2025-09-26T09:01:45.835Z" },
+    { url = "https://files.pythonhosted.org/packages/7e/b6/4bf9aacff45deca5eac5562547ed212556b831064da77971a4e632917da3/grpcio-1.75.1-cp311-cp311-musllinux_1_2_x86_64.whl", hash = "sha256:b10ad908118d38c2453ade7ff790e5bce36580c3742919007a2a78e3a1e521ca", size = 7503290, upload-time = "2025-09-26T09:01:49.28Z" },
+    { url = "https://files.pythonhosted.org/packages/3b/15/d8d69d10223cb54c887a2180bd29fe5fa2aec1d4995c8821f7aa6eaf72e4/grpcio-1.75.1-cp311-cp311-win32.whl", hash = "sha256:d6be2b5ee7bea656c954dcf6aa8093c6f0e6a3ef9945c99d99fcbfc88c5c0bfe", size = 3950631, upload-time = "2025-09-26T09:01:51.23Z" },
+    { url = "https://files.pythonhosted.org/packages/8a/40/7b8642d45fff6f83300c24eaac0380a840e5e7fe0e8d80afd31b99d7134e/grpcio-1.75.1-cp311-cp311-win_amd64.whl", hash = "sha256:61c692fb05956b17dd6d1ab480f7f10ad0536dba3bc8fd4e3c7263dc244ed772", size = 4646131, upload-time = "2025-09-26T09:01:53.266Z" },
+    { url = "https://files.pythonhosted.org/packages/3a/81/42be79e73a50aaa20af66731c2defeb0e8c9008d9935a64dd8ea8e8c44eb/grpcio-1.75.1-cp312-cp312-linux_armv7l.whl", hash = "sha256:7b888b33cd14085d86176b1628ad2fcbff94cfbbe7809465097aa0132e58b018", size = 5668314, upload-time = "2025-09-26T09:01:55.424Z" },
+    { url = "https://files.pythonhosted.org/packages/c5/a7/3686ed15822fedc58c22f82b3a7403d9faf38d7c33de46d4de6f06e49426/grpcio-1.75.1-cp312-cp312-macosx_11_0_universal2.whl", hash = "sha256:8775036efe4ad2085975531d221535329f5dac99b6c2a854a995456098f99546", size = 11476125, upload-time = "2025-09-26T09:01:57.927Z" },
+    { url = "https://files.pythonhosted.org/packages/14/85/21c71d674f03345ab183c634ecd889d3330177e27baea8d5d247a89b6442/grpcio-1.75.1-cp312-cp312-manylinux2014_aarch64.manylinux_2_17_aarch64.whl", hash = "sha256:bb658f703468d7fbb5dcc4037c65391b7dc34f808ac46ed9136c24fc5eeb041d", size = 6246335, upload-time = "2025-09-26T09:02:00.76Z" },
+    { url = "https://files.pythonhosted.org/packages/fd/db/3beb661bc56a385ae4fa6b0e70f6b91ac99d47afb726fe76aaff87ebb116/grpcio-1.75.1-cp312-cp312-manylinux2014_i686.manylinux_2_17_i686.whl", hash = "sha256:4b7177a1cdb3c51b02b0c0a256b0a72fdab719600a693e0e9037949efffb200b", size = 6916309, upload-time = "2025-09-26T09:02:02.894Z" },
+    { url = "https://files.pythonhosted.org/packages/1e/9c/eda9fe57f2b84343d44c1b66cf3831c973ba29b078b16a27d4587a1fdd47/grpcio-1.75.1-cp312-cp312-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:7d4fa6ccc3ec2e68a04f7b883d354d7fea22a34c44ce535a2f0c0049cf626ddf", size = 6435419, upload-time = "2025-09-26T09:02:05.055Z" },
+    { url = "https://files.pythonhosted.org/packages/c3/b8/090c98983e0a9d602e3f919a6e2d4e470a8b489452905f9a0fa472cac059/grpcio-1.75.1-cp312-cp312-musllinux_1_2_aarch64.whl", hash = "sha256:3d86880ecaeb5b2f0a8afa63824de93adb8ebe4e49d0e51442532f4e08add7d6", size = 7064893, upload-time = "2025-09-26T09:02:07.275Z" },
+    { url = "https://files.pythonhosted.org/packages/ec/c0/6d53d4dbbd00f8bd81571f5478d8a95528b716e0eddb4217cc7cb45aae5f/grpcio-1.75.1-cp312-cp312-musllinux_1_2_i686.whl", hash = "sha256:a8041d2f9e8a742aeae96f4b047ee44e73619f4f9d24565e84d5446c623673b6", size = 8011922, upload-time = "2025-09-26T09:02:09.527Z" },
+    { url = "https://files.pythonhosted.org/packages/f2/7c/48455b2d0c5949678d6982c3e31ea4d89df4e16131b03f7d5c590811cbe9/grpcio-1.75.1-cp312-cp312-musllinux_1_2_x86_64.whl", hash = "sha256:3652516048bf4c314ce12be37423c79829f46efffb390ad64149a10c6071e8de", size = 7466181, upload-time = "2025-09-26T09:02:12.279Z" },
+    { url = "https://files.pythonhosted.org/packages/fd/12/04a0e79081e3170b6124f8cba9b6275871276be06c156ef981033f691880/grpcio-1.75.1-cp312-cp312-win32.whl", hash = "sha256:44b62345d8403975513af88da2f3d5cc76f73ca538ba46596f92a127c2aea945", size = 3938543, upload-time = "2025-09-26T09:02:14.77Z" },
+    { url = "https://files.pythonhosted.org/packages/5f/d7/11350d9d7fb5adc73d2b0ebf6ac1cc70135577701e607407fe6739a90021/grpcio-1.75.1-cp312-cp312-win_amd64.whl", hash = "sha256:b1e191c5c465fa777d4cafbaacf0c01e0d5278022082c0abbd2ee1d6454ed94d", size = 4641938, upload-time = "2025-09-26T09:02:16.927Z" },
+    { url = "https://files.pythonhosted.org/packages/46/74/bac4ab9f7722164afdf263ae31ba97b8174c667153510322a5eba4194c32/grpcio-1.75.1-cp313-cp313-linux_armv7l.whl", hash = "sha256:3bed22e750d91d53d9e31e0af35a7b0b51367e974e14a4ff229db5b207647884", size = 5672779, upload-time = "2025-09-26T09:02:19.11Z" },
+    { url = "https://files.pythonhosted.org/packages/a6/52/d0483cfa667cddaa294e3ab88fd2c2a6e9dc1a1928c0e5911e2e54bd5b50/grpcio-1.75.1-cp313-cp313-macosx_11_0_universal2.whl", hash = "sha256:5b8f381eadcd6ecaa143a21e9e80a26424c76a0a9b3d546febe6648f3a36a5ac", size = 11470623, upload-time = "2025-09-26T09:02:22.117Z" },
+    { url = "https://files.pythonhosted.org/packages/cf/e4/d1954dce2972e32384db6a30273275e8c8ea5a44b80347f9055589333b3f/grpcio-1.75.1-cp313-cp313-manylinux2014_aarch64.manylinux_2_17_aarch64.whl", hash = "sha256:5bf4001d3293e3414d0cf99ff9b1139106e57c3a66dfff0c5f60b2a6286ec133", size = 6248838, upload-time = "2025-09-26T09:02:26.426Z" },
+    { url = "https://files.pythonhosted.org/packages/06/43/073363bf63826ba8077c335d797a8d026f129dc0912b69c42feaf8f0cd26/grpcio-1.75.1-cp313-cp313-manylinux2014_i686.manylinux_2_17_i686.whl", hash = "sha256:9f82ff474103e26351dacfe8d50214e7c9322960d8d07ba7fa1d05ff981c8b2d", size = 6922663, upload-time = "2025-09-26T09:02:28.724Z" },
+    { url = "https://files.pythonhosted.org/packages/c2/6f/076ac0df6c359117676cacfa8a377e2abcecec6a6599a15a672d331f6680/grpcio-1.75.1-cp313-cp313-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:0ee119f4f88d9f75414217823d21d75bfe0e6ed40135b0cbbfc6376bc9f7757d", size = 6436149, upload-time = "2025-09-26T09:02:30.971Z" },
+    { url = "https://files.pythonhosted.org/packages/6b/27/1d08824f1d573fcb1fa35ede40d6020e68a04391709939e1c6f4193b445f/grpcio-1.75.1-cp313-cp313-musllinux_1_2_aarch64.whl", hash = "sha256:664eecc3abe6d916fa6cf8dd6b778e62fb264a70f3430a3180995bf2da935446", size = 7067989, upload-time = "2025-09-26T09:02:33.233Z" },
+    { url = "https://files.pythonhosted.org/packages/c6/98/98594cf97b8713feb06a8cb04eeef60b4757e3e2fb91aa0d9161da769843/grpcio-1.75.1-cp313-cp313-musllinux_1_2_i686.whl", hash = "sha256:c32193fa08b2fbebf08fe08e84f8a0aad32d87c3ad42999c65e9449871b1c66e", size = 8010717, upload-time = "2025-09-26T09:02:36.011Z" },
+    { url = "https://files.pythonhosted.org/packages/8c/7e/bb80b1bba03c12158f9254762cdf5cced4a9bc2e8ed51ed335915a5a06ef/grpcio-1.75.1-cp313-cp313-musllinux_1_2_x86_64.whl", hash = "sha256:5cebe13088b9254f6e615bcf1da9131d46cfa4e88039454aca9cb65f639bd3bc", size = 7463822, upload-time = "2025-09-26T09:02:38.26Z" },
+    { url = "https://files.pythonhosted.org/packages/23/1c/1ea57fdc06927eb5640f6750c697f596f26183573069189eeaf6ef86ba2d/grpcio-1.75.1-cp313-cp313-win32.whl", hash = "sha256:4b4c678e7ed50f8ae8b8dbad15a865ee73ce12668b6aaf411bf3258b5bc3f970", size = 3938490, upload-time = "2025-09-26T09:02:40.268Z" },
+    { url = "https://files.pythonhosted.org/packages/4b/24/fbb8ff1ccadfbf78ad2401c41aceaf02b0d782c084530d8871ddd69a2d49/grpcio-1.75.1-cp313-cp313-win_amd64.whl", hash = "sha256:5573f51e3f296a1bcf71e7a690c092845fb223072120f4bdb7a5b48e111def66", size = 4642538, upload-time = "2025-09-26T09:02:42.519Z" },
+    { url = "https://files.pythonhosted.org/packages/f2/1b/9a0a5cecd24302b9fdbcd55d15ed6267e5f3d5b898ff9ac8cbe17ee76129/grpcio-1.75.1-cp314-cp314-linux_armv7l.whl", hash = "sha256:c05da79068dd96723793bffc8d0e64c45f316248417515f28d22204d9dae51c7", size = 5673319, upload-time = "2025-09-26T09:02:44.742Z" },
+    { url = "https://files.pythonhosted.org/packages/c6/ec/9d6959429a83fbf5df8549c591a8a52bb313976f6646b79852c4884e3225/grpcio-1.75.1-cp314-cp314-macosx_11_0_universal2.whl", hash = "sha256:06373a94fd16ec287116a825161dca179a0402d0c60674ceeec8c9fba344fe66", size = 11480347, upload-time = "2025-09-26T09:02:47.539Z" },
+    { url = "https://files.pythonhosted.org/packages/09/7a/26da709e42c4565c3d7bf999a9569da96243ce34a8271a968dee810a7cf1/grpcio-1.75.1-cp314-cp314-manylinux2014_aarch64.manylinux_2_17_aarch64.whl", hash = "sha256:4484f4b7287bdaa7a5b3980f3c7224c3c622669405d20f69549f5fb956ad0421", size = 6254706, upload-time = "2025-09-26T09:02:50.4Z" },
+    { url = "https://files.pythonhosted.org/packages/f1/08/dcb26a319d3725f199c97e671d904d84ee5680de57d74c566a991cfab632/grpcio-1.75.1-cp314-cp314-manylinux2014_i686.manylinux_2_17_i686.whl", hash = "sha256:2720c239c1180eee69f7883c1d4c83fc1a495a2535b5fa322887c70bf02b16e8", size = 6922501, upload-time = "2025-09-26T09:02:52.711Z" },
+    { url = "https://files.pythonhosted.org/packages/78/66/044d412c98408a5e23cb348845979a2d17a2e2b6c3c34c1ec91b920f49d0/grpcio-1.75.1-cp314-cp314-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:07a554fa31c668cf0e7a188678ceeca3cb8fead29bbe455352e712ec33ca701c", size = 6437492, upload-time = "2025-09-26T09:02:55.542Z" },
+    { url = "https://files.pythonhosted.org/packages/4e/9d/5e3e362815152aa1afd8b26ea613effa005962f9da0eec6e0e4527e7a7d1/grpcio-1.75.1-cp314-cp314-musllinux_1_2_aarch64.whl", hash = "sha256:3e71a2105210366bfc398eef7f57a664df99194f3520edb88b9c3a7e46ee0d64", size = 7081061, upload-time = "2025-09-26T09:02:58.261Z" },
+    { url = "https://files.pythonhosted.org/packages/1e/1a/46615682a19e100f46e31ddba9ebc297c5a5ab9ddb47b35443ffadb8776c/grpcio-1.75.1-cp314-cp314-musllinux_1_2_i686.whl", hash = "sha256:8679aa8a5b67976776d3c6b0521e99d1c34db8a312a12bcfd78a7085cb9b604e", size = 8010849, upload-time = "2025-09-26T09:03:00.548Z" },
+    { url = "https://files.pythonhosted.org/packages/67/8e/3204b94ac30b0f675ab1c06540ab5578660dc8b690db71854d3116f20d00/grpcio-1.75.1-cp314-cp314-musllinux_1_2_x86_64.whl", hash = "sha256:aad1c774f4ebf0696a7f148a56d39a3432550612597331792528895258966dc0", size = 7464478, upload-time = "2025-09-26T09:03:03.096Z" },
+    { url = "https://files.pythonhosted.org/packages/b7/97/2d90652b213863b2cf466d9c1260ca7e7b67a16780431b3eb1d0420e3d5b/grpcio-1.75.1-cp314-cp314-win32.whl", hash = "sha256:62ce42d9994446b307649cb2a23335fa8e927f7ab2cbf5fcb844d6acb4d85f9c", size = 4012672, upload-time = "2025-09-26T09:03:05.477Z" },
+    { url = "https://files.pythonhosted.org/packages/f9/df/e2e6e9fc1c985cd1a59e6996a05647c720fe8a03b92f5ec2d60d366c531e/grpcio-1.75.1-cp314-cp314-win_amd64.whl", hash = "sha256:f86e92275710bea3000cb79feca1762dc0ad3b27830dd1a74e82ab321d4ee464", size = 4772475, upload-time = "2025-09-26T09:03:07.661Z" },
+]
+
+[[package]]
+name = "grpcio-status"
+version = "1.75.1"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "googleapis-common-protos" },
+    { name = "grpcio" },
+    { name = "protobuf" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/74/5b/1ce0e3eedcdc08b4739b3da5836f31142ec8bee1a9ae0ad8dc0dc39a14bf/grpcio_status-1.75.1.tar.gz", hash = "sha256:8162afa21833a2085c91089cc395ad880fac1378a1d60233d976649ed724cbf8", size = 13671, upload-time = "2025-09-26T09:13:16.412Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/d8/ad/6f414bb0b36eee20d93af6907256f208ffcda992ae6d3d7b6a778afe31e6/grpcio_status-1.75.1-py3-none-any.whl", hash = "sha256:f681b301be26dcf7abf5c765d4a22e4098765e1a65cbdfa3efca384edf8e4e3c", size = 14428, upload-time = "2025-09-26T09:12:55.516Z" },
+]
+
+[[package]]
+name = "identify"
+version = "2.6.15"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/ff/e7/685de97986c916a6d93b3876139e00eef26ad5bbbd61925d670ae8013449/identify-2.6.15.tar.gz", hash = "sha256:e4f4864b96c6557ef2a1e1c951771838f4edc9df3a72ec7118b338801b11c7bf", size = 99311, upload-time = "2025-10-02T17:43:40.631Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/0f/1c/e5fd8f973d4f375adb21565739498e2e9a1e54c858a97b9a8ccfdc81da9b/identify-2.6.15-py2.py3-none-any.whl", hash = "sha256:1181ef7608e00704db228516541eb83a88a9f94433a8c80bb9b5bd54b1d81757", size = 99183, upload-time = "2025-10-02T17:43:39.137Z" },
+]
+
+[[package]]
+name = "idna"
+version = "3.11"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/6f/6d/0703ccc57f3a7233505399edb88de3cbd678da106337b9fcde432b65ed60/idna-3.11.tar.gz", hash = "sha256:795dafcc9c04ed0c1fb032c2aa73654d8e8c5023a7df64a53f39190ada629902", size = 194582, upload-time = "2025-10-12T14:55:20.501Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/0e/61/66938bbb5fc52dbdf84594873d5b51fb1f7c7794e9c0f5bd885f30bc507b/idna-3.11-py3-none-any.whl", hash = "sha256:771a87f49d9defaf64091e6e6fe9c18d4833f140bd19464795bc32d966ca37ea", size = 71008, upload-time = "2025-10-12T14:55:18.883Z" },
+]
+
+[[package]]
+name = "iniconfig"
+version = "2.3.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/72/34/14ca021ce8e5dfedc35312d08ba8bf51fdd999c576889fc2c24cb97f4f10/iniconfig-2.3.0.tar.gz", hash = "sha256:c76315c77db068650d49c5b56314774a7804df16fee4402c1f19d6d15d8c4730", size = 20503, upload-time = "2025-10-18T21:55:43.219Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/cb/b1/3846dd7f199d53cb17f49cba7e651e9ce294d8497c8c150530ed11865bb8/iniconfig-2.3.0-py3-none-any.whl", hash = "sha256:f631c04d2c48c52b84d0d0549c99ff3859c98df65b3101406327ecc7d53fbf12", size = 7484, upload-time = "2025-10-18T21:55:41.639Z" },
+]
+
+[[package]]
+name = "loguru"
+version = "0.7.3"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "colorama", marker = "sys_platform == 'win32'" },
+    { name = "win32-setctime", marker = "sys_platform == 'win32'" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/3a/05/a1dae3dffd1116099471c643b8924f5aa6524411dc6c63fdae648c4f1aca/loguru-0.7.3.tar.gz", hash = "sha256:19480589e77d47b8d85b2c827ad95d49bf31b0dcde16593892eb51dd18706eb6", size = 63559, upload-time = "2024-12-06T11:20:56.608Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/0c/29/0348de65b8cc732daa3e33e67806420b2ae89bdce2b04af740289c5c6c8c/loguru-0.7.3-py3-none-any.whl", hash = "sha256:31a33c10c8e1e10422bfd431aeb5d351c7cf7fa671e3c4df004162264b28220c", size = 61595, upload-time = "2024-12-06T11:20:54.538Z" },
+]
+
+[[package]]
+name = "markdown-it-py"
+version = "4.0.0"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "mdurl" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/5b/f5/4ec618ed16cc4f8fb3b701563655a69816155e79e24a17b651541804721d/markdown_it_py-4.0.0.tar.gz", hash = "sha256:cb0a2b4aa34f932c007117b194e945bd74e0ec24133ceb5bac59009cda1cb9f3", size = 73070, upload-time = "2025-08-11T12:57:52.854Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/94/54/e7d793b573f298e1c9013b8c4dade17d481164aa517d1d7148619c2cedbf/markdown_it_py-4.0.0-py3-none-any.whl", hash = "sha256:87327c59b172c5011896038353a81343b6754500a08cd7a4973bb48c6d578147", size = 87321, upload-time = "2025-08-11T12:57:51.923Z" },
+]
+
+[[package]]
+name = "mdurl"
+version = "0.1.2"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/d6/54/cfe61301667036ec958cb99bd3efefba235e65cdeb9c84d24a8293ba1d90/mdurl-0.1.2.tar.gz", hash = "sha256:bb413d29f5eea38f31dd4754dd7377d4465116fb207585f97bf925588687c1ba", size = 8729, upload-time = "2022-08-14T12:40:10.846Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/b3/38/89ba8ad64ae25be8de66a6d463314cf1eb366222074cfda9ee839c56a4b4/mdurl-0.1.2-py3-none-any.whl", hash = "sha256:84008a41e51615a49fc9966191ff91509e3c40b939176e643fd50a5c2196b8f8", size = 9979, upload-time = "2022-08-14T12:40:09.779Z" },
+]
+
+[[package]]
+name = "mypy-extensions"
+version = "1.1.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/a2/6e/371856a3fb9d31ca8dac321cda606860fa4548858c0cc45d9d1d4ca2628b/mypy_extensions-1.1.0.tar.gz", hash = "sha256:52e68efc3284861e772bbcd66823fde5ae21fd2fdb51c62a211403730b916558", size = 6343, upload-time = "2025-04-22T14:54:24.164Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/79/7b/2c79738432f5c924bef5071f933bcc9efd0473bac3b4aa584a6f7c1c8df8/mypy_extensions-1.1.0-py3-none-any.whl", hash = "sha256:1be4cccdb0f2482337c4743e60421de3a356cd97508abadd57d47403e94f5505", size = 4963, upload-time = "2025-04-22T14:54:22.983Z" },
+]
+
+[[package]]
+name = "nodeenv"
+version = "1.9.1"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/43/16/fc88b08840de0e0a72a2f9d8c6bae36be573e475a6326ae854bcc549fc45/nodeenv-1.9.1.tar.gz", hash = "sha256:6ec12890a2dab7946721edbfbcd91f3319c6ccc9aec47be7c7e6b7011ee6645f", size = 47437, upload-time = "2024-06-04T18:44:11.171Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/d2/1d/1b658dbd2b9fa9c4c9f32accbfc0205d532c8c6194dc0f2a4c0428e7128a/nodeenv-1.9.1-py2.py3-none-any.whl", hash = "sha256:ba11c9782d29c27c70ffbdda2d7415098754709be8a7056d79a737cd901155c9", size = 22314, upload-time = "2024-06-04T18:44:08.352Z" },
+]
+
+[[package]]
+name = "openpyxl"
+version = "3.1.5"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "et-xmlfile" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/3d/f9/88d94a75de065ea32619465d2f77b29a0469500e99012523b91cc4141cd1/openpyxl-3.1.5.tar.gz", hash = "sha256:cf0e3cf56142039133628b5acffe8ef0c12bc902d2aadd3e0fe5878dc08d1050", size = 186464, upload-time = "2024-06-28T14:03:44.161Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/c0/da/977ded879c29cbd04de313843e76868e6e13408a94ed6b987245dc7c8506/openpyxl-3.1.5-py2.py3-none-any.whl", hash = "sha256:5282c12b107bffeef825f4617dc029afaf41d0ea60823bbb665ef3079dc79de2", size = 250910, upload-time = "2024-06-28T14:03:41.161Z" },
+]
+
+[[package]]
+name = "packaging"
+version = "25.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/a1/d4/1fc4078c65507b51b96ca8f8c3ba19e6a61c8253c72794544580a7b6c24d/packaging-25.0.tar.gz", hash = "sha256:d443872c98d677bf60f6a1f2f8c1cb748e8fe762d2bf9d3148b5599295b0fc4f", size = 165727, upload-time = "2025-04-19T11:48:59.673Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/20/12/38679034af332785aac8774540895e234f4d07f7545804097de4b666afd8/packaging-25.0-py3-none-any.whl", hash = "sha256:29572ef2b1f17581046b3a2227d5c611fb25ec70ca1ba8554b24b0e69331a484", size = 66469, upload-time = "2025-04-19T11:48:57.875Z" },
+]
+
+[[package]]
+name = "pandera"
+version = "0.26.1"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "packaging" },
+    { name = "pydantic" },
+    { name = "typeguard" },
+    { name = "typing-extensions" },
+    { name = "typing-inspect" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/ff/0b/bb312b98a92b00ff48e869e2769ce5ca6c7bc4ec793a429d450dc3c9bba2/pandera-0.26.1.tar.gz", hash = "sha256:81a55a6429770d31b3bf4c3e8e1096a38296bd3009f9eca5780fad3c3c17fd82", size = 560263, upload-time = "2025-08-26T17:06:30.907Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/db/3b/91622e08086a6be44d2c0f34947d94c5282b53d217003d3ba390ee2d174b/pandera-0.26.1-py3-none-any.whl", hash = "sha256:1ff5b70556ce2f85c6b27e8fbe835a1761972f4d05f6548b4686b0db26ecb73b", size = 292907, upload-time = "2025-08-26T17:06:29.193Z" },
+]
+
+[package.optional-dependencies]
+polars = [
+    { name = "polars" },
+]
+
+[[package]]
+name = "platformdirs"
+version = "4.5.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/61/33/9611380c2bdb1225fdef633e2a9610622310fed35ab11dac9620972ee088/platformdirs-4.5.0.tar.gz", hash = "sha256:70ddccdd7c99fc5942e9fc25636a8b34d04c24b335100223152c2803e4063312", size = 21632, upload-time = "2025-10-08T17:44:48.791Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/73/cb/ac7874b3e5d58441674fb70742e6c374b28b0c7cb988d37d991cde47166c/platformdirs-4.5.0-py3-none-any.whl", hash = "sha256:e578a81bb873cbb89a41fcc904c7ef523cc18284b7e3b3ccf06aca1403b7ebd3", size = 18651, upload-time = "2025-10-08T17:44:47.223Z" },
+]
+
+[[package]]
+name = "pluggy"
+version = "1.6.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/f9/e2/3e91f31a7d2b083fe6ef3fa267035b518369d9511ffab804f839851d2779/pluggy-1.6.0.tar.gz", hash = "sha256:7dcc130b76258d33b90f61b658791dede3486c3e6bfb003ee5c9bfb396dd22f3", size = 69412, upload-time = "2025-05-15T12:30:07.975Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/54/20/4d324d65cc6d9205fabedc306948156824eb9f0ee1633355a8f7ec5c66bf/pluggy-1.6.0-py3-none-any.whl", hash = "sha256:e920276dd6813095e9377c0bc5566d94c932c33b27a3e3945d8389c374dd4746", size = 20538, upload-time = "2025-05-15T12:30:06.134Z" },
+]
+
+[[package]]
+name = "polars"
+version = "1.34.0"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "polars-runtime-32" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/a1/3e/35fcf5bf51404371bb172b289a5065778dc97adca4416e199c294125eb05/polars-1.34.0.tar.gz", hash = "sha256:5de5f871027db4b11bcf39215a2d6b13b4a80baf8a55c5862d4ebedfd5cd4013", size = 684309, upload-time = "2025-10-02T18:31:04.396Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/6b/80/1791ac226bb989bef30fe8fde752b2021b6ec5dfd6e880262596aedf4c05/polars-1.34.0-py3-none-any.whl", hash = "sha256:40d2f357b4d9e447ad28bd2c9923e4318791a7c18eb68f31f1fbf11180f41391", size = 772686, upload-time = "2025-10-02T18:29:59.492Z" },
+]
+
+[[package]]
+name = "polars-runtime-32"
+version = "1.34.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/02/10/1189afb14cc47ed215ccf7fbd00ed21c48edfd89e51c16f8628a33ae4b1b/polars_runtime_32-1.34.0.tar.gz", hash = "sha256:ebe6f865128a0d833f53a3f6828360761ad86d1698bceb22bef9fd999500dc1c", size = 2634491, upload-time = "2025-10-02T18:31:05.502Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/97/35/bc4f1a9dcef61845e8e4e5d2318470b002b93a3564026f0643f562761ecb/polars_runtime_32-1.34.0-cp39-abi3-macosx_10_12_x86_64.whl", hash = "sha256:2878f9951e91121afe60c25433ef270b9a221e6ebf3de5f6642346b38cab3f03", size = 39655423, upload-time = "2025-10-02T18:30:02.846Z" },
+    { url = "https://files.pythonhosted.org/packages/a6/bb/d655a103e75b7c81c47a3c2d276be0200c0c15cfb6fd47f17932ddcf7519/polars_runtime_32-1.34.0-cp39-abi3-macosx_11_0_arm64.whl", hash = "sha256:fbc329c7d34a924228cc5dcdbbd4696d94411a3a5b15ad8bb868634c204e1951", size = 35986049, upload-time = "2025-10-02T18:30:05.848Z" },
+    { url = "https://files.pythonhosted.org/packages/9e/ce/11ca850b7862cb43605e5d86cdf655614376e0a059871cf8305af5406554/polars_runtime_32-1.34.0-cp39-abi3-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:93fa51d88a2d12ea996a5747aad5647d22a86cce73c80f208e61f487b10bc448", size = 40261269, upload-time = "2025-10-02T18:30:08.48Z" },
+    { url = "https://files.pythonhosted.org/packages/d8/25/77d12018c35489e19f7650b40679714a834effafc25d61e8dcee7c4fafce/polars_runtime_32-1.34.0-cp39-abi3-manylinux_2_24_aarch64.whl", hash = "sha256:79e4d696392c6d8d51f4347f0b167c52eef303c9d87093c0c68e8651198735b7", size = 37049077, upload-time = "2025-10-02T18:30:11.162Z" },
+    { url = "https://files.pythonhosted.org/packages/e2/75/c30049d45ea1365151f86f650ed5354124ff3209f0abe588664c8eb13a31/polars_runtime_32-1.34.0-cp39-abi3-win_amd64.whl", hash = "sha256:2501d6b29d9001ea5ea2fd9b598787e10ddf45d8c4a87c2bead75159e8a15711", size = 40105782, upload-time = "2025-10-02T18:30:14.597Z" },
+    { url = "https://files.pythonhosted.org/packages/a3/31/84efa27aa3478c8670bac1a720c8b1aee5c58c9c657c980e5e5c47fde883/polars_runtime_32-1.34.0-cp39-abi3-win_arm64.whl", hash = "sha256:f9ed1765378dfe0bcd1ac5ec570dd9eab27ea728bbc980cc9a76eebc55586559", size = 35873216, upload-time = "2025-10-02T18:30:17.439Z" },
+]
+
+[[package]]
+name = "pre-commit"
+version = "4.3.0"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "cfgv" },
+    { name = "identify" },
+    { name = "nodeenv" },
+    { name = "pyyaml" },
+    { name = "virtualenv" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/ff/29/7cf5bbc236333876e4b41f56e06857a87937ce4bf91e117a6991a2dbb02a/pre_commit-4.3.0.tar.gz", hash = "sha256:499fe450cc9d42e9d58e606262795ecb64dd05438943c62b66f6a8673da30b16", size = 193792, upload-time = "2025-08-09T18:56:14.651Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/5b/a5/987a405322d78a73b66e39e4a90e4ef156fd7141bf71df987e50717c321b/pre_commit-4.3.0-py2.py3-none-any.whl", hash = "sha256:2b0747ad7e6e967169136edffee14c16e148a778a54e4f967921aa1ebf2308d8", size = 220965, upload-time = "2025-08-09T18:56:13.192Z" },
+]
+
+[[package]]
+name = "proto-plus"
+version = "1.26.1"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "protobuf" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/f4/ac/87285f15f7cce6d4a008f33f1757fb5a13611ea8914eb58c3d0d26243468/proto_plus-1.26.1.tar.gz", hash = "sha256:21a515a4c4c0088a773899e23c7bbade3d18f9c66c73edd4c7ee3816bc96a012", size = 56142, upload-time = "2025-03-10T15:54:38.843Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/4e/6d/280c4c2ce28b1593a19ad5239c8b826871fc6ec275c21afc8e1820108039/proto_plus-1.26.1-py3-none-any.whl", hash = "sha256:13285478c2dcf2abb829db158e1047e2f1e8d63a077d94263c2b88b043c75a66", size = 50163, upload-time = "2025-03-10T15:54:37.335Z" },
+]
+
+[[package]]
+name = "protobuf"
+version = "6.33.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/19/ff/64a6c8f420818bb873713988ca5492cba3a7946be57e027ac63495157d97/protobuf-6.33.0.tar.gz", hash = "sha256:140303d5c8d2037730c548f8c7b93b20bb1dc301be280c378b82b8894589c954", size = 443463, upload-time = "2025-10-15T20:39:52.159Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/7e/ee/52b3fa8feb6db4a833dfea4943e175ce645144532e8a90f72571ad85df4e/protobuf-6.33.0-cp310-abi3-win32.whl", hash = "sha256:d6101ded078042a8f17959eccd9236fb7a9ca20d3b0098bbcb91533a5680d035", size = 425593, upload-time = "2025-10-15T20:39:40.29Z" },
+    { url = "https://files.pythonhosted.org/packages/7b/c6/7a465f1825872c55e0341ff4a80198743f73b69ce5d43ab18043699d1d81/protobuf-6.33.0-cp310-abi3-win_amd64.whl", hash = "sha256:9a031d10f703f03768f2743a1c403af050b6ae1f3480e9c140f39c45f81b13ee", size = 436882, upload-time = "2025-10-15T20:39:42.841Z" },
+    { url = "https://files.pythonhosted.org/packages/e1/a9/b6eee662a6951b9c3640e8e452ab3e09f117d99fc10baa32d1581a0d4099/protobuf-6.33.0-cp39-abi3-macosx_10_9_universal2.whl", hash = "sha256:905b07a65f1a4b72412314082c7dbfae91a9e8b68a0cc1577515f8df58ecf455", size = 427521, upload-time = "2025-10-15T20:39:43.803Z" },
+    { url = "https://files.pythonhosted.org/packages/10/35/16d31e0f92c6d2f0e77c2a3ba93185130ea13053dd16200a57434c882f2b/protobuf-6.33.0-cp39-abi3-manylinux2014_aarch64.whl", hash = "sha256:e0697ece353e6239b90ee43a9231318302ad8353c70e6e45499fa52396debf90", size = 324445, upload-time = "2025-10-15T20:39:44.932Z" },
+    { url = "https://files.pythonhosted.org/packages/e6/eb/2a981a13e35cda8b75b5585aaffae2eb904f8f351bdd3870769692acbd8a/protobuf-6.33.0-cp39-abi3-manylinux2014_s390x.whl", hash = "sha256:e0a1715e4f27355afd9570f3ea369735afc853a6c3951a6afe1f80d8569ad298", size = 339159, upload-time = "2025-10-15T20:39:46.186Z" },
+    { url = "https://files.pythonhosted.org/packages/21/51/0b1cbad62074439b867b4e04cc09b93f6699d78fd191bed2bbb44562e077/protobuf-6.33.0-cp39-abi3-manylinux2014_x86_64.whl", hash = "sha256:35be49fd3f4fefa4e6e2aacc35e8b837d6703c37a2168a55ac21e9b1bc7559ef", size = 323172, upload-time = "2025-10-15T20:39:47.465Z" },
+    { url = "https://files.pythonhosted.org/packages/07/d1/0a28c21707807c6aacd5dc9c3704b2aa1effbf37adebd8caeaf68b17a636/protobuf-6.33.0-py3-none-any.whl", hash = "sha256:25c9e1963c6734448ea2d308cfa610e692b801304ba0908d7bfa564ac5132995", size = 170477, upload-time = "2025-10-15T20:39:51.311Z" },
+]
+
+[[package]]
+name = "pyasn1"
+version = "0.6.1"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/ba/e9/01f1a64245b89f039897cb0130016d79f77d52669aae6ee7b159a6c4c018/pyasn1-0.6.1.tar.gz", hash = "sha256:6f580d2bdd84365380830acf45550f2511469f673cb4a5ae3857a3170128b034", size = 145322, upload-time = "2024-09-10T22:41:42.55Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/c8/f1/d6a797abb14f6283c0ddff96bbdd46937f64122b8c925cab503dd37f8214/pyasn1-0.6.1-py3-none-any.whl", hash = "sha256:0d632f46f2ba09143da3a8afe9e33fb6f92fa2320ab7e886e2d0f7672af84629", size = 83135, upload-time = "2024-09-11T16:00:36.122Z" },
+]
+
+[[package]]
+name = "pyasn1-modules"
+version = "0.4.2"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "pyasn1" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/e9/e6/78ebbb10a8c8e4b61a59249394a4a594c1a7af95593dc933a349c8d00964/pyasn1_modules-0.4.2.tar.gz", hash = "sha256:677091de870a80aae844b1ca6134f54652fa2c8c5a52aa396440ac3106e941e6", size = 307892, upload-time = "2025-03-28T02:41:22.17Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/47/8d/d529b5d697919ba8c11ad626e835d4039be708a35b0d22de83a269a6682c/pyasn1_modules-0.4.2-py3-none-any.whl", hash = "sha256:29253a9207ce32b64c3ac6600edc75368f98473906e8fd1043bd6b5b1de2c14a", size = 181259, upload-time = "2025-03-28T02:41:19.028Z" },
+]
+
+[[package]]
+name = "pydantic"
+version = "2.12.3"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "annotated-types" },
+    { name = "pydantic-core" },
+    { name = "typing-extensions" },
+    { name = "typing-inspection" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/f3/1e/4f0a3233767010308f2fd6bd0814597e3f63f1dc98304a9112b8759df4ff/pydantic-2.12.3.tar.gz", hash = "sha256:1da1c82b0fc140bb0103bc1441ffe062154c8d38491189751ee00fd8ca65ce74", size = 819383, upload-time = "2025-10-17T15:04:21.222Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/a1/6b/83661fa77dcefa195ad5f8cd9af3d1a7450fd57cc883ad04d65446ac2029/pydantic-2.12.3-py3-none-any.whl", hash = "sha256:6986454a854bc3bc6e5443e1369e06a3a456af9d339eda45510f517d9ea5c6bf", size = 462431, upload-time = "2025-10-17T15:04:19.346Z" },
+]
+
+[[package]]
+name = "pydantic-core"
+version = "2.41.4"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "typing-extensions" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/df/18/d0944e8eaaa3efd0a91b0f1fc537d3be55ad35091b6a87638211ba691964/pydantic_core-2.41.4.tar.gz", hash = "sha256:70e47929a9d4a1905a67e4b687d5946026390568a8e952b92824118063cee4d5", size = 457557, upload-time = "2025-10-14T10:23:47.909Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/62/4c/f6cbfa1e8efacd00b846764e8484fe173d25b8dab881e277a619177f3384/pydantic_core-2.41.4-cp311-cp311-macosx_10_12_x86_64.whl", hash = "sha256:28ff11666443a1a8cf2a044d6a545ebffa8382b5f7973f22c36109205e65dc80", size = 2109062, upload-time = "2025-10-14T10:20:04.486Z" },
+    { url = "https://files.pythonhosted.org/packages/21/f8/40b72d3868896bfcd410e1bd7e516e762d326201c48e5b4a06446f6cf9e8/pydantic_core-2.41.4-cp311-cp311-macosx_11_0_arm64.whl", hash = "sha256:61760c3925d4633290292bad462e0f737b840508b4f722247d8729684f6539ae", size = 1916301, upload-time = "2025-10-14T10:20:06.857Z" },
+    { url = "https://files.pythonhosted.org/packages/94/4d/d203dce8bee7faeca791671c88519969d98d3b4e8f225da5b96dad226fc8/pydantic_core-2.41.4-cp311-cp311-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:eae547b7315d055b0de2ec3965643b0ab82ad0106a7ffd29615ee9f266a02827", size = 1968728, upload-time = "2025-10-14T10:20:08.353Z" },
+    { url = "https://files.pythonhosted.org/packages/65/f5/6a66187775df87c24d526985b3a5d78d861580ca466fbd9d4d0e792fcf6c/pydantic_core-2.41.4-cp311-cp311-manylinux_2_17_armv7l.manylinux2014_armv7l.whl", hash = "sha256:ef9ee5471edd58d1fcce1c80ffc8783a650e3e3a193fe90d52e43bb4d87bff1f", size = 2050238, upload-time = "2025-10-14T10:20:09.766Z" },
+    { url = "https://files.pythonhosted.org/packages/5e/b9/78336345de97298cf53236b2f271912ce11f32c1e59de25a374ce12f9cce/pydantic_core-2.41.4-cp311-cp311-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:15dd504af121caaf2c95cb90c0ebf71603c53de98305621b94da0f967e572def", size = 2249424, upload-time = "2025-10-14T10:20:11.732Z" },
+    { url = "https://files.pythonhosted.org/packages/99/bb/a4584888b70ee594c3d374a71af5075a68654d6c780369df269118af7402/pydantic_core-2.41.4-cp311-cp311-manylinux_2_17_s390x.manylinux2014_s390x.whl", hash = "sha256:3a926768ea49a8af4d36abd6a8968b8790f7f76dd7cbd5a4c180db2b4ac9a3a2", size = 2366047, upload-time = "2025-10-14T10:20:13.647Z" },
+    { url = "https://files.pythonhosted.org/packages/5f/8d/17fc5de9d6418e4d2ae8c675f905cdafdc59d3bf3bf9c946b7ab796a992a/pydantic_core-2.41.4-cp311-cp311-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:6916b9b7d134bff5440098a4deb80e4cb623e68974a87883299de9124126c2a8", size = 2071163, upload-time = "2025-10-14T10:20:15.307Z" },
+    { url = "https://files.pythonhosted.org/packages/54/e7/03d2c5c0b8ed37a4617430db68ec5e7dbba66358b629cd69e11b4d564367/pydantic_core-2.41.4-cp311-cp311-manylinux_2_5_i686.manylinux1_i686.whl", hash = "sha256:5cf90535979089df02e6f17ffd076f07237efa55b7343d98760bde8743c4b265", size = 2190585, upload-time = "2025-10-14T10:20:17.3Z" },
+    { url = "https://files.pythonhosted.org/packages/be/fc/15d1c9fe5ad9266a5897d9b932b7f53d7e5cfc800573917a2c5d6eea56ec/pydantic_core-2.41.4-cp311-cp311-musllinux_1_1_aarch64.whl", hash = "sha256:7533c76fa647fade2d7ec75ac5cc079ab3f34879626dae5689b27790a6cf5a5c", size = 2150109, upload-time = "2025-10-14T10:20:19.143Z" },
+    { url = "https://files.pythonhosted.org/packages/26/ef/e735dd008808226c83ba56972566138665b71477ad580fa5a21f0851df48/pydantic_core-2.41.4-cp311-cp311-musllinux_1_1_armv7l.whl", hash = "sha256:37e516bca9264cbf29612539801ca3cd5d1be465f940417b002905e6ed79d38a", size = 2315078, upload-time = "2025-10-14T10:20:20.742Z" },
+    { url = "https://files.pythonhosted.org/packages/90/00/806efdcf35ff2ac0f938362350cd9827b8afb116cc814b6b75cf23738c7c/pydantic_core-2.41.4-cp311-cp311-musllinux_1_1_x86_64.whl", hash = "sha256:0c19cb355224037c83642429b8ce261ae108e1c5fbf5c028bac63c77b0f8646e", size = 2318737, upload-time = "2025-10-14T10:20:22.306Z" },
+    { url = "https://files.pythonhosted.org/packages/41/7e/6ac90673fe6cb36621a2283552897838c020db343fa86e513d3f563b196f/pydantic_core-2.41.4-cp311-cp311-win32.whl", hash = "sha256:09c2a60e55b357284b5f31f5ab275ba9f7f70b7525e18a132ec1f9160b4f1f03", size = 1974160, upload-time = "2025-10-14T10:20:23.817Z" },
+    { url = "https://files.pythonhosted.org/packages/e0/9d/7c5e24ee585c1f8b6356e1d11d40ab807ffde44d2db3b7dfd6d20b09720e/pydantic_core-2.41.4-cp311-cp311-win_amd64.whl", hash = "sha256:711156b6afb5cb1cb7c14a2cc2c4a8b4c717b69046f13c6b332d8a0a8f41ca3e", size = 2021883, upload-time = "2025-10-14T10:20:25.48Z" },
+    { url = "https://files.pythonhosted.org/packages/33/90/5c172357460fc28b2871eb4a0fb3843b136b429c6fa827e4b588877bf115/pydantic_core-2.41.4-cp311-cp311-win_arm64.whl", hash = "sha256:6cb9cf7e761f4f8a8589a45e49ed3c0d92d1d696a45a6feaee8c904b26efc2db", size = 1968026, upload-time = "2025-10-14T10:20:27.039Z" },
+    { url = "https://files.pythonhosted.org/packages/e9/81/d3b3e95929c4369d30b2a66a91db63c8ed0a98381ae55a45da2cd1cc1288/pydantic_core-2.41.4-cp312-cp312-macosx_10_12_x86_64.whl", hash = "sha256:ab06d77e053d660a6faaf04894446df7b0a7e7aba70c2797465a0a1af00fc887", size = 2099043, upload-time = "2025-10-14T10:20:28.561Z" },
+    { url = "https://files.pythonhosted.org/packages/58/da/46fdac49e6717e3a94fc9201403e08d9d61aa7a770fab6190b8740749047/pydantic_core-2.41.4-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:c53ff33e603a9c1179a9364b0a24694f183717b2e0da2b5ad43c316c956901b2", size = 1910699, upload-time = "2025-10-14T10:20:30.217Z" },
+    { url = "https://files.pythonhosted.org/packages/1e/63/4d948f1b9dd8e991a5a98b77dd66c74641f5f2e5225fee37994b2e07d391/pydantic_core-2.41.4-cp312-cp312-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:304c54176af2c143bd181d82e77c15c41cbacea8872a2225dd37e6544dce9999", size = 1952121, upload-time = "2025-10-14T10:20:32.246Z" },
+    { url = "https://files.pythonhosted.org/packages/b2/a7/e5fc60a6f781fc634ecaa9ecc3c20171d238794cef69ae0af79ac11b89d7/pydantic_core-2.41.4-cp312-cp312-manylinux_2_17_armv7l.manylinux2014_armv7l.whl", hash = "sha256:025ba34a4cf4fb32f917d5d188ab5e702223d3ba603be4d8aca2f82bede432a4", size = 2041590, upload-time = "2025-10-14T10:20:34.332Z" },
+    { url = "https://files.pythonhosted.org/packages/70/69/dce747b1d21d59e85af433428978a1893c6f8a7068fa2bb4a927fba7a5ff/pydantic_core-2.41.4-cp312-cp312-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:b9f5f30c402ed58f90c70e12eff65547d3ab74685ffe8283c719e6bead8ef53f", size = 2219869, upload-time = "2025-10-14T10:20:35.965Z" },
+    { url = "https://files.pythonhosted.org/packages/83/6a/c070e30e295403bf29c4df1cb781317b6a9bac7cd07b8d3acc94d501a63c/pydantic_core-2.41.4-cp312-cp312-manylinux_2_17_s390x.manylinux2014_s390x.whl", hash = "sha256:dd96e5d15385d301733113bcaa324c8bcf111275b7675a9c6e88bfb19fc05e3b", size = 2345169, upload-time = "2025-10-14T10:20:37.627Z" },
+    { url = "https://files.pythonhosted.org/packages/f0/83/06d001f8043c336baea7fd202a9ac7ad71f87e1c55d8112c50b745c40324/pydantic_core-2.41.4-cp312-cp312-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:98f348cbb44fae6e9653c1055db7e29de67ea6a9ca03a5fa2c2e11a47cff0e47", size = 2070165, upload-time = "2025-10-14T10:20:39.246Z" },
+    { url = "https://files.pythonhosted.org/packages/14/0a/e567c2883588dd12bcbc110232d892cf385356f7c8a9910311ac997ab715/pydantic_core-2.41.4-cp312-cp312-manylinux_2_5_i686.manylinux1_i686.whl", hash = "sha256:ec22626a2d14620a83ca583c6f5a4080fa3155282718b6055c2ea48d3ef35970", size = 2189067, upload-time = "2025-10-14T10:20:41.015Z" },
+    { url = "https://files.pythonhosted.org/packages/f4/1d/3d9fca34273ba03c9b1c5289f7618bc4bd09c3ad2289b5420481aa051a99/pydantic_core-2.41.4-cp312-cp312-musllinux_1_1_aarch64.whl", hash = "sha256:3a95d4590b1f1a43bf33ca6d647b990a88f4a3824a8c4572c708f0b45a5290ed", size = 2132997, upload-time = "2025-10-14T10:20:43.106Z" },
+    { url = "https://files.pythonhosted.org/packages/52/70/d702ef7a6cd41a8afc61f3554922b3ed8d19dd54c3bd4bdbfe332e610827/pydantic_core-2.41.4-cp312-cp312-musllinux_1_1_armv7l.whl", hash = "sha256:f9672ab4d398e1b602feadcffcdd3af44d5f5e6ddc15bc7d15d376d47e8e19f8", size = 2307187, upload-time = "2025-10-14T10:20:44.849Z" },
+    { url = "https://files.pythonhosted.org/packages/68/4c/c06be6e27545d08b802127914156f38d10ca287a9e8489342793de8aae3c/pydantic_core-2.41.4-cp312-cp312-musllinux_1_1_x86_64.whl", hash = "sha256:84d8854db5f55fead3b579f04bda9a36461dab0730c5d570e1526483e7bb8431", size = 2305204, upload-time = "2025-10-14T10:20:46.781Z" },
+    { url = "https://files.pythonhosted.org/packages/b0/e5/35ae4919bcd9f18603419e23c5eaf32750224a89d41a8df1a3704b69f77e/pydantic_core-2.41.4-cp312-cp312-win32.whl", hash = "sha256:9be1c01adb2ecc4e464392c36d17f97e9110fbbc906bcbe1c943b5b87a74aabd", size = 1972536, upload-time = "2025-10-14T10:20:48.39Z" },
+    { url = "https://files.pythonhosted.org/packages/1e/c2/49c5bb6d2a49eb2ee3647a93e3dae7080c6409a8a7558b075027644e879c/pydantic_core-2.41.4-cp312-cp312-win_amd64.whl", hash = "sha256:d682cf1d22bab22a5be08539dca3d1593488a99998f9f412137bc323179067ff", size = 2031132, upload-time = "2025-10-14T10:20:50.421Z" },
+    { url = "https://files.pythonhosted.org/packages/06/23/936343dbcba6eec93f73e95eb346810fc732f71ba27967b287b66f7b7097/pydantic_core-2.41.4-cp312-cp312-win_arm64.whl", hash = "sha256:833eebfd75a26d17470b58768c1834dfc90141b7afc6eb0429c21fc5a21dcfb8", size = 1969483, upload-time = "2025-10-14T10:20:52.35Z" },
+    { url = "https://files.pythonhosted.org/packages/13/d0/c20adabd181a029a970738dfe23710b52a31f1258f591874fcdec7359845/pydantic_core-2.41.4-cp313-cp313-macosx_10_12_x86_64.whl", hash = "sha256:85e050ad9e5f6fe1004eec65c914332e52f429bc0ae12d6fa2092407a462c746", size = 2105688, upload-time = "2025-10-14T10:20:54.448Z" },
+    { url = "https://files.pythonhosted.org/packages/00/b6/0ce5c03cec5ae94cca220dfecddc453c077d71363b98a4bbdb3c0b22c783/pydantic_core-2.41.4-cp313-cp313-macosx_11_0_arm64.whl", hash = "sha256:e7393f1d64792763a48924ba31d1e44c2cfbc05e3b1c2c9abb4ceeadd912cced", size = 1910807, upload-time = "2025-10-14T10:20:56.115Z" },
+    { url = "https://files.pythonhosted.org/packages/68/3e/800d3d02c8beb0b5c069c870cbb83799d085debf43499c897bb4b4aaff0d/pydantic_core-2.41.4-cp313-cp313-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:94dab0940b0d1fb28bcab847adf887c66a27a40291eedf0b473be58761c9799a", size = 1956669, upload-time = "2025-10-14T10:20:57.874Z" },
+    { url = "https://files.pythonhosted.org/packages/60/a4/24271cc71a17f64589be49ab8bd0751f6a0a03046c690df60989f2f95c2c/pydantic_core-2.41.4-cp313-cp313-manylinux_2_17_armv7l.manylinux2014_armv7l.whl", hash = "sha256:de7c42f897e689ee6f9e93c4bec72b99ae3b32a2ade1c7e4798e690ff5246e02", size = 2051629, upload-time = "2025-10-14T10:21:00.006Z" },
+    { url = "https://files.pythonhosted.org/packages/68/de/45af3ca2f175d91b96bfb62e1f2d2f1f9f3b14a734afe0bfeff079f78181/pydantic_core-2.41.4-cp313-cp313-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:664b3199193262277b8b3cd1e754fb07f2c6023289c815a1e1e8fb415cb247b1", size = 2224049, upload-time = "2025-10-14T10:21:01.801Z" },
+    { url = "https://files.pythonhosted.org/packages/af/8f/ae4e1ff84672bf869d0a77af24fd78387850e9497753c432875066b5d622/pydantic_core-2.41.4-cp313-cp313-manylinux_2_17_s390x.manylinux2014_s390x.whl", hash = "sha256:d95b253b88f7d308b1c0b417c4624f44553ba4762816f94e6986819b9c273fb2", size = 2342409, upload-time = "2025-10-14T10:21:03.556Z" },
+    { url = "https://files.pythonhosted.org/packages/18/62/273dd70b0026a085c7b74b000394e1ef95719ea579c76ea2f0cc8893736d/pydantic_core-2.41.4-cp313-cp313-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:a1351f5bbdbbabc689727cb91649a00cb9ee7203e0a6e54e9f5ba9e22e384b84", size = 2069635, upload-time = "2025-10-14T10:21:05.385Z" },
+    { url = "https://files.pythonhosted.org/packages/30/03/cf485fff699b4cdaea469bc481719d3e49f023241b4abb656f8d422189fc/pydantic_core-2.41.4-cp313-cp313-manylinux_2_5_i686.manylinux1_i686.whl", hash = "sha256:1affa4798520b148d7182da0615d648e752de4ab1a9566b7471bc803d88a062d", size = 2194284, upload-time = "2025-10-14T10:21:07.122Z" },
+    { url = "https://files.pythonhosted.org/packages/f9/7e/c8e713db32405dfd97211f2fc0a15d6bf8adb7640f3d18544c1f39526619/pydantic_core-2.41.4-cp313-cp313-musllinux_1_1_aarch64.whl", hash = "sha256:7b74e18052fea4aa8dea2fb7dbc23d15439695da6cbe6cfc1b694af1115df09d", size = 2137566, upload-time = "2025-10-14T10:21:08.981Z" },
+    { url = "https://files.pythonhosted.org/packages/04/f7/db71fd4cdccc8b75990f79ccafbbd66757e19f6d5ee724a6252414483fb4/pydantic_core-2.41.4-cp313-cp313-musllinux_1_1_armv7l.whl", hash = "sha256:285b643d75c0e30abda9dc1077395624f314a37e3c09ca402d4015ef5979f1a2", size = 2316809, upload-time = "2025-10-14T10:21:10.805Z" },
+    { url = "https://files.pythonhosted.org/packages/76/63/a54973ddb945f1bca56742b48b144d85c9fc22f819ddeb9f861c249d5464/pydantic_core-2.41.4-cp313-cp313-musllinux_1_1_x86_64.whl", hash = "sha256:f52679ff4218d713b3b33f88c89ccbf3a5c2c12ba665fb80ccc4192b4608dbab", size = 2311119, upload-time = "2025-10-14T10:21:12.583Z" },
+    { url = "https://files.pythonhosted.org/packages/f8/03/5d12891e93c19218af74843a27e32b94922195ded2386f7b55382f904d2f/pydantic_core-2.41.4-cp313-cp313-win32.whl", hash = "sha256:ecde6dedd6fff127c273c76821bb754d793be1024bc33314a120f83a3c69460c", size = 1981398, upload-time = "2025-10-14T10:21:14.584Z" },
+    { url = "https://files.pythonhosted.org/packages/be/d8/fd0de71f39db91135b7a26996160de71c073d8635edfce8b3c3681be0d6d/pydantic_core-2.41.4-cp313-cp313-win_amd64.whl", hash = "sha256:d081a1f3800f05409ed868ebb2d74ac39dd0c1ff6c035b5162356d76030736d4", size = 2030735, upload-time = "2025-10-14T10:21:16.432Z" },
+    { url = "https://files.pythonhosted.org/packages/72/86/c99921c1cf6650023c08bfab6fe2d7057a5142628ef7ccfa9921f2dda1d5/pydantic_core-2.41.4-cp313-cp313-win_arm64.whl", hash = "sha256:f8e49c9c364a7edcbe2a310f12733aad95b022495ef2a8d653f645e5d20c1564", size = 1973209, upload-time = "2025-10-14T10:21:18.213Z" },
+    { url = "https://files.pythonhosted.org/packages/36/0d/b5706cacb70a8414396efdda3d72ae0542e050b591119e458e2490baf035/pydantic_core-2.41.4-cp313-cp313t-macosx_11_0_arm64.whl", hash = "sha256:ed97fd56a561f5eb5706cebe94f1ad7c13b84d98312a05546f2ad036bafe87f4", size = 1877324, upload-time = "2025-10-14T10:21:20.363Z" },
+    { url = "https://files.pythonhosted.org/packages/de/2d/cba1fa02cfdea72dfb3a9babb067c83b9dff0bbcb198368e000a6b756ea7/pydantic_core-2.41.4-cp313-cp313t-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:a870c307bf1ee91fc58a9a61338ff780d01bfae45922624816878dce784095d2", size = 1884515, upload-time = "2025-10-14T10:21:22.339Z" },
+    { url = "https://files.pythonhosted.org/packages/07/ea/3df927c4384ed9b503c9cc2d076cf983b4f2adb0c754578dfb1245c51e46/pydantic_core-2.41.4-cp313-cp313t-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:d25e97bc1f5f8f7985bdc2335ef9e73843bb561eb1fa6831fdfc295c1c2061cf", size = 2042819, upload-time = "2025-10-14T10:21:26.683Z" },
+    { url = "https://files.pythonhosted.org/packages/6a/ee/df8e871f07074250270a3b1b82aad4cd0026b588acd5d7d3eb2fcb1471a3/pydantic_core-2.41.4-cp313-cp313t-win_amd64.whl", hash = "sha256:d405d14bea042f166512add3091c1af40437c2e7f86988f3915fabd27b1e9cd2", size = 1995866, upload-time = "2025-10-14T10:21:28.951Z" },
+    { url = "https://files.pythonhosted.org/packages/fc/de/b20f4ab954d6d399499c33ec4fafc46d9551e11dc1858fb7f5dca0748ceb/pydantic_core-2.41.4-cp313-cp313t-win_arm64.whl", hash = "sha256:19f3684868309db5263a11bace3c45d93f6f24afa2ffe75a647583df22a2ff89", size = 1970034, upload-time = "2025-10-14T10:21:30.869Z" },
+    { url = "https://files.pythonhosted.org/packages/54/28/d3325da57d413b9819365546eb9a6e8b7cbd9373d9380efd5f74326143e6/pydantic_core-2.41.4-cp314-cp314-macosx_10_12_x86_64.whl", hash = "sha256:e9205d97ed08a82ebb9a307e92914bb30e18cdf6f6b12ca4bedadb1588a0bfe1", size = 2102022, upload-time = "2025-10-14T10:21:32.809Z" },
+    { url = "https://files.pythonhosted.org/packages/9e/24/b58a1bc0d834bf1acc4361e61233ee217169a42efbdc15a60296e13ce438/pydantic_core-2.41.4-cp314-cp314-macosx_11_0_arm64.whl", hash = "sha256:82df1f432b37d832709fbcc0e24394bba04a01b6ecf1ee87578145c19cde12ac", size = 1905495, upload-time = "2025-10-14T10:21:34.812Z" },
+    { url = "https://files.pythonhosted.org/packages/fb/a4/71f759cc41b7043e8ecdaab81b985a9b6cad7cec077e0b92cff8b71ecf6b/pydantic_core-2.41.4-cp314-cp314-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:fc3b4cc4539e055cfa39a3763c939f9d409eb40e85813257dcd761985a108554", size = 1956131, upload-time = "2025-10-14T10:21:36.924Z" },
+    { url = "https://files.pythonhosted.org/packages/b0/64/1e79ac7aa51f1eec7c4cda8cbe456d5d09f05fdd68b32776d72168d54275/pydantic_core-2.41.4-cp314-cp314-manylinux_2_17_armv7l.manylinux2014_armv7l.whl", hash = "sha256:b1eb1754fce47c63d2ff57fdb88c351a6c0150995890088b33767a10218eaa4e", size = 2052236, upload-time = "2025-10-14T10:21:38.927Z" },
+    { url = "https://files.pythonhosted.org/packages/e9/e3/a3ffc363bd4287b80f1d43dc1c28ba64831f8dfc237d6fec8f2661138d48/pydantic_core-2.41.4-cp314-cp314-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:e6ab5ab30ef325b443f379ddb575a34969c333004fca5a1daa0133a6ffaad616", size = 2223573, upload-time = "2025-10-14T10:21:41.574Z" },
+    { url = "https://files.pythonhosted.org/packages/28/27/78814089b4d2e684a9088ede3790763c64693c3d1408ddc0a248bc789126/pydantic_core-2.41.4-cp314-cp314-manylinux_2_17_s390x.manylinux2014_s390x.whl", hash = "sha256:31a41030b1d9ca497634092b46481b937ff9397a86f9f51bd41c4767b6fc04af", size = 2342467, upload-time = "2025-10-14T10:21:44.018Z" },
+    { url = "https://files.pythonhosted.org/packages/92/97/4de0e2a1159cb85ad737e03306717637842c88c7fd6d97973172fb183149/pydantic_core-2.41.4-cp314-cp314-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:a44ac1738591472c3d020f61c6df1e4015180d6262ebd39bf2aeb52571b60f12", size = 2063754, upload-time = "2025-10-14T10:21:46.466Z" },
+    { url = "https://files.pythonhosted.org/packages/0f/50/8cb90ce4b9efcf7ae78130afeb99fd1c86125ccdf9906ef64b9d42f37c25/pydantic_core-2.41.4-cp314-cp314-manylinux_2_5_i686.manylinux1_i686.whl", hash = "sha256:d72f2b5e6e82ab8f94ea7d0d42f83c487dc159c5240d8f83beae684472864e2d", size = 2196754, upload-time = "2025-10-14T10:21:48.486Z" },
+    { url = "https://files.pythonhosted.org/packages/34/3b/ccdc77af9cd5082723574a1cc1bcae7a6acacc829d7c0a06201f7886a109/pydantic_core-2.41.4-cp314-cp314-musllinux_1_1_aarch64.whl", hash = "sha256:c4d1e854aaf044487d31143f541f7aafe7b482ae72a022c664b2de2e466ed0ad", size = 2137115, upload-time = "2025-10-14T10:21:50.63Z" },
+    { url = "https://files.pythonhosted.org/packages/ca/ba/e7c7a02651a8f7c52dc2cff2b64a30c313e3b57c7d93703cecea76c09b71/pydantic_core-2.41.4-cp314-cp314-musllinux_1_1_armv7l.whl", hash = "sha256:b568af94267729d76e6ee5ececda4e283d07bbb28e8148bb17adad93d025d25a", size = 2317400, upload-time = "2025-10-14T10:21:52.959Z" },
+    { url = "https://files.pythonhosted.org/packages/2c/ba/6c533a4ee8aec6b812c643c49bb3bd88d3f01e3cebe451bb85512d37f00f/pydantic_core-2.41.4-cp314-cp314-musllinux_1_1_x86_64.whl", hash = "sha256:6d55fb8b1e8929b341cc313a81a26e0d48aa3b519c1dbaadec3a6a2b4fcad025", size = 2312070, upload-time = "2025-10-14T10:21:55.419Z" },
+    { url = "https://files.pythonhosted.org/packages/22/ae/f10524fcc0ab8d7f96cf9a74c880243576fd3e72bd8ce4f81e43d22bcab7/pydantic_core-2.41.4-cp314-cp314-win32.whl", hash = "sha256:5b66584e549e2e32a1398df11da2e0a7eff45d5c2d9db9d5667c5e6ac764d77e", size = 1982277, upload-time = "2025-10-14T10:21:57.474Z" },
+    { url = "https://files.pythonhosted.org/packages/b4/dc/e5aa27aea1ad4638f0c3fb41132f7eb583bd7420ee63204e2d4333a3bbf9/pydantic_core-2.41.4-cp314-cp314-win_amd64.whl", hash = "sha256:557a0aab88664cc552285316809cab897716a372afaf8efdbef756f8b890e894", size = 2024608, upload-time = "2025-10-14T10:21:59.557Z" },
+    { url = "https://files.pythonhosted.org/packages/3e/61/51d89cc2612bd147198e120a13f150afbf0bcb4615cddb049ab10b81b79e/pydantic_core-2.41.4-cp314-cp314-win_arm64.whl", hash = "sha256:3f1ea6f48a045745d0d9f325989d8abd3f1eaf47dd00485912d1a3a63c623a8d", size = 1967614, upload-time = "2025-10-14T10:22:01.847Z" },
+    { url = "https://files.pythonhosted.org/packages/0d/c2/472f2e31b95eff099961fa050c376ab7156a81da194f9edb9f710f68787b/pydantic_core-2.41.4-cp314-cp314t-macosx_11_0_arm64.whl", hash = "sha256:6c1fe4c5404c448b13188dd8bd2ebc2bdd7e6727fa61ff481bcc2cca894018da", size = 1876904, upload-time = "2025-10-14T10:22:04.062Z" },
+    { url = "https://files.pythonhosted.org/packages/4a/07/ea8eeb91173807ecdae4f4a5f4b150a520085b35454350fc219ba79e66a3/pydantic_core-2.41.4-cp314-cp314t-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:523e7da4d43b113bf8e7b49fa4ec0c35bf4fe66b2230bfc5c13cc498f12c6c3e", size = 1882538, upload-time = "2025-10-14T10:22:06.39Z" },
+    { url = "https://files.pythonhosted.org/packages/1e/29/b53a9ca6cd366bfc928823679c6a76c7a4c69f8201c0ba7903ad18ebae2f/pydantic_core-2.41.4-cp314-cp314t-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:5729225de81fb65b70fdb1907fcf08c75d498f4a6f15af005aabb1fdadc19dfa", size = 2041183, upload-time = "2025-10-14T10:22:08.812Z" },
+    { url = "https://files.pythonhosted.org/packages/c7/3d/f8c1a371ceebcaf94d6dd2d77c6cf4b1c078e13a5837aee83f760b4f7cfd/pydantic_core-2.41.4-cp314-cp314t-win_amd64.whl", hash = "sha256:de2cfbb09e88f0f795fd90cf955858fc2c691df65b1f21f0aa00b99f3fbc661d", size = 1993542, upload-time = "2025-10-14T10:22:11.332Z" },
+    { url = "https://files.pythonhosted.org/packages/8a/ac/9fc61b4f9d079482a290afe8d206b8f490e9fd32d4fc03ed4fc698214e01/pydantic_core-2.41.4-cp314-cp314t-win_arm64.whl", hash = "sha256:d34f950ae05a83e0ede899c595f312ca976023ea1db100cd5aa188f7005e3ab0", size = 1973897, upload-time = "2025-10-14T10:22:13.444Z" },
+    { url = "https://files.pythonhosted.org/packages/b0/12/5ba58daa7f453454464f92b3ca7b9d7c657d8641c48e370c3ebc9a82dd78/pydantic_core-2.41.4-graalpy311-graalpy242_311_native-macosx_10_12_x86_64.whl", hash = "sha256:a1b2cfec3879afb742a7b0bcfa53e4f22ba96571c9e54d6a3afe1052d17d843b", size = 2122139, upload-time = "2025-10-14T10:22:47.288Z" },
+    { url = "https://files.pythonhosted.org/packages/21/fb/6860126a77725c3108baecd10fd3d75fec25191d6381b6eb2ac660228eac/pydantic_core-2.41.4-graalpy311-graalpy242_311_native-macosx_11_0_arm64.whl", hash = "sha256:d175600d975b7c244af6eb9c9041f10059f20b8bbffec9e33fdd5ee3f67cdc42", size = 1936674, upload-time = "2025-10-14T10:22:49.555Z" },
+    { url = "https://files.pythonhosted.org/packages/de/be/57dcaa3ed595d81f8757e2b44a38240ac5d37628bce25fb20d02c7018776/pydantic_core-2.41.4-graalpy311-graalpy242_311_native-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:0f184d657fa4947ae5ec9c47bd7e917730fa1cbb78195037e32dcbab50aca5ee", size = 1956398, upload-time = "2025-10-14T10:22:52.19Z" },
+    { url = "https://files.pythonhosted.org/packages/2f/1d/679a344fadb9695f1a6a294d739fbd21d71fa023286daeea8c0ed49e7c2b/pydantic_core-2.41.4-graalpy311-graalpy242_311_native-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:1ed810568aeffed3edc78910af32af911c835cc39ebbfacd1f0ab5dd53028e5c", size = 2138674, upload-time = "2025-10-14T10:22:54.499Z" },
+    { url = "https://files.pythonhosted.org/packages/c4/48/ae937e5a831b7c0dc646b2ef788c27cd003894882415300ed21927c21efa/pydantic_core-2.41.4-graalpy312-graalpy250_312_native-macosx_10_12_x86_64.whl", hash = "sha256:4f5d640aeebb438517150fdeec097739614421900e4a08db4a3ef38898798537", size = 2112087, upload-time = "2025-10-14T10:22:56.818Z" },
+    { url = "https://files.pythonhosted.org/packages/5e/db/6db8073e3d32dae017da7e0d16a9ecb897d0a4d92e00634916e486097961/pydantic_core-2.41.4-graalpy312-graalpy250_312_native-macosx_11_0_arm64.whl", hash = "sha256:4a9ab037b71927babc6d9e7fc01aea9e66dc2a4a34dff06ef0724a4049629f94", size = 1920387, upload-time = "2025-10-14T10:22:59.342Z" },
+    { url = "https://files.pythonhosted.org/packages/0d/c1/dd3542d072fcc336030d66834872f0328727e3b8de289c662faa04aa270e/pydantic_core-2.41.4-graalpy312-graalpy250_312_native-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:e4dab9484ec605c3016df9ad4fd4f9a390bc5d816a3b10c6550f8424bb80b18c", size = 1951495, upload-time = "2025-10-14T10:23:02.089Z" },
+    { url = "https://files.pythonhosted.org/packages/2b/c6/db8d13a1f8ab3f1eb08c88bd00fd62d44311e3456d1e85c0e59e0a0376e7/pydantic_core-2.41.4-graalpy312-graalpy250_312_native-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:bd8a5028425820731d8c6c098ab642d7b8b999758e24acae03ed38a66eca8335", size = 2139008, upload-time = "2025-10-14T10:23:04.539Z" },
+    { url = "https://files.pythonhosted.org/packages/7e/7d/138e902ed6399b866f7cfe4435d22445e16fff888a1c00560d9dc79a780f/pydantic_core-2.41.4-pp311-pypy311_pp73-macosx_10_12_x86_64.whl", hash = "sha256:491535d45cd7ad7e4a2af4a5169b0d07bebf1adfd164b0368da8aa41e19907a5", size = 2104721, upload-time = "2025-10-14T10:23:26.906Z" },
+    { url = "https://files.pythonhosted.org/packages/47/13/0525623cf94627f7b53b4c2034c81edc8491cbfc7c28d5447fa318791479/pydantic_core-2.41.4-pp311-pypy311_pp73-macosx_11_0_arm64.whl", hash = "sha256:54d86c0cada6aba4ec4c047d0e348cbad7063b87ae0f005d9f8c9ad04d4a92a2", size = 1931608, upload-time = "2025-10-14T10:23:29.306Z" },
+    { url = "https://files.pythonhosted.org/packages/d6/f9/744bc98137d6ef0a233f808bfc9b18cf94624bf30836a18d3b05d08bf418/pydantic_core-2.41.4-pp311-pypy311_pp73-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:eca1124aced216b2500dc2609eade086d718e8249cb9696660ab447d50a758bd", size = 2132986, upload-time = "2025-10-14T10:23:32.057Z" },
+    { url = "https://files.pythonhosted.org/packages/17/c8/629e88920171173f6049386cc71f893dff03209a9ef32b4d2f7e7c264bcf/pydantic_core-2.41.4-pp311-pypy311_pp73-manylinux_2_5_i686.manylinux1_i686.whl", hash = "sha256:6c9024169becccf0cb470ada03ee578d7348c119a0d42af3dcf9eda96e3a247c", size = 2187516, upload-time = "2025-10-14T10:23:34.871Z" },
+    { url = "https://files.pythonhosted.org/packages/2e/0f/4f2734688d98488782218ca61bcc118329bf5de05bb7fe3adc7dd79b0b86/pydantic_core-2.41.4-pp311-pypy311_pp73-musllinux_1_1_aarch64.whl", hash = "sha256:26895a4268ae5a2849269f4991cdc97236e4b9c010e51137becf25182daac405", size = 2146146, upload-time = "2025-10-14T10:23:37.342Z" },
+    { url = "https://files.pythonhosted.org/packages/ed/f2/ab385dbd94a052c62224b99cf99002eee99dbec40e10006c78575aead256/pydantic_core-2.41.4-pp311-pypy311_pp73-musllinux_1_1_armv7l.whl", hash = "sha256:ca4df25762cf71308c446e33c9b1fdca2923a3f13de616e2a949f38bf21ff5a8", size = 2311296, upload-time = "2025-10-14T10:23:40.145Z" },
+    { url = "https://files.pythonhosted.org/packages/fc/8e/e4f12afe1beeb9823bba5375f8f258df0cc61b056b0195fb1cf9f62a1a58/pydantic_core-2.41.4-pp311-pypy311_pp73-musllinux_1_1_x86_64.whl", hash = "sha256:5a28fcedd762349519276c36634e71853b4541079cab4acaaac60c4421827308", size = 2315386, upload-time = "2025-10-14T10:23:42.624Z" },
+    { url = "https://files.pythonhosted.org/packages/48/f7/925f65d930802e3ea2eb4d5afa4cb8730c8dc0d2cb89a59dc4ed2fcb2d74/pydantic_core-2.41.4-pp311-pypy311_pp73-win_amd64.whl", hash = "sha256:c173ddcd86afd2535e2b695217e82191580663a1d1928239f877f5a1649ef39f", size = 2147775, upload-time = "2025-10-14T10:23:45.406Z" },
+]
+
+[[package]]
+name = "pydantic-settings"
+version = "2.11.0"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "pydantic" },
+    { name = "python-dotenv" },
+    { name = "typing-inspection" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/20/c5/dbbc27b814c71676593d1c3f718e6cd7d4f00652cefa24b75f7aa3efb25e/pydantic_settings-2.11.0.tar.gz", hash = "sha256:d0e87a1c7d33593beb7194adb8470fc426e95ba02af83a0f23474a04c9a08180", size = 188394, upload-time = "2025-09-24T14:19:11.764Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/83/d6/887a1ff844e64aa823fb4905978d882a633cfe295c32eacad582b78a7d8b/pydantic_settings-2.11.0-py3-none-any.whl", hash = "sha256:fe2cea3413b9530d10f3a5875adffb17ada5c1e1bab0b2885546d7310415207c", size = 48608, upload-time = "2025-09-24T14:19:10.015Z" },
+]
+
+[[package]]
+name = "pygments"
+version = "2.19.2"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/b0/77/a5b8c569bf593b0140bde72ea885a803b82086995367bf2037de0159d924/pygments-2.19.2.tar.gz", hash = "sha256:636cb2477cec7f8952536970bc533bc43743542f70392ae026374600add5b887", size = 4968631, upload-time = "2025-06-21T13:39:12.283Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/c7/21/705964c7812476f378728bdf590ca4b771ec72385c533964653c68e86bdc/pygments-2.19.2-py3-none-any.whl", hash = "sha256:86540386c03d588bb81d44bc3928634ff26449851e99741617ecb9037ee5ec0b", size = 1225217, upload-time = "2025-06-21T13:39:07.939Z" },
+]
+
+[[package]]
+name = "pytest"
+version = "8.4.2"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "colorama", marker = "sys_platform == 'win32'" },
+    { name = "iniconfig" },
+    { name = "packaging" },
+    { name = "pluggy" },
+    { name = "pygments" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/a3/5c/00a0e072241553e1a7496d638deababa67c5058571567b92a7eaa258397c/pytest-8.4.2.tar.gz", hash = "sha256:86c0d0b93306b961d58d62a4db4879f27fe25513d4b969df351abdddb3c30e01", size = 1519618, upload-time = "2025-09-04T14:34:22.711Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/a8/a4/20da314d277121d6534b3a980b29035dcd51e6744bd79075a6ce8fa4eb8d/pytest-8.4.2-py3-none-any.whl", hash = "sha256:872f880de3fc3a5bdc88a11b39c9710c3497a547cfa9320bc3c5e62fbf272e79", size = 365750, upload-time = "2025-09-04T14:34:20.226Z" },
+]
+
+[[package]]
+name = "pytest-cov"
+version = "7.0.0"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "coverage", extra = ["toml"] },
+    { name = "pluggy" },
+    { name = "pytest" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/5e/f7/c933acc76f5208b3b00089573cf6a2bc26dc80a8aece8f52bb7d6b1855ca/pytest_cov-7.0.0.tar.gz", hash = "sha256:33c97eda2e049a0c5298e91f519302a1334c26ac65c1a483d6206fd458361af1", size = 54328, upload-time = "2025-09-09T10:57:02.113Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/ee/49/1377b49de7d0c1ce41292161ea0f721913fa8722c19fb9c1e3aa0367eecb/pytest_cov-7.0.0-py3-none-any.whl", hash = "sha256:3b8e9558b16cc1479da72058bdecf8073661c7f57f7d3c5f22a1c23507f2d861", size = 22424, upload-time = "2025-09-09T10:57:00.695Z" },
+]
+
+[[package]]
+name = "pytest-mock"
+version = "3.15.1"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "pytest" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/68/14/eb014d26be205d38ad5ad20d9a80f7d201472e08167f0bb4361e251084a9/pytest_mock-3.15.1.tar.gz", hash = "sha256:1849a238f6f396da19762269de72cb1814ab44416fa73a8686deac10b0d87a0f", size = 34036, upload-time = "2025-09-16T16:37:27.081Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/5a/cc/06253936f4a7fa2e0f48dfe6d851d9c56df896a9ab09ac019d70b760619c/pytest_mock-3.15.1-py3-none-any.whl", hash = "sha256:0a25e2eb88fe5168d535041d09a4529a188176ae608a6d249ee65abc0949630d", size = 10095, upload-time = "2025-09-16T16:37:25.734Z" },
+]
+
+[[package]]
+name = "python-dateutil"
+version = "2.9.0.post0"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "six" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/66/c0/0c8b6ad9f17a802ee498c46e004a0eb49bc148f2fd230864601a86dcf6db/python-dateutil-2.9.0.post0.tar.gz", hash = "sha256:37dd54208da7e1cd875388217d5e00ebd4179249f90fb72437e91a35459a0ad3", size = 342432, upload-time = "2024-03-01T18:36:20.211Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/ec/57/56b9bcc3c9c6a792fcbaf139543cee77261f3651ca9da0c93f5c1221264b/python_dateutil-2.9.0.post0-py2.py3-none-any.whl", hash = "sha256:a8b2bc7bffae282281c8140a97d3aa9c14da0b136dfe83f850eea9a5f7470427", size = 229892, upload-time = "2024-03-01T18:36:18.57Z" },
+]
+
+[[package]]
+name = "python-dotenv"
+version = "1.1.1"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/f6/b0/4bc07ccd3572a2f9df7e6782f52b0c6c90dcbb803ac4a167702d7d0dfe1e/python_dotenv-1.1.1.tar.gz", hash = "sha256:a8a6399716257f45be6a007360200409fce5cda2661e3dec71d23dc15f6189ab", size = 41978, upload-time = "2025-06-24T04:21:07.341Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/5f/ed/539768cf28c661b5b068d66d96a2f155c4971a5d55684a514c1a0e0dec2f/python_dotenv-1.1.1-py3-none-any.whl", hash = "sha256:31f23644fe2602f88ff55e1f5c79ba497e01224ee7737937930c448e4d0e24dc", size = 20556, upload-time = "2025-06-24T04:21:06.073Z" },
+]
+
+[[package]]
+name = "pyyaml"
+version = "6.0.3"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/05/8e/961c0007c59b8dd7729d542c61a4d537767a59645b82a0b521206e1e25c2/pyyaml-6.0.3.tar.gz", hash = "sha256:d76623373421df22fb4cf8817020cbb7ef15c725b9d5e45f17e189bfc384190f", size = 130960, upload-time = "2025-09-25T21:33:16.546Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/6d/16/a95b6757765b7b031c9374925bb718d55e0a9ba8a1b6a12d25962ea44347/pyyaml-6.0.3-cp311-cp311-macosx_10_13_x86_64.whl", hash = "sha256:44edc647873928551a01e7a563d7452ccdebee747728c1080d881d68af7b997e", size = 185826, upload-time = "2025-09-25T21:31:58.655Z" },
+    { url = "https://files.pythonhosted.org/packages/16/19/13de8e4377ed53079ee996e1ab0a9c33ec2faf808a4647b7b4c0d46dd239/pyyaml-6.0.3-cp311-cp311-macosx_11_0_arm64.whl", hash = "sha256:652cb6edd41e718550aad172851962662ff2681490a8a711af6a4d288dd96824", size = 175577, upload-time = "2025-09-25T21:32:00.088Z" },
+    { url = "https://files.pythonhosted.org/packages/0c/62/d2eb46264d4b157dae1275b573017abec435397aa59cbcdab6fc978a8af4/pyyaml-6.0.3-cp311-cp311-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:10892704fc220243f5305762e276552a0395f7beb4dbf9b14ec8fd43b57f126c", size = 775556, upload-time = "2025-09-25T21:32:01.31Z" },
+    { url = "https://files.pythonhosted.org/packages/10/cb/16c3f2cf3266edd25aaa00d6c4350381c8b012ed6f5276675b9eba8d9ff4/pyyaml-6.0.3-cp311-cp311-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:850774a7879607d3a6f50d36d04f00ee69e7fc816450e5f7e58d7f17f1ae5c00", size = 882114, upload-time = "2025-09-25T21:32:03.376Z" },
+    { url = "https://files.pythonhosted.org/packages/71/60/917329f640924b18ff085ab889a11c763e0b573da888e8404ff486657602/pyyaml-6.0.3-cp311-cp311-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:b8bb0864c5a28024fac8a632c443c87c5aa6f215c0b126c449ae1a150412f31d", size = 806638, upload-time = "2025-09-25T21:32:04.553Z" },
+    { url = "https://files.pythonhosted.org/packages/dd/6f/529b0f316a9fd167281a6c3826b5583e6192dba792dd55e3203d3f8e655a/pyyaml-6.0.3-cp311-cp311-musllinux_1_2_aarch64.whl", hash = "sha256:1d37d57ad971609cf3c53ba6a7e365e40660e3be0e5175fa9f2365a379d6095a", size = 767463, upload-time = "2025-09-25T21:32:06.152Z" },
+    { url = "https://files.pythonhosted.org/packages/f2/6a/b627b4e0c1dd03718543519ffb2f1deea4a1e6d42fbab8021936a4d22589/pyyaml-6.0.3-cp311-cp311-musllinux_1_2_x86_64.whl", hash = "sha256:37503bfbfc9d2c40b344d06b2199cf0e96e97957ab1c1b546fd4f87e53e5d3e4", size = 794986, upload-time = "2025-09-25T21:32:07.367Z" },
+    { url = "https://files.pythonhosted.org/packages/45/91/47a6e1c42d9ee337c4839208f30d9f09caa9f720ec7582917b264defc875/pyyaml-6.0.3-cp311-cp311-win32.whl", hash = "sha256:8098f252adfa6c80ab48096053f512f2321f0b998f98150cea9bd23d83e1467b", size = 142543, upload-time = "2025-09-25T21:32:08.95Z" },
+    { url = "https://files.pythonhosted.org/packages/da/e3/ea007450a105ae919a72393cb06f122f288ef60bba2dc64b26e2646fa315/pyyaml-6.0.3-cp311-cp311-win_amd64.whl", hash = "sha256:9f3bfb4965eb874431221a3ff3fdcddc7e74e3b07799e0e84ca4a0f867d449bf", size = 158763, upload-time = "2025-09-25T21:32:09.96Z" },
+    { url = "https://files.pythonhosted.org/packages/d1/33/422b98d2195232ca1826284a76852ad5a86fe23e31b009c9886b2d0fb8b2/pyyaml-6.0.3-cp312-cp312-macosx_10_13_x86_64.whl", hash = "sha256:7f047e29dcae44602496db43be01ad42fc6f1cc0d8cd6c83d342306c32270196", size = 182063, upload-time = "2025-09-25T21:32:11.445Z" },
+    { url = "https://files.pythonhosted.org/packages/89/a0/6cf41a19a1f2f3feab0e9c0b74134aa2ce6849093d5517a0c550fe37a648/pyyaml-6.0.3-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:fc09d0aa354569bc501d4e787133afc08552722d3ab34836a80547331bb5d4a0", size = 173973, upload-time = "2025-09-25T21:32:12.492Z" },
+    { url = "https://files.pythonhosted.org/packages/ed/23/7a778b6bd0b9a8039df8b1b1d80e2e2ad78aa04171592c8a5c43a56a6af4/pyyaml-6.0.3-cp312-cp312-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:9149cad251584d5fb4981be1ecde53a1ca46c891a79788c0df828d2f166bda28", size = 775116, upload-time = "2025-09-25T21:32:13.652Z" },
+    { url = "https://files.pythonhosted.org/packages/65/30/d7353c338e12baef4ecc1b09e877c1970bd3382789c159b4f89d6a70dc09/pyyaml-6.0.3-cp312-cp312-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:5fdec68f91a0c6739b380c83b951e2c72ac0197ace422360e6d5a959d8d97b2c", size = 844011, upload-time = "2025-09-25T21:32:15.21Z" },
+    { url = "https://files.pythonhosted.org/packages/8b/9d/b3589d3877982d4f2329302ef98a8026e7f4443c765c46cfecc8858c6b4b/pyyaml-6.0.3-cp312-cp312-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:ba1cc08a7ccde2d2ec775841541641e4548226580ab850948cbfda66a1befcdc", size = 807870, upload-time = "2025-09-25T21:32:16.431Z" },
+    { url = "https://files.pythonhosted.org/packages/05/c0/b3be26a015601b822b97d9149ff8cb5ead58c66f981e04fedf4e762f4bd4/pyyaml-6.0.3-cp312-cp312-musllinux_1_2_aarch64.whl", hash = "sha256:8dc52c23056b9ddd46818a57b78404882310fb473d63f17b07d5c40421e47f8e", size = 761089, upload-time = "2025-09-25T21:32:17.56Z" },
+    { url = "https://files.pythonhosted.org/packages/be/8e/98435a21d1d4b46590d5459a22d88128103f8da4c2d4cb8f14f2a96504e1/pyyaml-6.0.3-cp312-cp312-musllinux_1_2_x86_64.whl", hash = "sha256:41715c910c881bc081f1e8872880d3c650acf13dfa8214bad49ed4cede7c34ea", size = 790181, upload-time = "2025-09-25T21:32:18.834Z" },
+    { url = "https://files.pythonhosted.org/packages/74/93/7baea19427dcfbe1e5a372d81473250b379f04b1bd3c4c5ff825e2327202/pyyaml-6.0.3-cp312-cp312-win32.whl", hash = "sha256:96b533f0e99f6579b3d4d4995707cf36df9100d67e0c8303a0c55b27b5f99bc5", size = 137658, upload-time = "2025-09-25T21:32:20.209Z" },
+    { url = "https://files.pythonhosted.org/packages/86/bf/899e81e4cce32febab4fb42bb97dcdf66bc135272882d1987881a4b519e9/pyyaml-6.0.3-cp312-cp312-win_amd64.whl", hash = "sha256:5fcd34e47f6e0b794d17de1b4ff496c00986e1c83f7ab2fb8fcfe9616ff7477b", size = 154003, upload-time = "2025-09-25T21:32:21.167Z" },
+    { url = "https://files.pythonhosted.org/packages/1a/08/67bd04656199bbb51dbed1439b7f27601dfb576fb864099c7ef0c3e55531/pyyaml-6.0.3-cp312-cp312-win_arm64.whl", hash = "sha256:64386e5e707d03a7e172c0701abfb7e10f0fb753ee1d773128192742712a98fd", size = 140344, upload-time = "2025-09-25T21:32:22.617Z" },
+    { url = "https://files.pythonhosted.org/packages/d1/11/0fd08f8192109f7169db964b5707a2f1e8b745d4e239b784a5a1dd80d1db/pyyaml-6.0.3-cp313-cp313-macosx_10_13_x86_64.whl", hash = "sha256:8da9669d359f02c0b91ccc01cac4a67f16afec0dac22c2ad09f46bee0697eba8", size = 181669, upload-time = "2025-09-25T21:32:23.673Z" },
+    { url = "https://files.pythonhosted.org/packages/b1/16/95309993f1d3748cd644e02e38b75d50cbc0d9561d21f390a76242ce073f/pyyaml-6.0.3-cp313-cp313-macosx_11_0_arm64.whl", hash = "sha256:2283a07e2c21a2aa78d9c4442724ec1eb15f5e42a723b99cb3d822d48f5f7ad1", size = 173252, upload-time = "2025-09-25T21:32:25.149Z" },
+    { url = "https://files.pythonhosted.org/packages/50/31/b20f376d3f810b9b2371e72ef5adb33879b25edb7a6d072cb7ca0c486398/pyyaml-6.0.3-cp313-cp313-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:ee2922902c45ae8ccada2c5b501ab86c36525b883eff4255313a253a3160861c", size = 767081, upload-time = "2025-09-25T21:32:26.575Z" },
+    { url = "https://files.pythonhosted.org/packages/49/1e/a55ca81e949270d5d4432fbbd19dfea5321eda7c41a849d443dc92fd1ff7/pyyaml-6.0.3-cp313-cp313-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:a33284e20b78bd4a18c8c2282d549d10bc8408a2a7ff57653c0cf0b9be0afce5", size = 841159, upload-time = "2025-09-25T21:32:27.727Z" },
+    { url = "https://files.pythonhosted.org/packages/74/27/e5b8f34d02d9995b80abcef563ea1f8b56d20134d8f4e5e81733b1feceb2/pyyaml-6.0.3-cp313-cp313-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:0f29edc409a6392443abf94b9cf89ce99889a1dd5376d94316ae5145dfedd5d6", size = 801626, upload-time = "2025-09-25T21:32:28.878Z" },
+    { url = "https://files.pythonhosted.org/packages/f9/11/ba845c23988798f40e52ba45f34849aa8a1f2d4af4b798588010792ebad6/pyyaml-6.0.3-cp313-cp313-musllinux_1_2_aarch64.whl", hash = "sha256:f7057c9a337546edc7973c0d3ba84ddcdf0daa14533c2065749c9075001090e6", size = 753613, upload-time = "2025-09-25T21:32:30.178Z" },
+    { url = "https://files.pythonhosted.org/packages/3d/e0/7966e1a7bfc0a45bf0a7fb6b98ea03fc9b8d84fa7f2229e9659680b69ee3/pyyaml-6.0.3-cp313-cp313-musllinux_1_2_x86_64.whl", hash = "sha256:eda16858a3cab07b80edaf74336ece1f986ba330fdb8ee0d6c0d68fe82bc96be", size = 794115, upload-time = "2025-09-25T21:32:31.353Z" },
+    { url = "https://files.pythonhosted.org/packages/de/94/980b50a6531b3019e45ddeada0626d45fa85cbe22300844a7983285bed3b/pyyaml-6.0.3-cp313-cp313-win32.whl", hash = "sha256:d0eae10f8159e8fdad514efdc92d74fd8d682c933a6dd088030f3834bc8e6b26", size = 137427, upload-time = "2025-09-25T21:32:32.58Z" },
+    { url = "https://files.pythonhosted.org/packages/97/c9/39d5b874e8b28845e4ec2202b5da735d0199dbe5b8fb85f91398814a9a46/pyyaml-6.0.3-cp313-cp313-win_amd64.whl", hash = "sha256:79005a0d97d5ddabfeeea4cf676af11e647e41d81c9a7722a193022accdb6b7c", size = 154090, upload-time = "2025-09-25T21:32:33.659Z" },
+    { url = "https://files.pythonhosted.org/packages/73/e8/2bdf3ca2090f68bb3d75b44da7bbc71843b19c9f2b9cb9b0f4ab7a5a4329/pyyaml-6.0.3-cp313-cp313-win_arm64.whl", hash = "sha256:5498cd1645aa724a7c71c8f378eb29ebe23da2fc0d7a08071d89469bf1d2defb", size = 140246, upload-time = "2025-09-25T21:32:34.663Z" },
+    { url = "https://files.pythonhosted.org/packages/9d/8c/f4bd7f6465179953d3ac9bc44ac1a8a3e6122cf8ada906b4f96c60172d43/pyyaml-6.0.3-cp314-cp314-macosx_10_13_x86_64.whl", hash = "sha256:8d1fab6bb153a416f9aeb4b8763bc0f22a5586065f86f7664fc23339fc1c1fac", size = 181814, upload-time = "2025-09-25T21:32:35.712Z" },
+    { url = "https://files.pythonhosted.org/packages/bd/9c/4d95bb87eb2063d20db7b60faa3840c1b18025517ae857371c4dd55a6b3a/pyyaml-6.0.3-cp314-cp314-macosx_11_0_arm64.whl", hash = "sha256:34d5fcd24b8445fadc33f9cf348c1047101756fd760b4dacb5c3e99755703310", size = 173809, upload-time = "2025-09-25T21:32:36.789Z" },
+    { url = "https://files.pythonhosted.org/packages/92/b5/47e807c2623074914e29dabd16cbbdd4bf5e9b2db9f8090fa64411fc5382/pyyaml-6.0.3-cp314-cp314-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:501a031947e3a9025ed4405a168e6ef5ae3126c59f90ce0cd6f2bfc477be31b7", size = 766454, upload-time = "2025-09-25T21:32:37.966Z" },
+    { url = "https://files.pythonhosted.org/packages/02/9e/e5e9b168be58564121efb3de6859c452fccde0ab093d8438905899a3a483/pyyaml-6.0.3-cp314-cp314-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:b3bc83488de33889877a0f2543ade9f70c67d66d9ebb4ac959502e12de895788", size = 836355, upload-time = "2025-09-25T21:32:39.178Z" },
+    { url = "https://files.pythonhosted.org/packages/88/f9/16491d7ed2a919954993e48aa941b200f38040928474c9e85ea9e64222c3/pyyaml-6.0.3-cp314-cp314-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:c458b6d084f9b935061bc36216e8a69a7e293a2f1e68bf956dcd9e6cbcd143f5", size = 794175, upload-time = "2025-09-25T21:32:40.865Z" },
+    { url = "https://files.pythonhosted.org/packages/dd/3f/5989debef34dc6397317802b527dbbafb2b4760878a53d4166579111411e/pyyaml-6.0.3-cp314-cp314-musllinux_1_2_aarch64.whl", hash = "sha256:7c6610def4f163542a622a73fb39f534f8c101d690126992300bf3207eab9764", size = 755228, upload-time = "2025-09-25T21:32:42.084Z" },
+    { url = "https://files.pythonhosted.org/packages/d7/ce/af88a49043cd2e265be63d083fc75b27b6ed062f5f9fd6cdc223ad62f03e/pyyaml-6.0.3-cp314-cp314-musllinux_1_2_x86_64.whl", hash = "sha256:5190d403f121660ce8d1d2c1bb2ef1bd05b5f68533fc5c2ea899bd15f4399b35", size = 789194, upload-time = "2025-09-25T21:32:43.362Z" },
+    { url = "https://files.pythonhosted.org/packages/23/20/bb6982b26a40bb43951265ba29d4c246ef0ff59c9fdcdf0ed04e0687de4d/pyyaml-6.0.3-cp314-cp314-win_amd64.whl", hash = "sha256:4a2e8cebe2ff6ab7d1050ecd59c25d4c8bd7e6f400f5f82b96557ac0abafd0ac", size = 156429, upload-time = "2025-09-25T21:32:57.844Z" },
+    { url = "https://files.pythonhosted.org/packages/f4/f4/a4541072bb9422c8a883ab55255f918fa378ecf083f5b85e87fc2b4eda1b/pyyaml-6.0.3-cp314-cp314-win_arm64.whl", hash = "sha256:93dda82c9c22deb0a405ea4dc5f2d0cda384168e466364dec6255b293923b2f3", size = 143912, upload-time = "2025-09-25T21:32:59.247Z" },
+    { url = "https://files.pythonhosted.org/packages/7c/f9/07dd09ae774e4616edf6cda684ee78f97777bdd15847253637a6f052a62f/pyyaml-6.0.3-cp314-cp314t-macosx_10_13_x86_64.whl", hash = "sha256:02893d100e99e03eda1c8fd5c441d8c60103fd175728e23e431db1b589cf5ab3", size = 189108, upload-time = "2025-09-25T21:32:44.377Z" },
+    { url = "https://files.pythonhosted.org/packages/4e/78/8d08c9fb7ce09ad8c38ad533c1191cf27f7ae1effe5bb9400a46d9437fcf/pyyaml-6.0.3-cp314-cp314t-macosx_11_0_arm64.whl", hash = "sha256:c1ff362665ae507275af2853520967820d9124984e0f7466736aea23d8611fba", size = 183641, upload-time = "2025-09-25T21:32:45.407Z" },
+    { url = "https://files.pythonhosted.org/packages/7b/5b/3babb19104a46945cf816d047db2788bcaf8c94527a805610b0289a01c6b/pyyaml-6.0.3-cp314-cp314t-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:6adc77889b628398debc7b65c073bcb99c4a0237b248cacaf3fe8a557563ef6c", size = 831901, upload-time = "2025-09-25T21:32:48.83Z" },
+    { url = "https://files.pythonhosted.org/packages/8b/cc/dff0684d8dc44da4d22a13f35f073d558c268780ce3c6ba1b87055bb0b87/pyyaml-6.0.3-cp314-cp314t-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:a80cb027f6b349846a3bf6d73b5e95e782175e52f22108cfa17876aaeff93702", size = 861132, upload-time = "2025-09-25T21:32:50.149Z" },
+    { url = "https://files.pythonhosted.org/packages/b1/5e/f77dc6b9036943e285ba76b49e118d9ea929885becb0a29ba8a7c75e29fe/pyyaml-6.0.3-cp314-cp314t-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:00c4bdeba853cc34e7dd471f16b4114f4162dc03e6b7afcc2128711f0eca823c", size = 839261, upload-time = "2025-09-25T21:32:51.808Z" },
+    { url = "https://files.pythonhosted.org/packages/ce/88/a9db1376aa2a228197c58b37302f284b5617f56a5d959fd1763fb1675ce6/pyyaml-6.0.3-cp314-cp314t-musllinux_1_2_aarch64.whl", hash = "sha256:66e1674c3ef6f541c35191caae2d429b967b99e02040f5ba928632d9a7f0f065", size = 805272, upload-time = "2025-09-25T21:32:52.941Z" },
+    { url = "https://files.pythonhosted.org/packages/da/92/1446574745d74df0c92e6aa4a7b0b3130706a4142b2d1a5869f2eaa423c6/pyyaml-6.0.3-cp314-cp314t-musllinux_1_2_x86_64.whl", hash = "sha256:16249ee61e95f858e83976573de0f5b2893b3677ba71c9dd36b9cf8be9ac6d65", size = 829923, upload-time = "2025-09-25T21:32:54.537Z" },
+    { url = "https://files.pythonhosted.org/packages/f0/7a/1c7270340330e575b92f397352af856a8c06f230aa3e76f86b39d01b416a/pyyaml-6.0.3-cp314-cp314t-win_amd64.whl", hash = "sha256:4ad1906908f2f5ae4e5a8ddfce73c320c2a1429ec52eafd27138b7f1cbe341c9", size = 174062, upload-time = "2025-09-25T21:32:55.767Z" },
+    { url = "https://files.pythonhosted.org/packages/f1/12/de94a39c2ef588c7e6455cfbe7343d3b2dc9d6b6b2f40c4c6565744c873d/pyyaml-6.0.3-cp314-cp314t-win_arm64.whl", hash = "sha256:ebc55a14a21cb14062aa4162f906cd962b28e2e9ea38f9b4391244cd8de4ae0b", size = 149341, upload-time = "2025-09-25T21:32:56.828Z" },
+]
+
+[[package]]
+name = "requests"
+version = "2.32.5"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "certifi" },
+    { name = "charset-normalizer" },
+    { name = "idna" },
+    { name = "urllib3" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/c9/74/b3ff8e6c8446842c3f5c837e9c3dfcfe2018ea6ecef224c710c85ef728f4/requests-2.32.5.tar.gz", hash = "sha256:dbba0bac56e100853db0ea71b82b4dfd5fe2bf6d3754a8893c3af500cec7d7cf", size = 134517, upload-time = "2025-08-18T20:46:02.573Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/1e/db/4254e3eabe8020b458f1a747140d32277ec7a271daf1d235b70dc0b4e6e3/requests-2.32.5-py3-none-any.whl", hash = "sha256:2462f94637a34fd532264295e186976db0f5d453d1cdd31473c85a6a161affb6", size = 64738, upload-time = "2025-08-18T20:46:00.542Z" },
+]
+
+[[package]]
+name = "rich"
+version = "14.2.0"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "markdown-it-py" },
+    { name = "pygments" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/fb/d2/8920e102050a0de7bfabeb4c4614a49248cf8d5d7a8d01885fbb24dc767a/rich-14.2.0.tar.gz", hash = "sha256:73ff50c7c0c1c77c8243079283f4edb376f0f6442433aecb8ce7e6d0b92d1fe4", size = 219990, upload-time = "2025-10-09T14:16:53.064Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/25/7a/b0178788f8dc6cafce37a212c99565fa1fe7872c70c6c9c1e1a372d9d88f/rich-14.2.0-py3-none-any.whl", hash = "sha256:76bc51fe2e57d2b1be1f96c524b890b816e334ab4c1e45888799bfaab0021edd", size = 243393, upload-time = "2025-10-09T14:16:51.245Z" },
+]
+
+[[package]]
+name = "rsa"
+version = "4.9.1"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "pyasn1" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/da/8a/22b7beea3ee0d44b1916c0c1cb0ee3af23b700b6da9f04991899d0c555d4/rsa-4.9.1.tar.gz", hash = "sha256:e7bdbfdb5497da4c07dfd35530e1a902659db6ff241e39d9953cad06ebd0ae75", size = 29034, upload-time = "2025-04-16T09:51:18.218Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/64/8d/0133e4eb4beed9e425d9a98ed6e081a55d195481b7632472be1af08d2f6b/rsa-4.9.1-py3-none-any.whl", hash = "sha256:68635866661c6836b8d39430f97a996acbd61bfa49406748ea243539fe239762", size = 34696, upload-time = "2025-04-16T09:51:17.142Z" },
+]
+
+[[package]]
+name = "ruff"
+version = "0.14.1"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/9e/58/6ca66896635352812de66f71cdf9ff86b3a4f79071ca5730088c0cd0fc8d/ruff-0.14.1.tar.gz", hash = "sha256:1dd86253060c4772867c61791588627320abcb6ed1577a90ef432ee319729b69", size = 5513429, upload-time = "2025-10-16T18:05:41.766Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/8d/39/9cc5ab181478d7a18adc1c1e051a84ee02bec94eb9bdfd35643d7c74ca31/ruff-0.14.1-py3-none-linux_armv6l.whl", hash = "sha256:083bfc1f30f4a391ae09c6f4f99d83074416b471775b59288956f5bc18e82f8b", size = 12445415, upload-time = "2025-10-16T18:04:48.227Z" },
+    { url = "https://files.pythonhosted.org/packages/ef/2e/1226961855ccd697255988f5a2474890ac7c5863b080b15bd038df820818/ruff-0.14.1-py3-none-macosx_10_12_x86_64.whl", hash = "sha256:f6fa757cd717f791009f7669fefb09121cc5f7d9bd0ef211371fad68c2b8b224", size = 12784267, upload-time = "2025-10-16T18:04:52.515Z" },
+    { url = "https://files.pythonhosted.org/packages/c1/ea/fd9e95863124ed159cd0667ec98449ae461de94acda7101f1acb6066da00/ruff-0.14.1-py3-none-macosx_11_0_arm64.whl", hash = "sha256:d6191903d39ac156921398e9c86b7354d15e3c93772e7dbf26c9fcae59ceccd5", size = 11781872, upload-time = "2025-10-16T18:04:55.396Z" },
+    { url = "https://files.pythonhosted.org/packages/1e/5a/e890f7338ff537dba4589a5e02c51baa63020acfb7c8cbbaea4831562c96/ruff-0.14.1-py3-none-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:ed04f0e04f7a4587244e5c9d7df50e6b5bf2705d75059f409a6421c593a35896", size = 12226558, upload-time = "2025-10-16T18:04:58.166Z" },
+    { url = "https://files.pythonhosted.org/packages/a6/7a/8ab5c3377f5bf31e167b73651841217542bcc7aa1c19e83030835cc25204/ruff-0.14.1-py3-none-manylinux_2_17_armv7l.manylinux2014_armv7l.whl", hash = "sha256:5c9e6cf6cd4acae0febbce29497accd3632fe2025c0c583c8b87e8dbdeae5f61", size = 12187898, upload-time = "2025-10-16T18:05:01.455Z" },
+    { url = "https://files.pythonhosted.org/packages/48/8d/ba7c33aa55406955fc124e62c8259791c3d42e3075a71710fdff9375134f/ruff-0.14.1-py3-none-manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:a6fa2458527794ecdfbe45f654e42c61f2503a230545a91af839653a0a93dbc6", size = 12939168, upload-time = "2025-10-16T18:05:04.397Z" },
+    { url = "https://files.pythonhosted.org/packages/b4/c2/70783f612b50f66d083380e68cbd1696739d88e9b4f6164230375532c637/ruff-0.14.1-py3-none-manylinux_2_17_ppc64.manylinux2014_ppc64.whl", hash = "sha256:39f1c392244e338b21d42ab29b8a6392a722c5090032eb49bb4d6defcdb34345", size = 14386942, upload-time = "2025-10-16T18:05:07.102Z" },
+    { url = "https://files.pythonhosted.org/packages/48/44/cd7abb9c776b66d332119d67f96acf15830d120f5b884598a36d9d3f4d83/ruff-0.14.1-py3-none-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:7382fa12a26cce1f95070ce450946bec357727aaa428983036362579eadcc5cf", size = 13990622, upload-time = "2025-10-16T18:05:09.882Z" },
+    { url = "https://files.pythonhosted.org/packages/eb/56/4259b696db12ac152fe472764b4f78bbdd9b477afd9bc3a6d53c01300b37/ruff-0.14.1-py3-none-manylinux_2_17_s390x.manylinux2014_s390x.whl", hash = "sha256:dd0bf2be3ae8521e1093a487c4aa3b455882f139787770698530d28ed3fbb37c", size = 13431143, upload-time = "2025-10-16T18:05:13.46Z" },
+    { url = "https://files.pythonhosted.org/packages/e0/35/266a80d0eb97bd224b3265b9437bd89dde0dcf4faf299db1212e81824e7e/ruff-0.14.1-py3-none-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:cabcaa9ccf8089fb4fdb78d17cc0e28241520f50f4c2e88cb6261ed083d85151", size = 13132844, upload-time = "2025-10-16T18:05:16.1Z" },
+    { url = "https://files.pythonhosted.org/packages/65/6e/d31ce218acc11a8d91ef208e002a31acf315061a85132f94f3df7a252b18/ruff-0.14.1-py3-none-manylinux_2_31_riscv64.whl", hash = "sha256:747d583400f6125ec11a4c14d1c8474bf75d8b419ad22a111a537ec1a952d192", size = 13401241, upload-time = "2025-10-16T18:05:19.395Z" },
+    { url = "https://files.pythonhosted.org/packages/9f/b5/dbc4221bf0b03774b3b2f0d47f39e848d30664157c15b965a14d890637d2/ruff-0.14.1-py3-none-musllinux_1_2_aarch64.whl", hash = "sha256:5a6e74c0efd78515a1d13acbfe6c90f0f5bd822aa56b4a6d43a9ffb2ae6e56cd", size = 12132476, upload-time = "2025-10-16T18:05:22.163Z" },
+    { url = "https://files.pythonhosted.org/packages/98/4b/ac99194e790ccd092d6a8b5f341f34b6e597d698e3077c032c502d75ea84/ruff-0.14.1-py3-none-musllinux_1_2_armv7l.whl", hash = "sha256:0ea6a864d2fb41a4b6d5b456ed164302a0d96f4daac630aeba829abfb059d020", size = 12139749, upload-time = "2025-10-16T18:05:25.162Z" },
+    { url = "https://files.pythonhosted.org/packages/47/26/7df917462c3bb5004e6fdfcc505a49e90bcd8a34c54a051953118c00b53a/ruff-0.14.1-py3-none-musllinux_1_2_i686.whl", hash = "sha256:0826b8764f94229604fa255918d1cc45e583e38c21c203248b0bfc9a0e930be5", size = 12544758, upload-time = "2025-10-16T18:05:28.018Z" },
+    { url = "https://files.pythonhosted.org/packages/64/d0/81e7f0648e9764ad9b51dd4be5e5dac3fcfff9602428ccbae288a39c2c22/ruff-0.14.1-py3-none-musllinux_1_2_x86_64.whl", hash = "sha256:cbc52160465913a1a3f424c81c62ac8096b6a491468e7d872cb9444a860bc33d", size = 13221811, upload-time = "2025-10-16T18:05:30.707Z" },
+    { url = "https://files.pythonhosted.org/packages/c3/07/3c45562c67933cc35f6d5df4ca77dabbcd88fddaca0d6b8371693d29fd56/ruff-0.14.1-py3-none-win32.whl", hash = "sha256:e037ea374aaaff4103240ae79168c0945ae3d5ae8db190603de3b4012bd1def6", size = 12319467, upload-time = "2025-10-16T18:05:33.261Z" },
+    { url = "https://files.pythonhosted.org/packages/02/88/0ee4ca507d4aa05f67e292d2e5eb0b3e358fbcfe527554a2eda9ac422d6b/ruff-0.14.1-py3-none-win_amd64.whl", hash = "sha256:59d599cdff9c7f925a017f6f2c256c908b094e55967f93f2821b1439928746a1", size = 13401123, upload-time = "2025-10-16T18:05:35.984Z" },
+    { url = "https://files.pythonhosted.org/packages/b8/81/4b6387be7014858d924b843530e1b2a8e531846807516e9bea2ee0936bf7/ruff-0.14.1-py3-none-win_arm64.whl", hash = "sha256:e3b443c4c9f16ae850906b8d0a707b2a4c16f8d2f0a7fe65c475c5886665ce44", size = 12436636, upload-time = "2025-10-16T18:05:38.995Z" },
+]
+
+[[package]]
+name = "shellingham"
+version = "1.5.4"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/58/15/8b3609fd3830ef7b27b655beb4b4e9c62313a4e8da8c676e142cc210d58e/shellingham-1.5.4.tar.gz", hash = "sha256:8dbca0739d487e5bd35ab3ca4b36e11c4078f3a234bfce294b0a0291363404de", size = 10310, upload-time = "2023-10-24T04:13:40.426Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/e0/f9/0595336914c5619e5f28a1fb793285925a8cd4b432c9da0a987836c7f822/shellingham-1.5.4-py2.py3-none-any.whl", hash = "sha256:7ecfff8f2fd72616f7481040475a65b2bf8af90a56c89140852d1120324e8686", size = 9755, upload-time = "2023-10-24T04:13:38.866Z" },
+]
+
+[[package]]
+name = "six"
+version = "1.17.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/94/e7/b2c673351809dca68a0e064b6af791aa332cf192da575fd474ed7d6f16a2/six-1.17.0.tar.gz", hash = "sha256:ff70335d468e7eb6ec65b95b99d3a2836546063f63acc5171de367e834932a81", size = 34031, upload-time = "2024-12-04T17:35:28.174Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/b7/ce/149a00dd41f10bc29e5921b496af8b574d8413afcd5e30dfa0ed46c2cc5e/six-1.17.0-py2.py3-none-any.whl", hash = "sha256:4721f391ed90541fddacab5acf947aa0d3dc7d27b2e1e8eda2be8970586c3274", size = 11050, upload-time = "2024-12-04T17:35:26.475Z" },
+]
+
+[[package]]
+name = "tomli"
+version = "2.3.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/52/ed/3f73f72945444548f33eba9a87fc7a6e969915e7b1acc8260b30e1f76a2f/tomli-2.3.0.tar.gz", hash = "sha256:64be704a875d2a59753d80ee8a533c3fe183e3f06807ff7dc2232938ccb01549", size = 17392, upload-time = "2025-10-08T22:01:47.119Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/b3/2e/299f62b401438d5fe1624119c723f5d877acc86a4c2492da405626665f12/tomli-2.3.0-cp311-cp311-macosx_10_9_x86_64.whl", hash = "sha256:88bd15eb972f3664f5ed4b57c1634a97153b4bac4479dcb6a495f41921eb7f45", size = 153236, upload-time = "2025-10-08T22:01:00.137Z" },
+    { url = "https://files.pythonhosted.org/packages/86/7f/d8fffe6a7aefdb61bced88fcb5e280cfd71e08939da5894161bd71bea022/tomli-2.3.0-cp311-cp311-macosx_11_0_arm64.whl", hash = "sha256:883b1c0d6398a6a9d29b508c331fa56adbcdff647f6ace4dfca0f50e90dfd0ba", size = 148084, upload-time = "2025-10-08T22:01:01.63Z" },
+    { url = "https://files.pythonhosted.org/packages/47/5c/24935fb6a2ee63e86d80e4d3b58b222dafaf438c416752c8b58537c8b89a/tomli-2.3.0-cp311-cp311-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:d1381caf13ab9f300e30dd8feadb3de072aeb86f1d34a8569453ff32a7dea4bf", size = 234832, upload-time = "2025-10-08T22:01:02.543Z" },
+    { url = "https://files.pythonhosted.org/packages/89/da/75dfd804fc11e6612846758a23f13271b76d577e299592b4371a4ca4cd09/tomli-2.3.0-cp311-cp311-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:a0e285d2649b78c0d9027570d4da3425bdb49830a6156121360b3f8511ea3441", size = 242052, upload-time = "2025-10-08T22:01:03.836Z" },
+    { url = "https://files.pythonhosted.org/packages/70/8c/f48ac899f7b3ca7eb13af73bacbc93aec37f9c954df3c08ad96991c8c373/tomli-2.3.0-cp311-cp311-musllinux_1_2_aarch64.whl", hash = "sha256:0a154a9ae14bfcf5d8917a59b51ffd5a3ac1fd149b71b47a3a104ca4edcfa845", size = 239555, upload-time = "2025-10-08T22:01:04.834Z" },
+    { url = "https://files.pythonhosted.org/packages/ba/28/72f8afd73f1d0e7829bfc093f4cb98ce0a40ffc0cc997009ee1ed94ba705/tomli-2.3.0-cp311-cp311-musllinux_1_2_x86_64.whl", hash = "sha256:74bf8464ff93e413514fefd2be591c3b0b23231a77f901db1eb30d6f712fc42c", size = 245128, upload-time = "2025-10-08T22:01:05.84Z" },
+    { url = "https://files.pythonhosted.org/packages/b6/eb/a7679c8ac85208706d27436e8d421dfa39d4c914dcf5fa8083a9305f58d9/tomli-2.3.0-cp311-cp311-win32.whl", hash = "sha256:00b5f5d95bbfc7d12f91ad8c593a1659b6387b43f054104cda404be6bda62456", size = 96445, upload-time = "2025-10-08T22:01:06.896Z" },
+    { url = "https://files.pythonhosted.org/packages/0a/fe/3d3420c4cb1ad9cb462fb52967080575f15898da97e21cb6f1361d505383/tomli-2.3.0-cp311-cp311-win_amd64.whl", hash = "sha256:4dc4ce8483a5d429ab602f111a93a6ab1ed425eae3122032db7e9acf449451be", size = 107165, upload-time = "2025-10-08T22:01:08.107Z" },
+    { url = "https://files.pythonhosted.org/packages/ff/b7/40f36368fcabc518bb11c8f06379a0fd631985046c038aca08c6d6a43c6e/tomli-2.3.0-cp312-cp312-macosx_10_13_x86_64.whl", hash = "sha256:d7d86942e56ded512a594786a5ba0a5e521d02529b3826e7761a05138341a2ac", size = 154891, upload-time = "2025-10-08T22:01:09.082Z" },
+    { url = "https://files.pythonhosted.org/packages/f9/3f/d9dd692199e3b3aab2e4e4dd948abd0f790d9ded8cd10cbaae276a898434/tomli-2.3.0-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:73ee0b47d4dad1c5e996e3cd33b8a76a50167ae5f96a2607cbe8cc773506ab22", size = 148796, upload-time = "2025-10-08T22:01:10.266Z" },
+    { url = "https://files.pythonhosted.org/packages/60/83/59bff4996c2cf9f9387a0f5a3394629c7efa5ef16142076a23a90f1955fa/tomli-2.3.0-cp312-cp312-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:792262b94d5d0a466afb5bc63c7daa9d75520110971ee269152083270998316f", size = 242121, upload-time = "2025-10-08T22:01:11.332Z" },
+    { url = "https://files.pythonhosted.org/packages/45/e5/7c5119ff39de8693d6baab6c0b6dcb556d192c165596e9fc231ea1052041/tomli-2.3.0-cp312-cp312-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:4f195fe57ecceac95a66a75ac24d9d5fbc98ef0962e09b2eddec5d39375aae52", size = 250070, upload-time = "2025-10-08T22:01:12.498Z" },
+    { url = "https://files.pythonhosted.org/packages/45/12/ad5126d3a278f27e6701abde51d342aa78d06e27ce2bb596a01f7709a5a2/tomli-2.3.0-cp312-cp312-musllinux_1_2_aarch64.whl", hash = "sha256:e31d432427dcbf4d86958c184b9bfd1e96b5b71f8eb17e6d02531f434fd335b8", size = 245859, upload-time = "2025-10-08T22:01:13.551Z" },
+    { url = "https://files.pythonhosted.org/packages/fb/a1/4d6865da6a71c603cfe6ad0e6556c73c76548557a8d658f9e3b142df245f/tomli-2.3.0-cp312-cp312-musllinux_1_2_x86_64.whl", hash = "sha256:7b0882799624980785240ab732537fcfc372601015c00f7fc367c55308c186f6", size = 250296, upload-time = "2025-10-08T22:01:14.614Z" },
+    { url = "https://files.pythonhosted.org/packages/a0/b7/a7a7042715d55c9ba6e8b196d65d2cb662578b4d8cd17d882d45322b0d78/tomli-2.3.0-cp312-cp312-win32.whl", hash = "sha256:ff72b71b5d10d22ecb084d345fc26f42b5143c5533db5e2eaba7d2d335358876", size = 97124, upload-time = "2025-10-08T22:01:15.629Z" },
+    { url = "https://files.pythonhosted.org/packages/06/1e/f22f100db15a68b520664eb3328fb0ae4e90530887928558112c8d1f4515/tomli-2.3.0-cp312-cp312-win_amd64.whl", hash = "sha256:1cb4ed918939151a03f33d4242ccd0aa5f11b3547d0cf30f7c74a408a5b99878", size = 107698, upload-time = "2025-10-08T22:01:16.51Z" },
+    { url = "https://files.pythonhosted.org/packages/89/48/06ee6eabe4fdd9ecd48bf488f4ac783844fd777f547b8d1b61c11939974e/tomli-2.3.0-cp313-cp313-macosx_10_13_x86_64.whl", hash = "sha256:5192f562738228945d7b13d4930baffda67b69425a7f0da96d360b0a3888136b", size = 154819, upload-time = "2025-10-08T22:01:17.964Z" },
+    { url = "https://files.pythonhosted.org/packages/f1/01/88793757d54d8937015c75dcdfb673c65471945f6be98e6a0410fba167ed/tomli-2.3.0-cp313-cp313-macosx_11_0_arm64.whl", hash = "sha256:be71c93a63d738597996be9528f4abe628d1adf5e6eb11607bc8fe1a510b5dae", size = 148766, upload-time = "2025-10-08T22:01:18.959Z" },
+    { url = "https://files.pythonhosted.org/packages/42/17/5e2c956f0144b812e7e107f94f1cc54af734eb17b5191c0bbfb72de5e93e/tomli-2.3.0-cp313-cp313-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:c4665508bcbac83a31ff8ab08f424b665200c0e1e645d2bd9ab3d3e557b6185b", size = 240771, upload-time = "2025-10-08T22:01:20.106Z" },
+    { url = "https://files.pythonhosted.org/packages/d5/f4/0fbd014909748706c01d16824eadb0307115f9562a15cbb012cd9b3512c5/tomli-2.3.0-cp313-cp313-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:4021923f97266babc6ccab9f5068642a0095faa0a51a246a6a02fccbb3514eaf", size = 248586, upload-time = "2025-10-08T22:01:21.164Z" },
+    { url = "https://files.pythonhosted.org/packages/30/77/fed85e114bde5e81ecf9bc5da0cc69f2914b38f4708c80ae67d0c10180c5/tomli-2.3.0-cp313-cp313-musllinux_1_2_aarch64.whl", hash = "sha256:a4ea38c40145a357d513bffad0ed869f13c1773716cf71ccaa83b0fa0cc4e42f", size = 244792, upload-time = "2025-10-08T22:01:22.417Z" },
+    { url = "https://files.pythonhosted.org/packages/55/92/afed3d497f7c186dc71e6ee6d4fcb0acfa5f7d0a1a2878f8beae379ae0cc/tomli-2.3.0-cp313-cp313-musllinux_1_2_x86_64.whl", hash = "sha256:ad805ea85eda330dbad64c7ea7a4556259665bdf9d2672f5dccc740eb9d3ca05", size = 248909, upload-time = "2025-10-08T22:01:23.859Z" },
+    { url = "https://files.pythonhosted.org/packages/f8/84/ef50c51b5a9472e7265ce1ffc7f24cd4023d289e109f669bdb1553f6a7c2/tomli-2.3.0-cp313-cp313-win32.whl", hash = "sha256:97d5eec30149fd3294270e889b4234023f2c69747e555a27bd708828353ab606", size = 96946, upload-time = "2025-10-08T22:01:24.893Z" },
+    { url = "https://files.pythonhosted.org/packages/b2/b7/718cd1da0884f281f95ccfa3a6cc572d30053cba64603f79d431d3c9b61b/tomli-2.3.0-cp313-cp313-win_amd64.whl", hash = "sha256:0c95ca56fbe89e065c6ead5b593ee64b84a26fca063b5d71a1122bf26e533999", size = 107705, upload-time = "2025-10-08T22:01:26.153Z" },
+    { url = "https://files.pythonhosted.org/packages/19/94/aeafa14a52e16163008060506fcb6aa1949d13548d13752171a755c65611/tomli-2.3.0-cp314-cp314-macosx_10_13_x86_64.whl", hash = "sha256:cebc6fe843e0733ee827a282aca4999b596241195f43b4cc371d64fc6639da9e", size = 154244, upload-time = "2025-10-08T22:01:27.06Z" },
+    { url = "https://files.pythonhosted.org/packages/db/e4/1e58409aa78eefa47ccd19779fc6f36787edbe7d4cd330eeeedb33a4515b/tomli-2.3.0-cp314-cp314-macosx_11_0_arm64.whl", hash = "sha256:4c2ef0244c75aba9355561272009d934953817c49f47d768070c3c94355c2aa3", size = 148637, upload-time = "2025-10-08T22:01:28.059Z" },
+    { url = "https://files.pythonhosted.org/packages/26/b6/d1eccb62f665e44359226811064596dd6a366ea1f985839c566cd61525ae/tomli-2.3.0-cp314-cp314-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:c22a8bf253bacc0cf11f35ad9808b6cb75ada2631c2d97c971122583b129afbc", size = 241925, upload-time = "2025-10-08T22:01:29.066Z" },
+    { url = "https://files.pythonhosted.org/packages/70/91/7cdab9a03e6d3d2bb11beae108da5bdc1c34bdeb06e21163482544ddcc90/tomli-2.3.0-cp314-cp314-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:0eea8cc5c5e9f89c9b90c4896a8deefc74f518db5927d0e0e8d4a80953d774d0", size = 249045, upload-time = "2025-10-08T22:01:31.98Z" },
+    { url = "https://files.pythonhosted.org/packages/15/1b/8c26874ed1f6e4f1fcfeb868db8a794cbe9f227299402db58cfcc858766c/tomli-2.3.0-cp314-cp314-musllinux_1_2_aarch64.whl", hash = "sha256:b74a0e59ec5d15127acdabd75ea17726ac4c5178ae51b85bfe39c4f8a278e879", size = 245835, upload-time = "2025-10-08T22:01:32.989Z" },
+    { url = "https://files.pythonhosted.org/packages/fd/42/8e3c6a9a4b1a1360c1a2a39f0b972cef2cc9ebd56025168c4137192a9321/tomli-2.3.0-cp314-cp314-musllinux_1_2_x86_64.whl", hash = "sha256:b5870b50c9db823c595983571d1296a6ff3e1b88f734a4c8f6fc6188397de005", size = 253109, upload-time = "2025-10-08T22:01:34.052Z" },
+    { url = "https://files.pythonhosted.org/packages/22/0c/b4da635000a71b5f80130937eeac12e686eefb376b8dee113b4a582bba42/tomli-2.3.0-cp314-cp314-win32.whl", hash = "sha256:feb0dacc61170ed7ab602d3d972a58f14ee3ee60494292d384649a3dc38ef463", size = 97930, upload-time = "2025-10-08T22:01:35.082Z" },
+    { url = "https://files.pythonhosted.org/packages/b9/74/cb1abc870a418ae99cd5c9547d6bce30701a954e0e721821df483ef7223c/tomli-2.3.0-cp314-cp314-win_amd64.whl", hash = "sha256:b273fcbd7fc64dc3600c098e39136522650c49bca95df2d11cf3b626422392c8", size = 107964, upload-time = "2025-10-08T22:01:36.057Z" },
+    { url = "https://files.pythonhosted.org/packages/54/78/5c46fff6432a712af9f792944f4fcd7067d8823157949f4e40c56b8b3c83/tomli-2.3.0-cp314-cp314t-macosx_10_13_x86_64.whl", hash = "sha256:940d56ee0410fa17ee1f12b817b37a4d4e4dc4d27340863cc67236c74f582e77", size = 163065, upload-time = "2025-10-08T22:01:37.27Z" },
+    { url = "https://files.pythonhosted.org/packages/39/67/f85d9bd23182f45eca8939cd2bc7050e1f90c41f4a2ecbbd5963a1d1c486/tomli-2.3.0-cp314-cp314t-macosx_11_0_arm64.whl", hash = "sha256:f85209946d1fe94416debbb88d00eb92ce9cd5266775424ff81bc959e001acaf", size = 159088, upload-time = "2025-10-08T22:01:38.235Z" },
+    { url = "https://files.pythonhosted.org/packages/26/5a/4b546a0405b9cc0659b399f12b6adb750757baf04250b148d3c5059fc4eb/tomli-2.3.0-cp314-cp314t-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:a56212bdcce682e56b0aaf79e869ba5d15a6163f88d5451cbde388d48b13f530", size = 268193, upload-time = "2025-10-08T22:01:39.712Z" },
+    { url = "https://files.pythonhosted.org/packages/42/4f/2c12a72ae22cf7b59a7fe75b3465b7aba40ea9145d026ba41cb382075b0e/tomli-2.3.0-cp314-cp314t-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:c5f3ffd1e098dfc032d4d3af5c0ac64f6d286d98bc148698356847b80fa4de1b", size = 275488, upload-time = "2025-10-08T22:01:40.773Z" },
+    { url = "https://files.pythonhosted.org/packages/92/04/a038d65dbe160c3aa5a624e93ad98111090f6804027d474ba9c37c8ae186/tomli-2.3.0-cp314-cp314t-musllinux_1_2_aarch64.whl", hash = "sha256:5e01decd096b1530d97d5d85cb4dff4af2d8347bd35686654a004f8dea20fc67", size = 272669, upload-time = "2025-10-08T22:01:41.824Z" },
+    { url = "https://files.pythonhosted.org/packages/be/2f/8b7c60a9d1612a7cbc39ffcca4f21a73bf368a80fc25bccf8253e2563267/tomli-2.3.0-cp314-cp314t-musllinux_1_2_x86_64.whl", hash = "sha256:8a35dd0e643bb2610f156cca8db95d213a90015c11fee76c946aa62b7ae7e02f", size = 279709, upload-time = "2025-10-08T22:01:43.177Z" },
+    { url = "https://files.pythonhosted.org/packages/7e/46/cc36c679f09f27ded940281c38607716c86cf8ba4a518d524e349c8b4874/tomli-2.3.0-cp314-cp314t-win32.whl", hash = "sha256:a1f7f282fe248311650081faafa5f4732bdbfef5d45fe3f2e702fbc6f2d496e0", size = 107563, upload-time = "2025-10-08T22:01:44.233Z" },
+    { url = "https://files.pythonhosted.org/packages/84/ff/426ca8683cf7b753614480484f6437f568fd2fda2edbdf57a2d3d8b27a0b/tomli-2.3.0-cp314-cp314t-win_amd64.whl", hash = "sha256:70a251f8d4ba2d9ac2542eecf008b3c8a9fc5c3f9f02c56a9d7952612be2fdba", size = 119756, upload-time = "2025-10-08T22:01:45.234Z" },
+    { url = "https://files.pythonhosted.org/packages/77/b8/0135fadc89e73be292b473cb820b4f5a08197779206b33191e801feeae40/tomli-2.3.0-py3-none-any.whl", hash = "sha256:e95b1af3c5b07d9e643909b5abbec77cd9f1217e6d0bca72b0234736b9fb1f1b", size = 14408, upload-time = "2025-10-08T22:01:46.04Z" },
+]
+
+[[package]]
+name = "tqdm"
+version = "4.67.1"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "colorama", marker = "sys_platform == 'win32'" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/a8/4b/29b4ef32e036bb34e4ab51796dd745cdba7ed47ad142a9f4a1eb8e0c744d/tqdm-4.67.1.tar.gz", hash = "sha256:f8aef9c52c08c13a65f30ea34f4e5aac3fd1a34959879d7e59e63027286627f2", size = 169737, upload-time = "2024-11-24T20:12:22.481Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/d0/30/dc54f88dd4a2b5dc8a0279bdd7270e735851848b762aeb1c1184ed1f6b14/tqdm-4.67.1-py3-none-any.whl", hash = "sha256:26445eca388f82e72884e0d580d5464cd801a3ea01e63e5601bdff9ba6a48de2", size = 78540, upload-time = "2024-11-24T20:12:19.698Z" },
+]
+
+[[package]]
+name = "ty"
+version = "0.0.1a23"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/5f/98/e9c6cc74e7f81d49f1c06db3a455a5bff6d9e47b73408d053e81daef77fb/ty-0.0.1a23.tar.gz", hash = "sha256:d3b4a81b47f306f571fd99bc71a4fa5607eae61079a18e77fadcf8401b19a6c9", size = 4360335, upload-time = "2025-10-16T18:18:59.475Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/9c/45/d662cd4c0c5f6254c4ff0d05edad9cbbac23e01bb277602eaed276bb53ba/ty-0.0.1a23-py3-none-linux_armv6l.whl", hash = "sha256:7c76debd57623ac8712a9d2a32529a2b98915434aa3521cab92318bfe3f34dfc", size = 8735928, upload-time = "2025-10-16T18:18:23.161Z" },
+    { url = "https://files.pythonhosted.org/packages/db/89/8aa7c303a55181fc121ecce143464a156b51f03481607ef0f58f67dc936c/ty-0.0.1a23-py3-none-macosx_10_12_x86_64.whl", hash = "sha256:1d9b63c72cb94bcfe8f36b4527fd18abc46bdecc8f774001bcf7a8dd83e8c81a", size = 8584084, upload-time = "2025-10-16T18:18:25.579Z" },
+    { url = "https://files.pythonhosted.org/packages/02/43/7a3bec50f440028153c0ee0044fd47e409372d41012f5f6073103a90beac/ty-0.0.1a23-py3-none-macosx_11_0_arm64.whl", hash = "sha256:1a875135cdb77b60280eb74d3c97ce3c44f872bf4176f5e71602a0a9401341ca", size = 8061268, upload-time = "2025-10-16T18:18:27.668Z" },
+    { url = "https://files.pythonhosted.org/packages/7c/c2/75ddb10084cc7da8de077ae09fe5d8d76fec977c2ab71929c21b6fea622f/ty-0.0.1a23-py3-none-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:9ddf5f4d057a023409a926e3be5ba0388aa8c93a01ddc6c87cca03af22c78a0c", size = 8319954, upload-time = "2025-10-16T18:18:29.54Z" },
+    { url = "https://files.pythonhosted.org/packages/b2/57/0762763e9a29a1bd393b804a950c03d9ceb18aaf5e5baa7122afc50c2387/ty-0.0.1a23-py3-none-manylinux_2_17_armv7l.manylinux2014_armv7l.whl", hash = "sha256:ad89d894ef414d5607c3611ab68298581a444fd51570e0e4facdd7c8e8856748", size = 8550745, upload-time = "2025-10-16T18:18:31.548Z" },
+    { url = "https://files.pythonhosted.org/packages/89/0a/855ca77e454955acddba2149ad7fe20fd24946289b8fd1d66b025b2afef1/ty-0.0.1a23-py3-none-manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:6306ad146748390675871b0c7731e595ceb2241724bc7d2d46e56f392949fbb9", size = 8899930, upload-time = "2025-10-16T18:18:34.003Z" },
+    { url = "https://files.pythonhosted.org/packages/ad/f0/9282da70da435d1890c5b1dff844a3139fc520d0a61747bb1e84fbf311d5/ty-0.0.1a23-py3-none-manylinux_2_17_ppc64.manylinux2014_ppc64.whl", hash = "sha256:fa2155c0a66faeb515b88d7dc6b9f3fb393373798e97c01f05b1436c60d2c6b1", size = 9561714, upload-time = "2025-10-16T18:18:36.238Z" },
+    { url = "https://files.pythonhosted.org/packages/b8/95/ffea2138629875a2083ccc64cc80585ecf0e487500835fe7c1b6f6305bf8/ty-0.0.1a23-py3-none-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:d7d75d1f264afbe9a294d88e1e7736c003567a74f3a433c72231c36999a61e42", size = 9231064, upload-time = "2025-10-16T18:18:38.877Z" },
+    { url = "https://files.pythonhosted.org/packages/ff/92/dac340d2d10e81788801e7580bad0168b190ba5a5c6cf6e4f798e094ee80/ty-0.0.1a23-py3-none-manylinux_2_17_s390x.manylinux2014_s390x.whl", hash = "sha256:af8eb2341e804f8e1748b6d638a314102020dca5591cacae67fe420211d59369", size = 9428468, upload-time = "2025-10-16T18:18:40.984Z" },
+    { url = "https://files.pythonhosted.org/packages/37/21/d376393ecaf26cb84aa475f46137a59ae6d50508acbf1a044d414d8f6d47/ty-0.0.1a23-py3-none-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:e7516ee783ba3eba373fb82db8b989a14ed8620a45a9bb6e3a90571bc83b3e2a", size = 8880687, upload-time = "2025-10-16T18:18:43.34Z" },
+    { url = "https://files.pythonhosted.org/packages/fd/f4/7cf58a02e0a8d062dd20d7816396587faba9ddfe4098ee88bb6ee3c272d4/ty-0.0.1a23-py3-none-musllinux_1_2_aarch64.whl", hash = "sha256:6c8f9a861b51bbcf10f35d134a3c568a79a3acd3b0f2f1c004a2ccb00efdf7c1", size = 8281532, upload-time = "2025-10-16T18:18:45.806Z" },
+    { url = "https://files.pythonhosted.org/packages/14/1b/ae616bbc4588b50ff1875588e734572a2b00102415e131bc20d794827865/ty-0.0.1a23-py3-none-musllinux_1_2_armv7l.whl", hash = "sha256:d44a7ca68f4e79e7f06f23793397edfa28c2ac38e1330bf7100dce93015e412a", size = 8579585, upload-time = "2025-10-16T18:18:47.638Z" },
+    { url = "https://files.pythonhosted.org/packages/b5/0c/3f4fc4721eb34abd7d86b43958b741b73727c9003f9977bacc3c91b3d7ca/ty-0.0.1a23-py3-none-musllinux_1_2_i686.whl", hash = "sha256:80a6818b22b25a27d5761a3cf377784f07d7a799f24b3ebcf9b4144b35b88871", size = 8675719, upload-time = "2025-10-16T18:18:49.536Z" },
+    { url = "https://files.pythonhosted.org/packages/60/36/07d2c4e0230407419c10d3aa7c5035e023d9f70f07f4da2266fa0108109c/ty-0.0.1a23-py3-none-musllinux_1_2_x86_64.whl", hash = "sha256:ef52c927ed6b5ebec290332ded02ce49ffdb3576683920b7013a7b2cd6bd5685", size = 8978349, upload-time = "2025-10-16T18:18:51.299Z" },
+    { url = "https://files.pythonhosted.org/packages/7b/f9/abf666971434ea259a8d2006d2943eac0727a14aeccd24359341d377c2d1/ty-0.0.1a23-py3-none-win32.whl", hash = "sha256:0cc7500131a6a533d4000401026427cd538e33fda4e9004d7ad0db5a6f5500b1", size = 8279664, upload-time = "2025-10-16T18:18:53.132Z" },
+    { url = "https://files.pythonhosted.org/packages/c6/3d/cb99e90adba6296f260ceaf3d02cc20563ec623b23a92ab94d17791cb537/ty-0.0.1a23-py3-none-win_amd64.whl", hash = "sha256:c89564e90dcc2f9564564d4a02cd703ed71cd9ccbb5a6a38ee49c44d86375f24", size = 8912398, upload-time = "2025-10-16T18:18:55.585Z" },
+    { url = "https://files.pythonhosted.org/packages/77/33/9fffb57f66317082fe3de4d08bb71557105c47676a114bdc9d52f6d3a910/ty-0.0.1a23-py3-none-win_arm64.whl", hash = "sha256:71aa203d6ae4de863a7f4626a8fe5f723beaa219988d176a6667f021b78a2af3", size = 8400343, upload-time = "2025-10-16T18:18:57.387Z" },
+]
+
+[[package]]
+name = "typeguard"
+version = "4.4.4"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "typing-extensions" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/c7/68/71c1a15b5f65f40e91b65da23b8224dad41349894535a97f63a52e462196/typeguard-4.4.4.tar.gz", hash = "sha256:3a7fd2dffb705d4d0efaed4306a704c89b9dee850b688f060a8b1615a79e5f74", size = 75203, upload-time = "2025-06-18T09:56:07.624Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/1b/a9/e3aee762739c1d7528da1c3e06d518503f8b6c439c35549b53735ba52ead/typeguard-4.4.4-py3-none-any.whl", hash = "sha256:b5f562281b6bfa1f5492470464730ef001646128b180769880468bd84b68b09e", size = 34874, upload-time = "2025-06-18T09:56:05.999Z" },
+]
+
+[[package]]
+name = "typer"
+version = "0.19.2"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "click" },
+    { name = "rich" },
+    { name = "shellingham" },
+    { name = "typing-extensions" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/21/ca/950278884e2ca20547ff3eb109478c6baf6b8cf219318e6bc4f666fad8e8/typer-0.19.2.tar.gz", hash = "sha256:9ad824308ded0ad06cc716434705f691d4ee0bfd0fb081839d2e426860e7fdca", size = 104755, upload-time = "2025-09-23T09:47:48.256Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/00/22/35617eee79080a5d071d0f14ad698d325ee6b3bf824fc0467c03b30e7fa8/typer-0.19.2-py3-none-any.whl", hash = "sha256:755e7e19670ffad8283db353267cb81ef252f595aa6834a0d1ca9312d9326cb9", size = 46748, upload-time = "2025-09-23T09:47:46.777Z" },
+]
+
+[[package]]
+name = "typing-extensions"
+version = "4.15.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/72/94/1a15dd82efb362ac84269196e94cf00f187f7ed21c242792a923cdb1c61f/typing_extensions-4.15.0.tar.gz", hash = "sha256:0cea48d173cc12fa28ecabc3b837ea3cf6f38c6d1136f85cbaaf598984861466", size = 109391, upload-time = "2025-08-25T13:49:26.313Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/18/67/36e9267722cc04a6b9f15c7f3441c2363321a3ea07da7ae0c0707beb2a9c/typing_extensions-4.15.0-py3-none-any.whl", hash = "sha256:f0fa19c6845758ab08074a0cfa8b7aecb71c999ca73d62883bc25cc018c4e548", size = 44614, upload-time = "2025-08-25T13:49:24.86Z" },
+]
+
+[[package]]
+name = "typing-inspect"
+version = "0.9.0"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "mypy-extensions" },
+    { name = "typing-extensions" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/dc/74/1789779d91f1961fa9438e9a8710cdae6bd138c80d7303996933d117264a/typing_inspect-0.9.0.tar.gz", hash = "sha256:b23fc42ff6f6ef6954e4852c1fb512cdd18dbea03134f91f856a95ccc9461f78", size = 13825, upload-time = "2023-05-24T20:25:47.612Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/65/f3/107a22063bf27bdccf2024833d3445f4eea42b2e598abfbd46f6a63b6cb0/typing_inspect-0.9.0-py3-none-any.whl", hash = "sha256:9ee6fc59062311ef8547596ab6b955e1b8aa46242d854bfc78f4f6b0eff35f9f", size = 8827, upload-time = "2023-05-24T20:25:45.287Z" },
+]
+
+[[package]]
+name = "typing-inspection"
+version = "0.4.2"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "typing-extensions" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/55/e3/70399cb7dd41c10ac53367ae42139cf4b1ca5f36bb3dc6c9d33acdb43655/typing_inspection-0.4.2.tar.gz", hash = "sha256:ba561c48a67c5958007083d386c3295464928b01faa735ab8547c5692e87f464", size = 75949, upload-time = "2025-10-01T02:14:41.687Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/dc/9b/47798a6c91d8bdb567fe2698fe81e0c6b7cb7ef4d13da4114b41d239f65d/typing_inspection-0.4.2-py3-none-any.whl", hash = "sha256:4ed1cacbdc298c220f1bd249ed5287caa16f34d44ef4e9c3d0cbad5b521545e7", size = 14611, upload-time = "2025-10-01T02:14:40.154Z" },
+]
+
+[[package]]
+name = "urllib3"
+version = "2.5.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/15/22/9ee70a2574a4f4599c47dd506532914ce044817c7752a79b6a51286319bc/urllib3-2.5.0.tar.gz", hash = "sha256:3fc47733c7e419d4bc3f6b3dc2b4f890bb743906a30d56ba4a5bfa4bbff92760", size = 393185, upload-time = "2025-06-18T14:07:41.644Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/a7/c2/fe1e52489ae3122415c51f387e221dd0773709bad6c6cdaa599e8a2c5185/urllib3-2.5.0-py3-none-any.whl", hash = "sha256:e6b01673c0fa6a13e374b50871808eb3bf7046c4b125b216f6bf1cc604cff0dc", size = 129795, upload-time = "2025-06-18T14:07:40.39Z" },
+]
+
+[[package]]
+name = "virtualenv"
+version = "20.35.3"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "distlib" },
+    { name = "filelock" },
+    { name = "platformdirs" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/a4/d5/b0ccd381d55c8f45d46f77df6ae59fbc23d19e901e2d523395598e5f4c93/virtualenv-20.35.3.tar.gz", hash = "sha256:4f1a845d131133bdff10590489610c98c168ff99dc75d6c96853801f7f67af44", size = 6002907, upload-time = "2025-10-10T21:23:33.178Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/27/73/d9a94da0e9d470a543c1b9d3ccbceb0f59455983088e727b8a1824ed90fb/virtualenv-20.35.3-py3-none-any.whl", hash = "sha256:63d106565078d8c8d0b206d48080f938a8b25361e19432d2c9db40d2899c810a", size = 5981061, upload-time = "2025-10-10T21:23:30.433Z" },
+]
+
+[[package]]
+name = "win32-setctime"
+version = "1.2.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/b3/8f/705086c9d734d3b663af0e9bb3d4de6578d08f46b1b101c2442fd9aecaa2/win32_setctime-1.2.0.tar.gz", hash = "sha256:ae1fdf948f5640aae05c511ade119313fb6a30d7eabe25fef9764dca5873c4c0", size = 4867, upload-time = "2024-12-07T15:28:28.314Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/e1/07/c6fe3ad3e685340704d314d765b7912993bcb8dc198f0e7a89382d37974b/win32_setctime-1.2.0-py3-none-any.whl", hash = "sha256:95d644c4e708aba81dc3704a116d8cbc974d70b3bdb8be1d150e36be6e9d1390", size = 4083, upload-time = "2024-12-07T15:28:26.465Z" },
+]
diff --git a/config.yml b/config.yml
index abb9128..bb71b4d 100644
--- a/config.yml
+++ b/config.yml
@@ -8,6 +8,3 @@ default:
 
 production:
     data_root: "/home/rstudio/data"
-
-cloud-run:
-    data_root: "/workspace/data"
diff --git a/scripts/R/run_pipeline.R b/scripts/R/run_pipeline.R
index 5c161da..09408b3 100644
--- a/scripts/R/run_pipeline.R
+++ b/scripts/R/run_pipeline.R
@@ -31,19 +31,21 @@ upload_data <- function(bucket, data_dir) {
     print("Finished uploading data to GCP Storage")
 }
 
-ingest_data <- function(project_id, cluster_fields, dataset, table, source) {
-    print("Deleting old table in GCP Big Query")
-    command <- paste(
-        "bq rm",
-        "-f",
-        "-t",
-        paste0(project_id, ":", dataset, ".", table)
-    )
-    cat(command)
-    exit_code <- system(command)
-    if (exit_code != 0) {
-        paste("Error while executing", command)
-        stop("Error during ingesting data")
+ingest_data <- function(project_id, cluster_fields, dataset, table, source, delete=T) {
+    if (delete) {
+        print("Deleting old table in GCP Big Query")
+        command <- paste(
+            "bq rm",
+            "-f",
+            "-t",
+            paste0(project_id, ":", dataset, ".", table)
+        )
+        cat(command)
+        exit_code <- system(command)
+        if (exit_code != 0) {
+            paste("Error while executing", command)
+            stop("Error during ingesting data")
+        }
     }
 
     print("Ingesting data to GCP Big Query")
diff --git a/scripts/gcp/deploy.sh b/scripts/gcp/deploy.sh
index 5d86027..ffa5542 100755
--- a/scripts/gcp/deploy.sh
+++ b/scripts/gcp/deploy.sh
@@ -1,6 +1,9 @@
 #!/bin/bash
 # Build the Docker image, push it to Artifact Registry, and deploy the A4D
-# pipeline as a Cloud Run Job that can be triggered manually.
+# Python pipeline as a Cloud Run Job that can be triggered manually.
+#
+# The Docker image is built from the repo root (to include reference_data/)
+# using a4d-python/Dockerfile as the build file.
 #
 # Prerequisites:
 #   - gcloud CLI authenticated with sufficient permissions
@@ -10,11 +13,11 @@
 #       roles/storage.objectCreator      (write output files to GCS)
 #       roles/bigquery.dataEditor        (write tables to BigQuery)
 #       roles/bigquery.jobUser           (run BigQuery load jobs)
-#       roles/secretmanager.secretAccessor (access the SA key secret)
-#   - Secret "a4d-gcp-sa" created in Secret Manager containing the service
-#     account JSON key used to authenticate googlesheets4/googledrive
 #
-# Usage:
+#   Authentication inside the container uses Workload Identity / ADC via the
+#   Cloud Run service account — no JSON key file is required.
+#
+# Usage (run from the repo root):
 #   PROJECT_ID=my-project SERVICE_ACCOUNT=sa@my-project.iam.gserviceaccount.com \
 #     bash scripts/gcp/deploy.sh
 #
@@ -43,7 +46,12 @@ gcloud artifacts repositories create "${REPOSITORY}" \
     --quiet 2>/dev/null || true
 
 echo "==> Building Docker image: ${IMAGE_URI}"
-docker build --cache-from "${IMAGE_URI}" -t "${IMAGE_URI}" .
+# Build context is the repo root so that reference_data/ can be copied into the image.
+docker build \
+    --cache-from "${IMAGE_URI}" \
+    -f a4d-python/Dockerfile \
+    -t "${IMAGE_URI}" \
+    .
 
 echo "==> Pushing Docker image to Artifact Registry..."
 docker push "${IMAGE_URI}"
@@ -58,7 +66,7 @@ gcloud run jobs deploy "${JOB_NAME}" \
     --cpu=4 \
     --max-retries=0 \
     --task-timeout=3h \
-    --set-secrets="/workspace/secrets/a4d-gcp-sa.json=a4d-gcp-sa:latest"
+    --set-env-vars="A4D_PROJECT_ID=${PROJECT_ID},A4D_ENVIRONMENT=production,A4D_DATA_ROOT=/workspace/data"
 
 echo ""
 echo "==> Deployment complete."
@@ -66,3 +74,4 @@ echo ""
 echo "To run the pipeline manually, execute:"
 echo "  gcloud run jobs execute ${JOB_NAME} \\"
 echo "    --region=${REGION} --project=${PROJECT_ID} --wait"
+

From c488a8c95646b10a15791549e6dbed832288a36c Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Tue, 24 Feb 2026 23:59:42 +0000
Subject: [PATCH 4/6] Fix PR diff: sync migration branch files, leaving only
 the 4 new deployment files

Co-authored-by: pmayd <9614291+pmayd@users.noreply.github.com>
---
 .github/workflows/python-ci.yml               |  52 +++++
 .gitignore                                    |   8 +-
 .vscode/settings.json                         |   9 +
 CLAUDE.md                                     |  61 ++++++
 R/script2_helper_patient_data_fix.R           |   9 +
 reference_data/synonyms/synonyms_patient.yaml |   1 +
 reference_data/validation_rules.yaml          | 138 +++++++++++++
 test_full_pipeline_debug.R                    | 181 ++++++++++++++++++
 8 files changed, 458 insertions(+), 1 deletion(-)
 create mode 100644 .github/workflows/python-ci.yml
 create mode 100644 .vscode/settings.json
 create mode 100644 CLAUDE.md
 create mode 100644 reference_data/validation_rules.yaml
 create mode 100644 test_full_pipeline_debug.R

diff --git a/.github/workflows/python-ci.yml b/.github/workflows/python-ci.yml
new file mode 100644
index 0000000..3048080
--- /dev/null
+++ b/.github/workflows/python-ci.yml
@@ -0,0 +1,52 @@
+name: Python CI
+
+on:
+  push:
+    branches: [migration]
+    paths:
+      - 'a4d-python/**'
+      - '.github/workflows/python-ci.yml'
+  pull_request:
+    branches: [main, develop, migration]
+    paths:
+      - 'a4d-python/**'
+      - '.github/workflows/python-ci.yml'
+
+jobs:
+  test:
+    runs-on: ubuntu-latest
+    defaults:
+      run:
+        working-directory: a4d-python
+
+    steps:
+    - uses: actions/checkout@v4
+
+    - name: Install uv
+      uses: astral-sh/setup-uv@v2
+      with:
+        enable-cache: true
+
+    - name: Set up Python
+      run: uv python install 3.11
+
+    - name: Install dependencies
+      run: uv sync --all-extras
+
+    - name: Run ruff linting
+      run: uv run ruff check .
+
+    - name: Run ruff formatting check
+      run: uv run ruff format --check .
+
+    - name: Run type checking with ty
+      run: uv run ty check src/
+
+    - name: Run tests
+      run: uv run pytest --cov --cov-report=xml
+
+    - name: Upload coverage
+      uses: codecov/codecov-action@v3
+      with:
+        files: ./a4d-python/coverage.xml
+        flags: python
diff --git a/.gitignore b/.gitignore
index 0791f1a..f682ea3 100644
--- a/.gitignore
+++ b/.gitignore
@@ -10,4 +10,10 @@
 rsconnect
 
 data/output
-data/mapping_table.csv
\ No newline at end of file
+data/mapping_table.csv
+
+# Serena (MCP server state)
+.serena/
+
+# Secrets (GCP service accounts, etc.)
+secrets/
\ No newline at end of file
diff --git a/.vscode/settings.json b/.vscode/settings.json
new file mode 100644
index 0000000..0da1d06
--- /dev/null
+++ b/.vscode/settings.json
@@ -0,0 +1,9 @@
+{
+    "python.testing.pytestEnabled": true,
+    "python.testing.unittestEnabled": false,
+    "python.testing.cwd": "${workspaceFolder}/a4d-python",
+    "python.testing.pytestArgs": [
+        "${workspaceFolder}/a4d-python/tests"
+    ],
+    "python.defaultInterpreterPath": "${workspaceFolder}/a4d-python/.venv/bin/python"
+}
\ No newline at end of file
diff --git a/CLAUDE.md b/CLAUDE.md
new file mode 100644
index 0000000..df025ae
--- /dev/null
+++ b/CLAUDE.md
@@ -0,0 +1,61 @@
+# CLAUDE.md
+
+This repository contains **two projects**:
+
+## 1. R Pipeline (Production - Legacy)
+
+**Location**: Root directory
+**Status**: Production (being phased out)
+
+The original R implementation of the A4D medical tracker data processing pipeline.
+
+**Key Files**:
+- `R/` - R package code
+- `scripts/R/` - Pipeline scripts
+- `reference_data/` - Shared YAML configurations
+
+**Commands**: See README.md for R-specific commands
+
+---
+
+## 2. Python Pipeline (Active Development)
+
+**Location**: `a4d-python/`
+**Status**: Active migration
+**Branch**: `migration`
+
+New Python implementation with better performance and incremental processing.
+
+**Documentation**: [a4d-python/docs/CLAUDE.md](a4d-python/docs/CLAUDE.md)
+
+**Quick Start**:
+```bash
+cd a4d-python
+uv sync
+uv run pytest
+```
+
+**Migration Guide**: [a4d-python/docs/migration/MIGRATION_GUIDE.md](a4d-python/docs/migration/MIGRATION_GUIDE.md)
+
+---
+
+## Working on This Repository
+
+**If working on R code**: Stay in root, use R commands
+
+**If working on Python migration**:
+```bash
+cd a4d-python
+# See a4d-python/docs/CLAUDE.md for Python-specific guidance
+```
+
+## Shared Resources
+
+Both projects use the same reference data:
+- `reference_data/synonyms/` - Column name mappings
+- `reference_data/data_cleaning.yaml` - Validation rules
+- `reference_data/provinces/` - Allowed provinces
+
+**Do not modify these** without testing both R and Python pipelines.
+- Always check your implementation against the original R pipeline and check if the logic is the same
+- Limit comments to explain why a desigin was made or give important context information for the migration but do not use comments for obvious code otherwise
\ No newline at end of file
diff --git a/R/script2_helper_patient_data_fix.R b/R/script2_helper_patient_data_fix.R
index 278ab1c..d18ef7f 100644
--- a/R/script2_helper_patient_data_fix.R
+++ b/R/script2_helper_patient_data_fix.R
@@ -176,6 +176,15 @@ parse_dates <- function(date) {
         return(lubridate::NA_Date_)
     }
 
+    # Handle Excel serial numbers (e.g., "45341.0", "39920.0")
+    # Excel stores dates as days since 1899-12-30
+    numeric_date <- suppressWarnings(as.numeric(date))
+    if (!is.na(numeric_date) && numeric_date > 1 && numeric_date < 100000) {
+        # This is likely an Excel serial number
+        excel_origin <- as.Date("1899-12-30")
+        return(excel_origin + as.integer(numeric_date))
+    }
+
     parsed_date <- suppressWarnings(lubridate::as_date(date))
 
     if (is.na(parsed_date)) {
diff --git a/reference_data/synonyms/synonyms_patient.yaml b/reference_data/synonyms/synonyms_patient.yaml
index 3844198..cdb3527 100644
--- a/reference_data/synonyms/synonyms_patient.yaml
+++ b/reference_data/synonyms/synonyms_patient.yaml
@@ -74,6 +74,7 @@ complication_screening_kidney_test_date:
 - Kidney Function Test Date (dd-mmm-yyyy)
 complication_screening_kidney_test_value:
 - Kidney Function Test UACR (mg/mmol)
+- Kidney Function Test UACR (mg/g)
 complication_screening_lipid_profile_cholesterol_value:
 - Lipid Profile Cholesterol
 complication_screening_lipid_profile_date:
diff --git a/reference_data/validation_rules.yaml b/reference_data/validation_rules.yaml
new file mode 100644
index 0000000..5fbb423
--- /dev/null
+++ b/reference_data/validation_rules.yaml
@@ -0,0 +1,138 @@
+# Python Pipeline Validation Rules
+#
+# This file defines allowed values for data validation in the Python pipeline.
+# It is separate from data_cleaning.yaml (used by R pipeline) to allow
+# independent evolution of the two pipelines.
+#
+# Structure:
+#   column_name:
+#     allowed_values: [list of valid values]
+#     replace_invalid: true/false (whether to replace with error value)
+#
+# Note: Data transformations are hardcoded in src/a4d/clean/transformers.py,
+# not defined in YAML.
+
+analog_insulin_long_acting:
+  allowed_values: ["N", "Y"]
+  replace_invalid: true
+
+analog_insulin_rapid_acting:
+  allowed_values: ["N", "Y"]
+  replace_invalid: true
+
+clinic_visit:
+  allowed_values: ["N", "Y"]
+  replace_invalid: true
+
+complication_screening_eye_exam_value:
+  allowed_values: ["Normal", "Abnormal"]
+  replace_invalid: true
+
+complication_screening_foot_exam_value:
+  allowed_values: ["Normal", "Abnormal"]
+  replace_invalid: true
+
+dm_complication_eye:
+  allowed_values: ["N", "Y"]
+  replace_invalid: true
+
+dm_complication_kidney:
+  allowed_values: ["N", "Y"]
+  replace_invalid: true
+
+dm_complication_others:
+  allowed_values: ["N", "Y"]
+  replace_invalid: true
+
+hospitalisation_cause:
+  allowed_values: ["DKA", "HYPO", "HYPER", "OTHER"]
+  replace_invalid: true
+
+human_insulin_intermediate_acting:
+  allowed_values: ["N", "Y"]
+  replace_invalid: true
+
+human_insulin_pre_mixed:
+  allowed_values: ["N", "Y"]
+  replace_invalid: true
+
+human_insulin_short_acting:
+  allowed_values: ["N", "Y"]
+  replace_invalid: true
+
+insulin_regimen:
+  # Note: Values are transformed by extract_regimen() in transformers.py first
+  allowed_values:
+    - "Basal-bolus (MDI)"
+    - "Premixed 30/70 BD"
+    - "Self-mixed BD"
+    - "Modified conventional TID"
+  replace_invalid: false  # Don't replace - these are post-transformation values
+
+insulin_type:
+  allowed_values: ["Human Insulin", "Analog Insulin"]
+  replace_invalid: true
+
+insulin_subtype:
+  # Note: R derives "rapic-acting" (typo) but validates against "Rapid-acting" (correct)
+  # This causes ALL derived values to become "Undefined" because:
+  # 1. Single values like "rapic-acting" don't match "Rapid-acting"
+  # 2. Comma-separated values like "rapic-acting,long-acting" don't match any single allowed value
+  allowed_values:
+    - "Pre-mixed"
+    - "Short-acting"
+    - "Intermediate-acting"
+    - "Rapid-acting"  # R expects this, but derives "rapic-acting" (typo)
+    - "Long-acting"
+  replace_invalid: true
+
+observations_category:
+  allowed_values:
+    - "Status IN"
+    - "Status OUT"
+    - "Clinic Follow Up"
+    - "Hospitalisation"
+    - "Support"
+    - "DM Complication"
+    - "Insulin Regimen"
+    - "Other"
+  replace_invalid: false
+
+patient_consent:
+  allowed_values: ["N", "Y"]
+  replace_invalid: true
+
+remote_followup:
+  allowed_values: ["N", "Y"]
+  replace_invalid: true
+
+status:
+  # Canonical values in Title Case. Validation is case-insensitive.
+  # If matched, returns the canonical value (e.g., "active" → "Active")
+  allowed_values:
+    - "Active"
+    - "Active - Remote"
+    - "Active Remote"
+    - "Active Monitoring"
+    - "Query"
+    - "Inactive"
+    - "Transferred"
+    - "Lost Follow Up"
+    - "Deceased"
+    - "Discontinued"
+  replace_invalid: true
+
+support_level:
+  allowed_values:
+    - "Standard"
+    - "Partial"
+    - "Partial - A"
+    - "Partial - B"
+    - "Semi-Partial"
+    - "SAC"
+    - "Monitoring"
+  replace_invalid: true
+
+t1d_diagnosis_with_dka:
+  allowed_values: ["N", "Y"]
+  replace_invalid: true
diff --git a/test_full_pipeline_debug.R b/test_full_pipeline_debug.R
new file mode 100644
index 0000000..1f4c7a6
--- /dev/null
+++ b/test_full_pipeline_debug.R
@@ -0,0 +1,181 @@
+#!/usr/bin/env Rscript
+
+# Debug the full pipeline to find where it fails
+library(arrow)
+library(dplyr)
+library(tidyselect)
+
+# Load the package
+devtools::load_all(".")
+
+# Setup error values
+ERROR_VAL_NUMERIC <<- 999999
+ERROR_VAL_CHARACTER <<- "Undefined"
+ERROR_VAL_DATE <<- "9999-09-09"
+
+# Read the raw parquet
+df_raw <- read_parquet("/Volumes/USB SanDisk 3.2Gen1 Media/a4d/a4dphase2_upload/output/patient_data_raw/2024_Sibu Hospital A4D Tracker_patient_raw.parquet")
+
+cat("Step 1: Load schema and merge\n")
+schema <- tibble::tibble(
+    age = integer(),
+    analog_insulin_long_acting = character(),
+    analog_insulin_rapid_acting = character(),
+    blood_pressure_dias_mmhg = integer(),
+    blood_pressure_sys_mmhg = integer(),
+    blood_pressure_updated = lubridate::as_date(1),
+    bmi = numeric(),
+    bmi_date = lubridate::as_date(1),
+    clinic_id = character(),
+    clinic_visit = character(),
+    complication_screening_eye_exam_date = lubridate::as_date(1),
+    complication_screening_eye_exam_value = character(),
+    complication_screening_foot_exam_date = lubridate::as_date(1),
+    complication_screening_foot_exam_value = character(),
+    complication_screening_kidney_test_date = lubridate::as_date(1),
+    complication_screening_kidney_test_value = character(),
+    complication_screening_lipid_profile_cholesterol_value = character(),
+    complication_screening_lipid_profile_date = lubridate::as_date(1),
+    complication_screening_lipid_profile_hdl_mmol_value = numeric(),
+    complication_screening_lipid_profile_hdl_mg_value = numeric(),
+    complication_screening_lipid_profile_ldl_mmol_value = numeric(),
+    complication_screening_lipid_profile_ldl_mg_value = numeric(),
+    complication_screening_lipid_profile_triglycerides_value = numeric(),
+    complication_screening_remarks = character(),
+    complication_screening_thyroid_test_date = lubridate::as_date(1),
+    complication_screening_thyroid_test_ft4_pmol_value = numeric(),
+    complication_screening_thyroid_test_ft4_ng_value = numeric(),
+    complication_screening_thyroid_test_tsh_value = numeric(),
+    dm_complication_eye = character(),
+    dm_complication_kidney = character(),
+    dm_complication_others = character(),
+    dm_complication_remarks = character(),
+    dob = lubridate::as_date(1),
+    edu_occ = character(),
+    edu_occ_updated = lubridate::as_date(1),
+    family_history = character(),
+    fbg_baseline_mg = numeric(),
+    fbg_baseline_mmol = numeric(),
+    fbg_updated_date = lubridate::as_date(1),
+    fbg_updated_mg = numeric(),
+    fbg_updated_mmol = numeric(),
+    file_name = character(),
+    hba1c_baseline = numeric(),
+    hba1c_baseline_exceeds = logical(),
+    hba1c_updated = numeric(),
+    hba1c_updated_exceeds = logical(),
+    hba1c_updated_date = lubridate::as_date(1),
+    height = numeric(),
+    hospitalisation_cause = character(),
+    hospitalisation_date = lubridate::as_date(1),
+    human_insulin_intermediate_acting = character(),
+    human_insulin_pre_mixed = character(),
+    human_insulin_short_acting = character(),
+    insulin_injections = numeric(),
+    insulin_regimen = character(),
+    insulin_total_units = numeric(),
+    insulin_type = character(),
+    insulin_subtype = character(),
+    last_clinic_visit_date = lubridate::as_date(1),
+    last_remote_followup_date = lubridate::as_date(1),
+    lost_date = lubridate::as_date(1),
+    name = character(),
+    observations = character(),
+    observations_category = character(),
+    other_issues = character(),
+    patient_consent = character(),
+    patient_id = character(),
+    province = character(),
+    recruitment_date = lubridate::as_date(1),
+    remote_followup = character(),
+    sex = character(),
+    sheet_name = character(),
+    status = character(),
+    status_out = character(),
+    support_level = character(),
+    t1d_diagnosis_age = integer(),
+    t1d_diagnosis_date = lubridate::as_date(1),
+    t1d_diagnosis_with_dka = character(),
+    testing_frequency = integer(),
+    tracker_date = lubridate::as_date(1),
+    tracker_month = integer(),
+    tracker_year = integer(),
+    weight = numeric()
+)
+
+# Add missing columns
+df_patient <- merge.default(df_raw, schema, all.x = TRUE)
+df_patient <- df_patient[colnames(schema)]
+cat(sprintf("  Shape: %d rows, %d cols\n", nrow(df_patient), ncol(df_patient)))
+
+cat("\nStep 2: Pre-processing (fix known problems)\n")
+df_step2 <- df_patient %>%
+    rowwise() %>%
+    mutate(
+        hba1c_baseline = stringr::str_replace(hba1c_baseline, "<|>", ""),
+        hba1c_updated = stringr::str_replace(hba1c_updated, "<|>", ""),
+        fbg_updated_mg = fix_fbg(fbg_updated_mg),
+        fbg_updated_mmol = fix_fbg(fbg_updated_mmol),
+        testing_frequency = fix_testing_frequency(testing_frequency, patient_id),
+        analog_insulin_long_acting = sub("-", "N", analog_insulin_long_acting, fixed = TRUE),
+        analog_insulin_rapid_acting = sub("-", "N", analog_insulin_rapid_acting, fixed = TRUE),
+        human_insulin_intermediate_acting = sub("-", "N", human_insulin_intermediate_acting, fixed = TRUE),
+        human_insulin_pre_mixed = sub("-", "N", human_insulin_pre_mixed, fixed = TRUE),
+        human_insulin_short_acting = sub("-", "N", human_insulin_short_acting, fixed = TRUE)
+    )
+cat("  ✅ Step 2 complete\n")
+
+cat("\nStep 3: Type conversions\n")
+cat("  Converting numeric columns...\n")
+df_step3 <- df_step2 %>%
+    mutate(
+        across(
+            schema %>% select(where(is.numeric)) %>% names(),
+            \(x) convert_to(correct_decimal_sign(x), as.numeric, ERROR_VAL_NUMERIC, cur_column(), id = patient_id)
+        )
+    )
+cat("  ✅ Numeric conversion complete\n")
+
+cat("  Converting logical columns...\n")
+df_step3 <- df_step3 %>%
+    mutate(
+        across(
+            schema %>% select(where(is.logical)) %>% names(),
+            \(x) convert_to(x, as.logical, FALSE, cur_column(), id = patient_id)
+        )
+    )
+cat("  ✅ Logical conversion complete\n")
+
+cat("  Converting date columns...\n")
+df_step3 <- df_step3 %>%
+    mutate(
+        across(
+            schema %>% select(where(lubridate::is.Date)) %>% names(),
+            \(x) convert_to(fix_digit_date(x), parse_dates, as.Date(ERROR_VAL_DATE), cur_column(), id = patient_id)
+        )
+    )
+cat("  ✅ Date conversion complete\n")
+
+cat("  Converting integer columns...\n")
+df_step3 <- df_step3 %>%
+    mutate(
+        across(
+            schema %>% select(where(is.integer)) %>% names(),
+            \(x) convert_to(x, function(x) as.integer(round(as.double(x))), ERROR_VAL_NUMERIC, cur_column(), id = patient_id)
+        )
+    )
+cat("  ✅ Integer conversion complete\n")
+
+cat("\nStep 4: Post-processing transformations\n")
+cat("  Attempting height transformation...\n")
+df_step4 <- df_step3 %>%
+    mutate(
+        height = transform_cm_to_m(height) %>%
+            cut_numeric_value(min = 0, max = 2.3, col_name = "height")
+    )
+cat("  ✅ Height transformation complete\n")
+
+cat("\nSample heights after transformation:\n")
+print(df_step4$height[1:5])
+
+cat("\n✅ Full pipeline test successful!\n")

From e6241f891b77b27c4945f887e65c24d338bf102c Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Wed, 25 Feb 2026 00:25:12 +0000
Subject: [PATCH 5/6] Upgrade Python from 3.11 to 3.13 in Dockerfile and CI
 workflow

Co-authored-by: pmayd <9614291+pmayd@users.noreply.github.com>
---
 .github/workflows/python-ci.yml | 2 +-
 a4d-python/Dockerfile           | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/.github/workflows/python-ci.yml b/.github/workflows/python-ci.yml
index 3048080..51f7652 100644
--- a/.github/workflows/python-ci.yml
+++ b/.github/workflows/python-ci.yml
@@ -28,7 +28,7 @@ jobs:
         enable-cache: true
 
     - name: Set up Python
-      run: uv python install 3.11
+      run: uv python install 3.13
 
     - name: Install dependencies
       run: uv sync --all-extras
diff --git a/a4d-python/Dockerfile b/a4d-python/Dockerfile
index f13820b..739b1c7 100644
--- a/a4d-python/Dockerfile
+++ b/a4d-python/Dockerfile
@@ -1,4 +1,4 @@
-FROM python:3.11-slim
+FROM python:3.13-slim
 
 # Install system dependencies
 RUN apt-get update && apt-get install -y --no-install-recommends \

From ac1181fc2215583e2a823f944368e1a62ee3b2c1 Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Wed, 25 Feb 2026 00:29:52 +0000
Subject: [PATCH 6/6] Remove unused duckdb dependency and upgrade to Python
 3.14

Co-authored-by: pmayd <9614291+pmayd@users.noreply.github.com>
---
 .github/workflows/python-ci.yml |   2 +-
 a4d-python/Dockerfile           |   2 +-
 a4d-python/pyproject.toml       |   5 +-
 a4d-python/uv.lock              | 334 +-------------------------------
 4 files changed, 6 insertions(+), 337 deletions(-)

diff --git a/.github/workflows/python-ci.yml b/.github/workflows/python-ci.yml
index 51f7652..fe1b1d7 100644
--- a/.github/workflows/python-ci.yml
+++ b/.github/workflows/python-ci.yml
@@ -28,7 +28,7 @@ jobs:
         enable-cache: true
 
     - name: Set up Python
-      run: uv python install 3.13
+      run: uv python install 3.14
 
     - name: Install dependencies
       run: uv sync --all-extras
diff --git a/a4d-python/Dockerfile b/a4d-python/Dockerfile
index 739b1c7..de143cc 100644
--- a/a4d-python/Dockerfile
+++ b/a4d-python/Dockerfile
@@ -1,4 +1,4 @@
-FROM python:3.13-slim
+FROM python:3.14-slim
 
 # Install system dependencies
 RUN apt-get update && apt-get install -y --no-install-recommends \
diff --git a/a4d-python/pyproject.toml b/a4d-python/pyproject.toml
index d959a09..5bad486 100644
--- a/a4d-python/pyproject.toml
+++ b/a4d-python/pyproject.toml
@@ -3,7 +3,7 @@ name = "a4d"
 version = "2.0.0"
 description = "A4D Medical Tracker Data Processing Pipeline (Python)"
 readme = "README.md"
-requires-python = ">=3.11"
+requires-python = ">=3.14"
 authors = [
     {name = "Michael Aydinbas", email = "michael.aydinbas@gmail.com"}
 ]
@@ -11,7 +11,6 @@ license = {text = "MIT"}
 
 dependencies = [
     "polars>=0.20.0",
-    "duckdb>=0.10.0",
     "pydantic>=2.6.0",
     "pydantic-settings>=2.2.0",
     "pandera[polars]>=0.18.0",
@@ -47,7 +46,7 @@ build-backend = "hatchling.build"
 
 [tool.ruff]
 line-length = 100
-target-version = "py311"
+target-version = "py314"
 lint.select = [
     "E",   # pycodestyle errors
     "W",   # pycodestyle warnings
diff --git a/a4d-python/uv.lock b/a4d-python/uv.lock
index 10cf087..5f5f2ad 100644
--- a/a4d-python/uv.lock
+++ b/a4d-python/uv.lock
@@ -1,18 +1,12 @@
 version = 1
 revision = 3
-requires-python = ">=3.11"
-resolution-markers = [
-    "python_full_version >= '3.14'",
-    "python_full_version == '3.13.*'",
-    "python_full_version < '3.13'",
-]
+requires-python = ">=3.14"
 
 [[package]]
 name = "a4d"
 version = "2.0.0"
 source = { editable = "." }
 dependencies = [
-    { name = "duckdb" },
     { name = "fastexcel" },
     { name = "google-cloud-bigquery" },
     { name = "google-cloud-storage" },
@@ -41,7 +35,6 @@ dev = [
 
 [package.metadata]
 requires-dist = [
-    { name = "duckdb", specifier = ">=0.10.0" },
     { name = "fastexcel", specifier = ">=0.16.0" },
     { name = "google-cloud-bigquery", specifier = ">=3.17.0" },
     { name = "google-cloud-storage", specifier = ">=2.14.0" },
@@ -110,54 +103,6 @@ version = "3.4.4"
 source = { registry = "https://pypi.org/simple" }
 sdist = { url = "https://files.pythonhosted.org/packages/13/69/33ddede1939fdd074bce5434295f38fae7136463422fe4fd3e0e89b98062/charset_normalizer-3.4.4.tar.gz", hash = "sha256:94537985111c35f28720e43603b8e7b43a6ecfb2ce1d3058bbe955b73404e21a", size = 129418, upload-time = "2025-10-14T04:42:32.879Z" }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/ed/27/c6491ff4954e58a10f69ad90aca8a1b6fe9c5d3c6f380907af3c37435b59/charset_normalizer-3.4.4-cp311-cp311-macosx_10_9_universal2.whl", hash = "sha256:6e1fcf0720908f200cd21aa4e6750a48ff6ce4afe7ff5a79a90d5ed8a08296f8", size = 206988, upload-time = "2025-10-14T04:40:33.79Z" },
-    { url = "https://files.pythonhosted.org/packages/94/59/2e87300fe67ab820b5428580a53cad894272dbb97f38a7a814a2a1ac1011/charset_normalizer-3.4.4-cp311-cp311-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:5f819d5fe9234f9f82d75bdfa9aef3a3d72c4d24a6e57aeaebba32a704553aa0", size = 147324, upload-time = "2025-10-14T04:40:34.961Z" },
-    { url = "https://files.pythonhosted.org/packages/07/fb/0cf61dc84b2b088391830f6274cb57c82e4da8bbc2efeac8c025edb88772/charset_normalizer-3.4.4-cp311-cp311-manylinux2014_armv7l.manylinux_2_17_armv7l.manylinux_2_31_armv7l.whl", hash = "sha256:a59cb51917aa591b1c4e6a43c132f0cdc3c76dbad6155df4e28ee626cc77a0a3", size = 142742, upload-time = "2025-10-14T04:40:36.105Z" },
-    { url = "https://files.pythonhosted.org/packages/62/8b/171935adf2312cd745d290ed93cf16cf0dfe320863ab7cbeeae1dcd6535f/charset_normalizer-3.4.4-cp311-cp311-manylinux2014_ppc64le.manylinux_2_17_ppc64le.manylinux_2_28_ppc64le.whl", hash = "sha256:8ef3c867360f88ac904fd3f5e1f902f13307af9052646963ee08ff4f131adafc", size = 160863, upload-time = "2025-10-14T04:40:37.188Z" },
-    { url = "https://files.pythonhosted.org/packages/09/73/ad875b192bda14f2173bfc1bc9a55e009808484a4b256748d931b6948442/charset_normalizer-3.4.4-cp311-cp311-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:d9e45d7faa48ee908174d8fe84854479ef838fc6a705c9315372eacbc2f02897", size = 157837, upload-time = "2025-10-14T04:40:38.435Z" },
-    { url = "https://files.pythonhosted.org/packages/6d/fc/de9cce525b2c5b94b47c70a4b4fb19f871b24995c728e957ee68ab1671ea/charset_normalizer-3.4.4-cp311-cp311-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:840c25fb618a231545cbab0564a799f101b63b9901f2569faecd6b222ac72381", size = 151550, upload-time = "2025-10-14T04:40:40.053Z" },
-    { url = "https://files.pythonhosted.org/packages/55/c2/43edd615fdfba8c6f2dfbd459b25a6b3b551f24ea21981e23fb768503ce1/charset_normalizer-3.4.4-cp311-cp311-manylinux_2_31_riscv64.manylinux_2_39_riscv64.whl", hash = "sha256:ca5862d5b3928c4940729dacc329aa9102900382fea192fc5e52eb69d6093815", size = 149162, upload-time = "2025-10-14T04:40:41.163Z" },
-    { url = "https://files.pythonhosted.org/packages/03/86/bde4ad8b4d0e9429a4e82c1e8f5c659993a9a863ad62c7df05cf7b678d75/charset_normalizer-3.4.4-cp311-cp311-musllinux_1_2_aarch64.whl", hash = "sha256:d9c7f57c3d666a53421049053eaacdd14bbd0a528e2186fcb2e672effd053bb0", size = 150019, upload-time = "2025-10-14T04:40:42.276Z" },
-    { url = "https://files.pythonhosted.org/packages/1f/86/a151eb2af293a7e7bac3a739b81072585ce36ccfb4493039f49f1d3cae8c/charset_normalizer-3.4.4-cp311-cp311-musllinux_1_2_armv7l.whl", hash = "sha256:277e970e750505ed74c832b4bf75dac7476262ee2a013f5574dd49075879e161", size = 143310, upload-time = "2025-10-14T04:40:43.439Z" },
-    { url = "https://files.pythonhosted.org/packages/b5/fe/43dae6144a7e07b87478fdfc4dbe9efd5defb0e7ec29f5f58a55aeef7bf7/charset_normalizer-3.4.4-cp311-cp311-musllinux_1_2_ppc64le.whl", hash = "sha256:31fd66405eaf47bb62e8cd575dc621c56c668f27d46a61d975a249930dd5e2a4", size = 162022, upload-time = "2025-10-14T04:40:44.547Z" },
-    { url = "https://files.pythonhosted.org/packages/80/e6/7aab83774f5d2bca81f42ac58d04caf44f0cc2b65fc6db2b3b2e8a05f3b3/charset_normalizer-3.4.4-cp311-cp311-musllinux_1_2_riscv64.whl", hash = "sha256:0d3d8f15c07f86e9ff82319b3d9ef6f4bf907608f53fe9d92b28ea9ae3d1fd89", size = 149383, upload-time = "2025-10-14T04:40:46.018Z" },
-    { url = "https://files.pythonhosted.org/packages/4f/e8/b289173b4edae05c0dde07f69f8db476a0b511eac556dfe0d6bda3c43384/charset_normalizer-3.4.4-cp311-cp311-musllinux_1_2_s390x.whl", hash = "sha256:9f7fcd74d410a36883701fafa2482a6af2ff5ba96b9a620e9e0721e28ead5569", size = 159098, upload-time = "2025-10-14T04:40:47.081Z" },
-    { url = "https://files.pythonhosted.org/packages/d8/df/fe699727754cae3f8478493c7f45f777b17c3ef0600e28abfec8619eb49c/charset_normalizer-3.4.4-cp311-cp311-musllinux_1_2_x86_64.whl", hash = "sha256:ebf3e58c7ec8a8bed6d66a75d7fb37b55e5015b03ceae72a8e7c74495551e224", size = 152991, upload-time = "2025-10-14T04:40:48.246Z" },
-    { url = "https://files.pythonhosted.org/packages/1a/86/584869fe4ddb6ffa3bd9f491b87a01568797fb9bd8933f557dba9771beaf/charset_normalizer-3.4.4-cp311-cp311-win32.whl", hash = "sha256:eecbc200c7fd5ddb9a7f16c7decb07b566c29fa2161a16cf67b8d068bd21690a", size = 99456, upload-time = "2025-10-14T04:40:49.376Z" },
-    { url = "https://files.pythonhosted.org/packages/65/f6/62fdd5feb60530f50f7e38b4f6a1d5203f4d16ff4f9f0952962c044e919a/charset_normalizer-3.4.4-cp311-cp311-win_amd64.whl", hash = "sha256:5ae497466c7901d54b639cf42d5b8c1b6a4fead55215500d2f486d34db48d016", size = 106978, upload-time = "2025-10-14T04:40:50.844Z" },
-    { url = "https://files.pythonhosted.org/packages/7a/9d/0710916e6c82948b3be62d9d398cb4fcf4e97b56d6a6aeccd66c4b2f2bd5/charset_normalizer-3.4.4-cp311-cp311-win_arm64.whl", hash = "sha256:65e2befcd84bc6f37095f5961e68a6f077bf44946771354a28ad434c2cce0ae1", size = 99969, upload-time = "2025-10-14T04:40:52.272Z" },
-    { url = "https://files.pythonhosted.org/packages/f3/85/1637cd4af66fa687396e757dec650f28025f2a2f5a5531a3208dc0ec43f2/charset_normalizer-3.4.4-cp312-cp312-macosx_10_13_universal2.whl", hash = "sha256:0a98e6759f854bd25a58a73fa88833fba3b7c491169f86ce1180c948ab3fd394", size = 208425, upload-time = "2025-10-14T04:40:53.353Z" },
-    { url = "https://files.pythonhosted.org/packages/9d/6a/04130023fef2a0d9c62d0bae2649b69f7b7d8d24ea5536feef50551029df/charset_normalizer-3.4.4-cp312-cp312-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:b5b290ccc2a263e8d185130284f8501e3e36c5e02750fc6b6bdeb2e9e96f1e25", size = 148162, upload-time = "2025-10-14T04:40:54.558Z" },
-    { url = "https://files.pythonhosted.org/packages/78/29/62328d79aa60da22c9e0b9a66539feae06ca0f5a4171ac4f7dc285b83688/charset_normalizer-3.4.4-cp312-cp312-manylinux2014_armv7l.manylinux_2_17_armv7l.manylinux_2_31_armv7l.whl", hash = "sha256:74bb723680f9f7a6234dcf67aea57e708ec1fbdf5699fb91dfd6f511b0a320ef", size = 144558, upload-time = "2025-10-14T04:40:55.677Z" },
-    { url = "https://files.pythonhosted.org/packages/86/bb/b32194a4bf15b88403537c2e120b817c61cd4ecffa9b6876e941c3ee38fe/charset_normalizer-3.4.4-cp312-cp312-manylinux2014_ppc64le.manylinux_2_17_ppc64le.manylinux_2_28_ppc64le.whl", hash = "sha256:f1e34719c6ed0b92f418c7c780480b26b5d9c50349e9a9af7d76bf757530350d", size = 161497, upload-time = "2025-10-14T04:40:57.217Z" },
-    { url = "https://files.pythonhosted.org/packages/19/89/a54c82b253d5b9b111dc74aca196ba5ccfcca8242d0fb64146d4d3183ff1/charset_normalizer-3.4.4-cp312-cp312-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:2437418e20515acec67d86e12bf70056a33abdacb5cb1655042f6538d6b085a8", size = 159240, upload-time = "2025-10-14T04:40:58.358Z" },
-    { url = "https://files.pythonhosted.org/packages/c0/10/d20b513afe03acc89ec33948320a5544d31f21b05368436d580dec4e234d/charset_normalizer-3.4.4-cp312-cp312-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:11d694519d7f29d6cd09f6ac70028dba10f92f6cdd059096db198c283794ac86", size = 153471, upload-time = "2025-10-14T04:40:59.468Z" },
-    { url = "https://files.pythonhosted.org/packages/61/fa/fbf177b55bdd727010f9c0a3c49eefa1d10f960e5f09d1d887bf93c2e698/charset_normalizer-3.4.4-cp312-cp312-manylinux_2_31_riscv64.manylinux_2_39_riscv64.whl", hash = "sha256:ac1c4a689edcc530fc9d9aa11f5774b9e2f33f9a0c6a57864e90908f5208d30a", size = 150864, upload-time = "2025-10-14T04:41:00.623Z" },
-    { url = "https://files.pythonhosted.org/packages/05/12/9fbc6a4d39c0198adeebbde20b619790e9236557ca59fc40e0e3cebe6f40/charset_normalizer-3.4.4-cp312-cp312-musllinux_1_2_aarch64.whl", hash = "sha256:21d142cc6c0ec30d2efee5068ca36c128a30b0f2c53c1c07bd78cb6bc1d3be5f", size = 150647, upload-time = "2025-10-14T04:41:01.754Z" },
-    { url = "https://files.pythonhosted.org/packages/ad/1f/6a9a593d52e3e8c5d2b167daf8c6b968808efb57ef4c210acb907c365bc4/charset_normalizer-3.4.4-cp312-cp312-musllinux_1_2_armv7l.whl", hash = "sha256:5dbe56a36425d26d6cfb40ce79c314a2e4dd6211d51d6d2191c00bed34f354cc", size = 145110, upload-time = "2025-10-14T04:41:03.231Z" },
-    { url = "https://files.pythonhosted.org/packages/30/42/9a52c609e72471b0fc54386dc63c3781a387bb4fe61c20231a4ebcd58bdd/charset_normalizer-3.4.4-cp312-cp312-musllinux_1_2_ppc64le.whl", hash = "sha256:5bfbb1b9acf3334612667b61bd3002196fe2a1eb4dd74d247e0f2a4d50ec9bbf", size = 162839, upload-time = "2025-10-14T04:41:04.715Z" },
-    { url = "https://files.pythonhosted.org/packages/c4/5b/c0682bbf9f11597073052628ddd38344a3d673fda35a36773f7d19344b23/charset_normalizer-3.4.4-cp312-cp312-musllinux_1_2_riscv64.whl", hash = "sha256:d055ec1e26e441f6187acf818b73564e6e6282709e9bcb5b63f5b23068356a15", size = 150667, upload-time = "2025-10-14T04:41:05.827Z" },
-    { url = "https://files.pythonhosted.org/packages/e4/24/a41afeab6f990cf2daf6cb8c67419b63b48cf518e4f56022230840c9bfb2/charset_normalizer-3.4.4-cp312-cp312-musllinux_1_2_s390x.whl", hash = "sha256:af2d8c67d8e573d6de5bc30cdb27e9b95e49115cd9baad5ddbd1a6207aaa82a9", size = 160535, upload-time = "2025-10-14T04:41:06.938Z" },
-    { url = "https://files.pythonhosted.org/packages/2a/e5/6a4ce77ed243c4a50a1fecca6aaaab419628c818a49434be428fe24c9957/charset_normalizer-3.4.4-cp312-cp312-musllinux_1_2_x86_64.whl", hash = "sha256:780236ac706e66881f3b7f2f32dfe90507a09e67d1d454c762cf642e6e1586e0", size = 154816, upload-time = "2025-10-14T04:41:08.101Z" },
-    { url = "https://files.pythonhosted.org/packages/a8/ef/89297262b8092b312d29cdb2517cb1237e51db8ecef2e9af5edbe7b683b1/charset_normalizer-3.4.4-cp312-cp312-win32.whl", hash = "sha256:5833d2c39d8896e4e19b689ffc198f08ea58116bee26dea51e362ecc7cd3ed26", size = 99694, upload-time = "2025-10-14T04:41:09.23Z" },
-    { url = "https://files.pythonhosted.org/packages/3d/2d/1e5ed9dd3b3803994c155cd9aacb60c82c331bad84daf75bcb9c91b3295e/charset_normalizer-3.4.4-cp312-cp312-win_amd64.whl", hash = "sha256:a79cfe37875f822425b89a82333404539ae63dbdddf97f84dcbc3d339aae9525", size = 107131, upload-time = "2025-10-14T04:41:10.467Z" },
-    { url = "https://files.pythonhosted.org/packages/d0/d9/0ed4c7098a861482a7b6a95603edce4c0d9db2311af23da1fb2b75ec26fc/charset_normalizer-3.4.4-cp312-cp312-win_arm64.whl", hash = "sha256:376bec83a63b8021bb5c8ea75e21c4ccb86e7e45ca4eb81146091b56599b80c3", size = 100390, upload-time = "2025-10-14T04:41:11.915Z" },
-    { url = "https://files.pythonhosted.org/packages/97/45/4b3a1239bbacd321068ea6e7ac28875b03ab8bc0aa0966452db17cd36714/charset_normalizer-3.4.4-cp313-cp313-macosx_10_13_universal2.whl", hash = "sha256:e1f185f86a6f3403aa2420e815904c67b2f9ebc443f045edd0de921108345794", size = 208091, upload-time = "2025-10-14T04:41:13.346Z" },
-    { url = "https://files.pythonhosted.org/packages/7d/62/73a6d7450829655a35bb88a88fca7d736f9882a27eacdca2c6d505b57e2e/charset_normalizer-3.4.4-cp313-cp313-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:6b39f987ae8ccdf0d2642338faf2abb1862340facc796048b604ef14919e55ed", size = 147936, upload-time = "2025-10-14T04:41:14.461Z" },
-    { url = "https://files.pythonhosted.org/packages/89/c5/adb8c8b3d6625bef6d88b251bbb0d95f8205831b987631ab0c8bb5d937c2/charset_normalizer-3.4.4-cp313-cp313-manylinux2014_armv7l.manylinux_2_17_armv7l.manylinux_2_31_armv7l.whl", hash = "sha256:3162d5d8ce1bb98dd51af660f2121c55d0fa541b46dff7bb9b9f86ea1d87de72", size = 144180, upload-time = "2025-10-14T04:41:15.588Z" },
-    { url = "https://files.pythonhosted.org/packages/91/ed/9706e4070682d1cc219050b6048bfd293ccf67b3d4f5a4f39207453d4b99/charset_normalizer-3.4.4-cp313-cp313-manylinux2014_ppc64le.manylinux_2_17_ppc64le.manylinux_2_28_ppc64le.whl", hash = "sha256:81d5eb2a312700f4ecaa977a8235b634ce853200e828fbadf3a9c50bab278328", size = 161346, upload-time = "2025-10-14T04:41:16.738Z" },
-    { url = "https://files.pythonhosted.org/packages/d5/0d/031f0d95e4972901a2f6f09ef055751805ff541511dc1252ba3ca1f80cf5/charset_normalizer-3.4.4-cp313-cp313-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:5bd2293095d766545ec1a8f612559f6b40abc0eb18bb2f5d1171872d34036ede", size = 158874, upload-time = "2025-10-14T04:41:17.923Z" },
-    { url = "https://files.pythonhosted.org/packages/f5/83/6ab5883f57c9c801ce5e5677242328aa45592be8a00644310a008d04f922/charset_normalizer-3.4.4-cp313-cp313-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:a8a8b89589086a25749f471e6a900d3f662d1d3b6e2e59dcecf787b1cc3a1894", size = 153076, upload-time = "2025-10-14T04:41:19.106Z" },
-    { url = "https://files.pythonhosted.org/packages/75/1e/5ff781ddf5260e387d6419959ee89ef13878229732732ee73cdae01800f2/charset_normalizer-3.4.4-cp313-cp313-manylinux_2_31_riscv64.manylinux_2_39_riscv64.whl", hash = "sha256:bc7637e2f80d8530ee4a78e878bce464f70087ce73cf7c1caf142416923b98f1", size = 150601, upload-time = "2025-10-14T04:41:20.245Z" },
-    { url = "https://files.pythonhosted.org/packages/d7/57/71be810965493d3510a6ca79b90c19e48696fb1ff964da319334b12677f0/charset_normalizer-3.4.4-cp313-cp313-musllinux_1_2_aarch64.whl", hash = "sha256:f8bf04158c6b607d747e93949aa60618b61312fe647a6369f88ce2ff16043490", size = 150376, upload-time = "2025-10-14T04:41:21.398Z" },
-    { url = "https://files.pythonhosted.org/packages/e5/d5/c3d057a78c181d007014feb7e9f2e65905a6c4ef182c0ddf0de2924edd65/charset_normalizer-3.4.4-cp313-cp313-musllinux_1_2_armv7l.whl", hash = "sha256:554af85e960429cf30784dd47447d5125aaa3b99a6f0683589dbd27e2f45da44", size = 144825, upload-time = "2025-10-14T04:41:22.583Z" },
-    { url = "https://files.pythonhosted.org/packages/e6/8c/d0406294828d4976f275ffbe66f00266c4b3136b7506941d87c00cab5272/charset_normalizer-3.4.4-cp313-cp313-musllinux_1_2_ppc64le.whl", hash = "sha256:74018750915ee7ad843a774364e13a3db91682f26142baddf775342c3f5b1133", size = 162583, upload-time = "2025-10-14T04:41:23.754Z" },
-    { url = "https://files.pythonhosted.org/packages/d7/24/e2aa1f18c8f15c4c0e932d9287b8609dd30ad56dbe41d926bd846e22fb8d/charset_normalizer-3.4.4-cp313-cp313-musllinux_1_2_riscv64.whl", hash = "sha256:c0463276121fdee9c49b98908b3a89c39be45d86d1dbaa22957e38f6321d4ce3", size = 150366, upload-time = "2025-10-14T04:41:25.27Z" },
-    { url = "https://files.pythonhosted.org/packages/e4/5b/1e6160c7739aad1e2df054300cc618b06bf784a7a164b0f238360721ab86/charset_normalizer-3.4.4-cp313-cp313-musllinux_1_2_s390x.whl", hash = "sha256:362d61fd13843997c1c446760ef36f240cf81d3ebf74ac62652aebaf7838561e", size = 160300, upload-time = "2025-10-14T04:41:26.725Z" },
-    { url = "https://files.pythonhosted.org/packages/7a/10/f882167cd207fbdd743e55534d5d9620e095089d176d55cb22d5322f2afd/charset_normalizer-3.4.4-cp313-cp313-musllinux_1_2_x86_64.whl", hash = "sha256:9a26f18905b8dd5d685d6d07b0cdf98a79f3c7a918906af7cc143ea2e164c8bc", size = 154465, upload-time = "2025-10-14T04:41:28.322Z" },
-    { url = "https://files.pythonhosted.org/packages/89/66/c7a9e1b7429be72123441bfdbaf2bc13faab3f90b933f664db506dea5915/charset_normalizer-3.4.4-cp313-cp313-win32.whl", hash = "sha256:9b35f4c90079ff2e2edc5b26c0c77925e5d2d255c42c74fdb70fb49b172726ac", size = 99404, upload-time = "2025-10-14T04:41:29.95Z" },
-    { url = "https://files.pythonhosted.org/packages/c4/26/b9924fa27db384bdcd97ab83b4f0a8058d96ad9626ead570674d5e737d90/charset_normalizer-3.4.4-cp313-cp313-win_amd64.whl", hash = "sha256:b435cba5f4f750aa6c0a0d92c541fb79f69a387c91e61f1795227e4ed9cece14", size = 107092, upload-time = "2025-10-14T04:41:31.188Z" },
-    { url = "https://files.pythonhosted.org/packages/af/8f/3ed4bfa0c0c72a7ca17f0380cd9e4dd842b09f664e780c13cff1dcf2ef1b/charset_normalizer-3.4.4-cp313-cp313-win_arm64.whl", hash = "sha256:542d2cee80be6f80247095cc36c418f7bddd14f4a6de45af91dfad36d817bba2", size = 100408, upload-time = "2025-10-14T04:41:32.624Z" },
     { url = "https://files.pythonhosted.org/packages/2a/35/7051599bd493e62411d6ede36fd5af83a38f37c4767b92884df7301db25d/charset_normalizer-3.4.4-cp314-cp314-macosx_10_13_universal2.whl", hash = "sha256:da3326d9e65ef63a817ecbcc0df6e94463713b754fe293eaa03da99befb9a5bd", size = 207746, upload-time = "2025-10-14T04:41:33.773Z" },
     { url = "https://files.pythonhosted.org/packages/10/9a/97c8d48ef10d6cd4fcead2415523221624bf58bcf68a802721a6bc807c8f/charset_normalizer-3.4.4-cp314-cp314-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:8af65f14dc14a79b924524b1e7fffe304517b2bff5a58bf64f30b98bbc5079eb", size = 147889, upload-time = "2025-10-14T04:41:34.897Z" },
     { url = "https://files.pythonhosted.org/packages/10/bf/979224a919a1b606c82bd2c5fa49b5c6d5727aa47b4312bb27b1734f53cd/charset_normalizer-3.4.4-cp314-cp314-manylinux2014_armv7l.manylinux_2_17_armv7l.manylinux_2_31_armv7l.whl", hash = "sha256:74664978bb272435107de04e36db5a9735e78232b85b77d45cfb38f758efd33e", size = 143641, upload-time = "2025-10-14T04:41:36.116Z" },
@@ -204,58 +149,6 @@ version = "7.11.0"
 source = { registry = "https://pypi.org/simple" }
 sdist = { url = "https://files.pythonhosted.org/packages/1c/38/ee22495420457259d2f3390309505ea98f98a5eed40901cf62196abad006/coverage-7.11.0.tar.gz", hash = "sha256:167bd504ac1ca2af7ff3b81d245dfea0292c5032ebef9d66cc08a7d28c1b8050", size = 811905, upload-time = "2025-10-15T15:15:08.542Z" }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/49/3a/ee1074c15c408ddddddb1db7dd904f6b81bc524e01f5a1c5920e13dbde23/coverage-7.11.0-cp311-cp311-macosx_10_9_x86_64.whl", hash = "sha256:3d58ecaa865c5b9fa56e35efc51d1014d4c0d22838815b9fce57a27dd9576847", size = 215912, upload-time = "2025-10-15T15:12:40.665Z" },
-    { url = "https://files.pythonhosted.org/packages/70/c4/9f44bebe5cb15f31608597b037d78799cc5f450044465bcd1ae8cb222fe1/coverage-7.11.0-cp311-cp311-macosx_11_0_arm64.whl", hash = "sha256:b679e171f1c104a5668550ada700e3c4937110dbdd153b7ef9055c4f1a1ee3cc", size = 216310, upload-time = "2025-10-15T15:12:42.461Z" },
-    { url = "https://files.pythonhosted.org/packages/42/01/5e06077cfef92d8af926bdd86b84fb28bf9bc6ad27343d68be9b501d89f2/coverage-7.11.0-cp311-cp311-manylinux1_i686.manylinux_2_28_i686.manylinux_2_5_i686.whl", hash = "sha256:ca61691ba8c5b6797deb221a0d09d7470364733ea9c69425a640f1f01b7c5bf0", size = 246706, upload-time = "2025-10-15T15:12:44.001Z" },
-    { url = "https://files.pythonhosted.org/packages/40/b8/7a3f1f33b35cc4a6c37e759137533119560d06c0cc14753d1a803be0cd4a/coverage-7.11.0-cp311-cp311-manylinux1_x86_64.manylinux_2_28_x86_64.manylinux_2_5_x86_64.whl", hash = "sha256:aef1747ede4bd8ca9cfc04cc3011516500c6891f1b33a94add3253f6f876b7b7", size = 248634, upload-time = "2025-10-15T15:12:45.768Z" },
-    { url = "https://files.pythonhosted.org/packages/7a/41/7f987eb33de386bc4c665ab0bf98d15fcf203369d6aacae74f5dd8ec489a/coverage-7.11.0-cp311-cp311-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:a1839d08406e4cba2953dcc0ffb312252f14d7c4c96919f70167611f4dee2623", size = 250741, upload-time = "2025-10-15T15:12:47.222Z" },
-    { url = "https://files.pythonhosted.org/packages/23/c1/a4e0ca6a4e83069fb8216b49b30a7352061ca0cb38654bd2dc96b7b3b7da/coverage-7.11.0-cp311-cp311-manylinux_2_31_riscv64.manylinux_2_39_riscv64.whl", hash = "sha256:e0eb0a2dcc62478eb5b4cbb80b97bdee852d7e280b90e81f11b407d0b81c4287", size = 246837, upload-time = "2025-10-15T15:12:48.904Z" },
-    { url = "https://files.pythonhosted.org/packages/5d/03/ced062a17f7c38b4728ff76c3acb40d8465634b20b4833cdb3cc3a74e115/coverage-7.11.0-cp311-cp311-musllinux_1_2_aarch64.whl", hash = "sha256:bc1fbea96343b53f65d5351d8fd3b34fd415a2670d7c300b06d3e14a5af4f552", size = 248429, upload-time = "2025-10-15T15:12:50.73Z" },
-    { url = "https://files.pythonhosted.org/packages/97/af/a7c6f194bb8c5a2705ae019036b8fe7f49ea818d638eedb15fdb7bed227c/coverage-7.11.0-cp311-cp311-musllinux_1_2_i686.whl", hash = "sha256:214b622259dd0cf435f10241f1333d32caa64dbc27f8790ab693428a141723de", size = 246490, upload-time = "2025-10-15T15:12:52.646Z" },
-    { url = "https://files.pythonhosted.org/packages/ab/c3/aab4df02b04a8fde79068c3c41ad7a622b0ef2b12e1ed154da986a727c3f/coverage-7.11.0-cp311-cp311-musllinux_1_2_riscv64.whl", hash = "sha256:258d9967520cca899695d4eb7ea38be03f06951d6ca2f21fb48b1235f791e601", size = 246208, upload-time = "2025-10-15T15:12:54.586Z" },
-    { url = "https://files.pythonhosted.org/packages/30/d8/e282ec19cd658238d60ed404f99ef2e45eed52e81b866ab1518c0d4163cf/coverage-7.11.0-cp311-cp311-musllinux_1_2_x86_64.whl", hash = "sha256:cf9e6ff4ca908ca15c157c409d608da77a56a09877b97c889b98fb2c32b6465e", size = 247126, upload-time = "2025-10-15T15:12:56.485Z" },
-    { url = "https://files.pythonhosted.org/packages/d1/17/a635fa07fac23adb1a5451ec756216768c2767efaed2e4331710342a3399/coverage-7.11.0-cp311-cp311-win32.whl", hash = "sha256:fcc15fc462707b0680cff6242c48625da7f9a16a28a41bb8fd7a4280920e676c", size = 218314, upload-time = "2025-10-15T15:12:58.365Z" },
-    { url = "https://files.pythonhosted.org/packages/2a/29/2ac1dfcdd4ab9a70026edc8d715ece9b4be9a1653075c658ee6f271f394d/coverage-7.11.0-cp311-cp311-win_amd64.whl", hash = "sha256:865965bf955d92790f1facd64fe7ff73551bd2c1e7e6b26443934e9701ba30b9", size = 219203, upload-time = "2025-10-15T15:12:59.902Z" },
-    { url = "https://files.pythonhosted.org/packages/03/21/5ce8b3a0133179115af4c041abf2ee652395837cb896614beb8ce8ddcfd9/coverage-7.11.0-cp311-cp311-win_arm64.whl", hash = "sha256:5693e57a065760dcbeb292d60cc4d0231a6d4b6b6f6a3191561e1d5e8820b745", size = 217879, upload-time = "2025-10-15T15:13:01.35Z" },
-    { url = "https://files.pythonhosted.org/packages/c4/db/86f6906a7c7edc1a52b2c6682d6dd9be775d73c0dfe2b84f8923dfea5784/coverage-7.11.0-cp312-cp312-macosx_10_13_x86_64.whl", hash = "sha256:9c49e77811cf9d024b95faf86c3f059b11c0c9be0b0d61bc598f453703bd6fd1", size = 216098, upload-time = "2025-10-15T15:13:02.916Z" },
-    { url = "https://files.pythonhosted.org/packages/21/54/e7b26157048c7ba555596aad8569ff903d6cd67867d41b75287323678ede/coverage-7.11.0-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:a61e37a403a778e2cda2a6a39abcc895f1d984071942a41074b5c7ee31642007", size = 216331, upload-time = "2025-10-15T15:13:04.403Z" },
-    { url = "https://files.pythonhosted.org/packages/b9/19/1ce6bf444f858b83a733171306134a0544eaddf1ca8851ede6540a55b2ad/coverage-7.11.0-cp312-cp312-manylinux1_i686.manylinux_2_28_i686.manylinux_2_5_i686.whl", hash = "sha256:c79cae102bb3b1801e2ef1511fb50e91ec83a1ce466b2c7c25010d884336de46", size = 247825, upload-time = "2025-10-15T15:13:05.92Z" },
-    { url = "https://files.pythonhosted.org/packages/71/0b/d3bcbbc259fcced5fb67c5d78f6e7ee965f49760c14afd931e9e663a83b2/coverage-7.11.0-cp312-cp312-manylinux1_x86_64.manylinux_2_28_x86_64.manylinux_2_5_x86_64.whl", hash = "sha256:16ce17ceb5d211f320b62df002fa7016b7442ea0fd260c11cec8ce7730954893", size = 250573, upload-time = "2025-10-15T15:13:07.471Z" },
-    { url = "https://files.pythonhosted.org/packages/58/8d/b0ff3641a320abb047258d36ed1c21d16be33beed4152628331a1baf3365/coverage-7.11.0-cp312-cp312-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:80027673e9d0bd6aef86134b0771845e2da85755cf686e7c7c59566cf5a89115", size = 251706, upload-time = "2025-10-15T15:13:09.4Z" },
-    { url = "https://files.pythonhosted.org/packages/59/c8/5a586fe8c7b0458053d9c687f5cff515a74b66c85931f7fe17a1c958b4ac/coverage-7.11.0-cp312-cp312-manylinux_2_31_riscv64.manylinux_2_39_riscv64.whl", hash = "sha256:4d3ffa07a08657306cd2215b0da53761c4d73cb54d9143b9303a6481ec0cd415", size = 248221, upload-time = "2025-10-15T15:13:10.964Z" },
-    { url = "https://files.pythonhosted.org/packages/d0/ff/3a25e3132804ba44cfa9a778cdf2b73dbbe63ef4b0945e39602fc896ba52/coverage-7.11.0-cp312-cp312-musllinux_1_2_aarch64.whl", hash = "sha256:a3b6a5f8b2524fd6c1066bc85bfd97e78709bb5e37b5b94911a6506b65f47186", size = 249624, upload-time = "2025-10-15T15:13:12.5Z" },
-    { url = "https://files.pythonhosted.org/packages/c5/12/ff10c8ce3895e1b17a73485ea79ebc1896a9e466a9d0f4aef63e0d17b718/coverage-7.11.0-cp312-cp312-musllinux_1_2_i686.whl", hash = "sha256:fcc0a4aa589de34bc56e1a80a740ee0f8c47611bdfb28cd1849de60660f3799d", size = 247744, upload-time = "2025-10-15T15:13:14.554Z" },
-    { url = "https://files.pythonhosted.org/packages/16/02/d500b91f5471b2975947e0629b8980e5e90786fe316b6d7299852c1d793d/coverage-7.11.0-cp312-cp312-musllinux_1_2_riscv64.whl", hash = "sha256:dba82204769d78c3fd31b35c3d5f46e06511936c5019c39f98320e05b08f794d", size = 247325, upload-time = "2025-10-15T15:13:16.438Z" },
-    { url = "https://files.pythonhosted.org/packages/77/11/dee0284fbbd9cd64cfce806b827452c6df3f100d9e66188e82dfe771d4af/coverage-7.11.0-cp312-cp312-musllinux_1_2_x86_64.whl", hash = "sha256:81b335f03ba67309a95210caf3eb43bd6fe75a4e22ba653ef97b4696c56c7ec2", size = 249180, upload-time = "2025-10-15T15:13:17.959Z" },
-    { url = "https://files.pythonhosted.org/packages/59/1b/cdf1def928f0a150a057cab03286774e73e29c2395f0d30ce3d9e9f8e697/coverage-7.11.0-cp312-cp312-win32.whl", hash = "sha256:037b2d064c2f8cc8716fe4d39cb705779af3fbf1ba318dc96a1af858888c7bb5", size = 218479, upload-time = "2025-10-15T15:13:19.608Z" },
-    { url = "https://files.pythonhosted.org/packages/ff/55/e5884d55e031da9c15b94b90a23beccc9d6beee65e9835cd6da0a79e4f3a/coverage-7.11.0-cp312-cp312-win_amd64.whl", hash = "sha256:d66c0104aec3b75e5fd897e7940188ea1892ca1d0235316bf89286d6a22568c0", size = 219290, upload-time = "2025-10-15T15:13:21.593Z" },
-    { url = "https://files.pythonhosted.org/packages/23/a8/faa930cfc71c1d16bc78f9a19bb73700464f9c331d9e547bfbc1dbd3a108/coverage-7.11.0-cp312-cp312-win_arm64.whl", hash = "sha256:d91ebeac603812a09cf6a886ba6e464f3bbb367411904ae3790dfe28311b15ad", size = 217924, upload-time = "2025-10-15T15:13:23.39Z" },
-    { url = "https://files.pythonhosted.org/packages/60/7f/85e4dfe65e400645464b25c036a26ac226cf3a69d4a50c3934c532491cdd/coverage-7.11.0-cp313-cp313-macosx_10_13_x86_64.whl", hash = "sha256:cc3f49e65ea6e0d5d9bd60368684fe52a704d46f9e7fc413918f18d046ec40e1", size = 216129, upload-time = "2025-10-15T15:13:25.371Z" },
-    { url = "https://files.pythonhosted.org/packages/96/5d/dc5fa98fea3c175caf9d360649cb1aa3715e391ab00dc78c4c66fabd7356/coverage-7.11.0-cp313-cp313-macosx_11_0_arm64.whl", hash = "sha256:f39ae2f63f37472c17b4990f794035c9890418b1b8cca75c01193f3c8d3e01be", size = 216380, upload-time = "2025-10-15T15:13:26.976Z" },
-    { url = "https://files.pythonhosted.org/packages/b2/f5/3da9cc9596708273385189289c0e4d8197d37a386bdf17619013554b3447/coverage-7.11.0-cp313-cp313-manylinux1_i686.manylinux_2_28_i686.manylinux_2_5_i686.whl", hash = "sha256:7db53b5cdd2917b6eaadd0b1251cf4e7d96f4a8d24e174bdbdf2f65b5ea7994d", size = 247375, upload-time = "2025-10-15T15:13:28.923Z" },
-    { url = "https://files.pythonhosted.org/packages/65/6c/f7f59c342359a235559d2bc76b0c73cfc4bac7d61bb0df210965cb1ecffd/coverage-7.11.0-cp313-cp313-manylinux1_x86_64.manylinux_2_28_x86_64.manylinux_2_5_x86_64.whl", hash = "sha256:10ad04ac3a122048688387828b4537bc9cf60c0bf4869c1e9989c46e45690b82", size = 249978, upload-time = "2025-10-15T15:13:30.525Z" },
-    { url = "https://files.pythonhosted.org/packages/e7/8c/042dede2e23525e863bf1ccd2b92689692a148d8b5fd37c37899ba882645/coverage-7.11.0-cp313-cp313-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:4036cc9c7983a2b1f2556d574d2eb2154ac6ed55114761685657e38782b23f52", size = 251253, upload-time = "2025-10-15T15:13:32.174Z" },
-    { url = "https://files.pythonhosted.org/packages/7b/a9/3c58df67bfa809a7bddd786356d9c5283e45d693edb5f3f55d0986dd905a/coverage-7.11.0-cp313-cp313-manylinux_2_31_riscv64.manylinux_2_39_riscv64.whl", hash = "sha256:7ab934dd13b1c5e94b692b1e01bd87e4488cb746e3a50f798cb9464fd128374b", size = 247591, upload-time = "2025-10-15T15:13:34.147Z" },
-    { url = "https://files.pythonhosted.org/packages/26/5b/c7f32efd862ee0477a18c41e4761305de6ddd2d49cdeda0c1116227570fd/coverage-7.11.0-cp313-cp313-musllinux_1_2_aarch64.whl", hash = "sha256:59a6e5a265f7cfc05f76e3bb53eca2e0dfe90f05e07e849930fecd6abb8f40b4", size = 249411, upload-time = "2025-10-15T15:13:38.425Z" },
-    { url = "https://files.pythonhosted.org/packages/76/b5/78cb4f1e86c1611431c990423ec0768122905b03837e1b4c6a6f388a858b/coverage-7.11.0-cp313-cp313-musllinux_1_2_i686.whl", hash = "sha256:df01d6c4c81e15a7c88337b795bb7595a8596e92310266b5072c7e301168efbd", size = 247303, upload-time = "2025-10-15T15:13:40.464Z" },
-    { url = "https://files.pythonhosted.org/packages/87/c9/23c753a8641a330f45f221286e707c427e46d0ffd1719b080cedc984ec40/coverage-7.11.0-cp313-cp313-musllinux_1_2_riscv64.whl", hash = "sha256:8c934bd088eed6174210942761e38ee81d28c46de0132ebb1801dbe36a390dcc", size = 247157, upload-time = "2025-10-15T15:13:42.087Z" },
-    { url = "https://files.pythonhosted.org/packages/c5/42/6e0cc71dc8a464486e944a4fa0d85bdec031cc2969e98ed41532a98336b9/coverage-7.11.0-cp313-cp313-musllinux_1_2_x86_64.whl", hash = "sha256:5a03eaf7ec24078ad64a07f02e30060aaf22b91dedf31a6b24d0d98d2bba7f48", size = 248921, upload-time = "2025-10-15T15:13:43.715Z" },
-    { url = "https://files.pythonhosted.org/packages/e8/1c/743c2ef665e6858cccb0f84377dfe3a4c25add51e8c7ef19249be92465b6/coverage-7.11.0-cp313-cp313-win32.whl", hash = "sha256:695340f698a5f56f795b2836abe6fb576e7c53d48cd155ad2f80fd24bc63a040", size = 218526, upload-time = "2025-10-15T15:13:45.336Z" },
-    { url = "https://files.pythonhosted.org/packages/ff/d5/226daadfd1bf8ddbccefbd3aa3547d7b960fb48e1bdac124e2dd13a2b71a/coverage-7.11.0-cp313-cp313-win_amd64.whl", hash = "sha256:2727d47fce3ee2bac648528e41455d1b0c46395a087a229deac75e9f88ba5a05", size = 219317, upload-time = "2025-10-15T15:13:47.401Z" },
-    { url = "https://files.pythonhosted.org/packages/97/54/47db81dcbe571a48a298f206183ba8a7ba79200a37cd0d9f4788fcd2af4a/coverage-7.11.0-cp313-cp313-win_arm64.whl", hash = "sha256:0efa742f431529699712b92ecdf22de8ff198df41e43aeaaadf69973eb93f17a", size = 217948, upload-time = "2025-10-15T15:13:49.096Z" },
-    { url = "https://files.pythonhosted.org/packages/e5/8b/cb68425420154e7e2a82fd779a8cc01549b6fa83c2ad3679cd6c088ebd07/coverage-7.11.0-cp313-cp313t-macosx_10_13_x86_64.whl", hash = "sha256:587c38849b853b157706407e9ebdca8fd12f45869edb56defbef2daa5fb0812b", size = 216837, upload-time = "2025-10-15T15:13:51.09Z" },
-    { url = "https://files.pythonhosted.org/packages/33/55/9d61b5765a025685e14659c8d07037247de6383c0385757544ffe4606475/coverage-7.11.0-cp313-cp313t-macosx_11_0_arm64.whl", hash = "sha256:b971bdefdd75096163dd4261c74be813c4508477e39ff7b92191dea19f24cd37", size = 217061, upload-time = "2025-10-15T15:13:52.747Z" },
-    { url = "https://files.pythonhosted.org/packages/52/85/292459c9186d70dcec6538f06ea251bc968046922497377bf4a1dc9a71de/coverage-7.11.0-cp313-cp313t-manylinux1_i686.manylinux_2_28_i686.manylinux_2_5_i686.whl", hash = "sha256:269bfe913b7d5be12ab13a95f3a76da23cf147be7fa043933320ba5625f0a8de", size = 258398, upload-time = "2025-10-15T15:13:54.45Z" },
-    { url = "https://files.pythonhosted.org/packages/1f/e2/46edd73fb8bf51446c41148d81944c54ed224854812b6ca549be25113ee0/coverage-7.11.0-cp313-cp313t-manylinux1_x86_64.manylinux_2_28_x86_64.manylinux_2_5_x86_64.whl", hash = "sha256:dadbcce51a10c07b7c72b0ce4a25e4b6dcb0c0372846afb8e5b6307a121eb99f", size = 260574, upload-time = "2025-10-15T15:13:56.145Z" },
-    { url = "https://files.pythonhosted.org/packages/07/5e/1df469a19007ff82e2ca8fe509822820a31e251f80ee7344c34f6cd2ec43/coverage-7.11.0-cp313-cp313t-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:9ed43fa22c6436f7957df036331f8fe4efa7af132054e1844918866cd228af6c", size = 262797, upload-time = "2025-10-15T15:13:58.635Z" },
-    { url = "https://files.pythonhosted.org/packages/f9/50/de216b31a1434b94d9b34a964c09943c6be45069ec704bfc379d8d89a649/coverage-7.11.0-cp313-cp313t-manylinux_2_31_riscv64.manylinux_2_39_riscv64.whl", hash = "sha256:9516add7256b6713ec08359b7b05aeff8850c98d357784c7205b2e60aa2513fa", size = 257361, upload-time = "2025-10-15T15:14:00.409Z" },
-    { url = "https://files.pythonhosted.org/packages/82/1e/3f9f8344a48111e152e0fd495b6fff13cc743e771a6050abf1627a7ba918/coverage-7.11.0-cp313-cp313t-musllinux_1_2_aarch64.whl", hash = "sha256:eb92e47c92fcbcdc692f428da67db33337fa213756f7adb6a011f7b5a7a20740", size = 260349, upload-time = "2025-10-15T15:14:02.188Z" },
-    { url = "https://files.pythonhosted.org/packages/65/9b/3f52741f9e7d82124272f3070bbe316006a7de1bad1093f88d59bfc6c548/coverage-7.11.0-cp313-cp313t-musllinux_1_2_i686.whl", hash = "sha256:d06f4fc7acf3cabd6d74941d53329e06bab00a8fe10e4df2714f0b134bfc64ef", size = 258114, upload-time = "2025-10-15T15:14:03.907Z" },
-    { url = "https://files.pythonhosted.org/packages/0b/8b/918f0e15f0365d50d3986bbd3338ca01178717ac5678301f3f547b6619e6/coverage-7.11.0-cp313-cp313t-musllinux_1_2_riscv64.whl", hash = "sha256:6fbcee1a8f056af07ecd344482f711f563a9eb1c2cad192e87df00338ec3cdb0", size = 256723, upload-time = "2025-10-15T15:14:06.324Z" },
-    { url = "https://files.pythonhosted.org/packages/44/9e/7776829f82d3cf630878a7965a7d70cc6ca94f22c7d20ec4944f7148cb46/coverage-7.11.0-cp313-cp313t-musllinux_1_2_x86_64.whl", hash = "sha256:dbbf012be5f32533a490709ad597ad8a8ff80c582a95adc8d62af664e532f9ca", size = 259238, upload-time = "2025-10-15T15:14:08.002Z" },
-    { url = "https://files.pythonhosted.org/packages/9a/b8/49cf253e1e7a3bedb85199b201862dd7ca4859f75b6cf25ffa7298aa0760/coverage-7.11.0-cp313-cp313t-win32.whl", hash = "sha256:cee6291bb4fed184f1c2b663606a115c743df98a537c969c3c64b49989da96c2", size = 219180, upload-time = "2025-10-15T15:14:09.786Z" },
-    { url = "https://files.pythonhosted.org/packages/ac/e1/1a541703826be7ae2125a0fb7f821af5729d56bb71e946e7b933cc7a89a4/coverage-7.11.0-cp313-cp313t-win_amd64.whl", hash = "sha256:a386c1061bf98e7ea4758e4313c0ab5ecf57af341ef0f43a0bf26c2477b5c268", size = 220241, upload-time = "2025-10-15T15:14:11.471Z" },
-    { url = "https://files.pythonhosted.org/packages/d5/d1/5ee0e0a08621140fd418ec4020f595b4d52d7eb429ae6a0c6542b4ba6f14/coverage-7.11.0-cp313-cp313t-win_arm64.whl", hash = "sha256:f9ea02ef40bb83823b2b04964459d281688fe173e20643870bb5d2edf68bc836", size = 218510, upload-time = "2025-10-15T15:14:13.46Z" },
     { url = "https://files.pythonhosted.org/packages/f4/06/e923830c1985ce808e40a3fa3eb46c13350b3224b7da59757d37b6ce12b8/coverage-7.11.0-cp314-cp314-macosx_10_13_x86_64.whl", hash = "sha256:c770885b28fb399aaf2a65bbd1c12bf6f307ffd112d6a76c5231a94276f0c497", size = 216110, upload-time = "2025-10-15T15:14:15.157Z" },
     { url = "https://files.pythonhosted.org/packages/42/82/cdeed03bfead45203fb651ed756dfb5266028f5f939e7f06efac4041dad5/coverage-7.11.0-cp314-cp314-macosx_11_0_arm64.whl", hash = "sha256:a3d0e2087dba64c86a6b254f43e12d264b636a39e88c5cc0a01a7c71bcfdab7e", size = 216395, upload-time = "2025-10-15T15:14:16.863Z" },
     { url = "https://files.pythonhosted.org/packages/fc/ba/e1c80caffc3199aa699813f73ff097bc2df7b31642bdbc7493600a8f1de5/coverage-7.11.0-cp314-cp314-manylinux1_i686.manylinux_2_28_i686.manylinux_2_5_i686.whl", hash = "sha256:73feb83bb41c32811973b8565f3705caf01d928d972b72042b44e97c71fd70d1", size = 247433, upload-time = "2025-10-15T15:14:18.589Z" },
@@ -285,11 +178,6 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/5f/04/642c1d8a448ae5ea1369eac8495740a79eb4e581a9fb0cbdce56bbf56da1/coverage-7.11.0-py3-none-any.whl", hash = "sha256:4b7589765348d78fb4e5fb6ea35d07564e387da2fc5efff62e0222971f155f68", size = 207761, upload-time = "2025-10-15T15:15:06.439Z" },
 ]
 
-[package.optional-dependencies]
-toml = [
-    { name = "tomli", marker = "python_full_version <= '3.11'" },
-]
-
 [[package]]
 name = "distlib"
 version = "0.4.0"
@@ -299,32 +187,6 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/33/6b/e0547afaf41bf2c42e52430072fa5658766e3d65bd4b03a563d1b6336f57/distlib-0.4.0-py2.py3-none-any.whl", hash = "sha256:9659f7d87e46584a30b5780e43ac7a2143098441670ff0a49d5f9034c54a6c16", size = 469047, upload-time = "2025-07-17T16:51:58.613Z" },
 ]
 
-[[package]]
-name = "duckdb"
-version = "1.4.1"
-source = { registry = "https://pypi.org/simple" }
-sdist = { url = "https://files.pythonhosted.org/packages/ea/e7/21cf50a3d52ffceee1f0bcc3997fa96a5062e6bab705baee4f6c4e33cce5/duckdb-1.4.1.tar.gz", hash = "sha256:f903882f045d057ebccad12ac69975952832edfe133697694854bb784b8d6c76", size = 18461687, upload-time = "2025-10-07T10:37:28.605Z" }
-wheels = [
-    { url = "https://files.pythonhosted.org/packages/d9/52/606f13fa9669a24166d2fe523e28982d8ef9039874b4de774255c7806d1f/duckdb-1.4.1-cp311-cp311-macosx_10_9_universal2.whl", hash = "sha256:605d563c1d5203ca992497cd33fb386ac3d533deca970f9dcf539f62a34e22a9", size = 29065894, upload-time = "2025-10-07T10:36:29.837Z" },
-    { url = "https://files.pythonhosted.org/packages/84/57/138241952ece868b9577e607858466315bed1739e1fbb47205df4dfdfd88/duckdb-1.4.1-cp311-cp311-macosx_10_9_x86_64.whl", hash = "sha256:d3305c7c4b70336171de7adfdb50431f23671c000f11839b580c4201d9ce6ef5", size = 16163720, upload-time = "2025-10-07T10:36:32.241Z" },
-    { url = "https://files.pythonhosted.org/packages/a3/81/afa3a0a78498a6f4acfea75c48a70c5082032d9ac87822713d7c2d164af1/duckdb-1.4.1-cp311-cp311-macosx_11_0_arm64.whl", hash = "sha256:a063d6febbe34b32f1ad2e68822db4d0e4b1102036f49aaeeb22b844427a75df", size = 13756223, upload-time = "2025-10-07T10:36:34.673Z" },
-    { url = "https://files.pythonhosted.org/packages/47/dd/5f6064fbd9248e37a3e806a244f81e0390ab8f989d231b584fb954f257fc/duckdb-1.4.1-cp311-cp311-manylinux_2_27_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:d1ffcaaf74f7d1df3684b54685cbf8d3ce732781c541def8e1ced304859733ae", size = 18487022, upload-time = "2025-10-07T10:36:36.759Z" },
-    { url = "https://files.pythonhosted.org/packages/a1/10/b54969a1c42fd9344ad39228d671faceb8aa9f144b67cd9531a63551757f/duckdb-1.4.1-cp311-cp311-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:685d3d1599dc08160e0fa0cf09e93ac4ff8b8ed399cb69f8b5391cd46b5b207c", size = 20491004, upload-time = "2025-10-07T10:36:39.318Z" },
-    { url = "https://files.pythonhosted.org/packages/ed/d5/7332ae8f804869a4e895937821b776199a283f8d9fc775fd3ae5a0558099/duckdb-1.4.1-cp311-cp311-win_amd64.whl", hash = "sha256:78f1d28a15ae73bd449c43f80233732adffa49be1840a32de8f1a6bb5b286764", size = 12327619, upload-time = "2025-10-07T10:36:41.509Z" },
-    { url = "https://files.pythonhosted.org/packages/0e/6c/906a3fe41cd247b5638866fc1245226b528de196588802d4df4df1e6e819/duckdb-1.4.1-cp312-cp312-macosx_10_13_universal2.whl", hash = "sha256:cd1765a7d180b7482874586859fc23bc9969d7d6c96ced83b245e6c6f49cde7f", size = 29076820, upload-time = "2025-10-07T10:36:43.782Z" },
-    { url = "https://files.pythonhosted.org/packages/66/c7/01dd33083f01f618c2a29f6dd068baf16945b8cbdb132929d3766610bbbb/duckdb-1.4.1-cp312-cp312-macosx_10_13_x86_64.whl", hash = "sha256:8ed7a86725185470953410823762956606693c0813bb64e09c7d44dbd9253a64", size = 16167558, upload-time = "2025-10-07T10:36:46.003Z" },
-    { url = "https://files.pythonhosted.org/packages/81/e2/f983b4b7ae1dfbdd2792dd31dee9a0d35f88554452cbfc6c9d65e22fdfa9/duckdb-1.4.1-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:8a189bdfc64cfb9cc1adfbe4f2dcfde0a4992ec08505ad8ce33c886e4813f0bf", size = 13762226, upload-time = "2025-10-07T10:36:48.55Z" },
-    { url = "https://files.pythonhosted.org/packages/ed/34/fb69a7be19b90f573b3cc890961be7b11870b77514769655657514f10a98/duckdb-1.4.1-cp312-cp312-manylinux_2_27_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:a9090089b6486f7319c92acdeed8acda022d4374032d78a465956f50fc52fabf", size = 18500901, upload-time = "2025-10-07T10:36:52.445Z" },
-    { url = "https://files.pythonhosted.org/packages/e4/a5/1395d7b49d5589e85da9a9d7ffd8b50364c9d159c2807bef72d547f0ad1e/duckdb-1.4.1-cp312-cp312-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:142552ea3e768048e0e8c832077a545ca07792631c59edaee925e3e67401c2a0", size = 20514177, upload-time = "2025-10-07T10:36:55.358Z" },
-    { url = "https://files.pythonhosted.org/packages/c0/21/08f10706d30252753349ec545833fc0cea67c11abd0b5223acf2827f1056/duckdb-1.4.1-cp312-cp312-win_amd64.whl", hash = "sha256:567f3b3a785a9e8650612461893c49ca799661d2345a6024dda48324ece89ded", size = 12336422, upload-time = "2025-10-07T10:36:57.521Z" },
-    { url = "https://files.pythonhosted.org/packages/d7/08/705988c33e38665c969f7876b3ca4328be578554aa7e3dc0f34158da3e64/duckdb-1.4.1-cp313-cp313-macosx_10_13_universal2.whl", hash = "sha256:46496a2518752ae0c6c5d75d4cdecf56ea23dd098746391176dd8e42cf157791", size = 29077070, upload-time = "2025-10-07T10:36:59.83Z" },
-    { url = "https://files.pythonhosted.org/packages/99/c5/7c9165f1e6b9069441bcda4da1e19382d4a2357783d37ff9ae238c5c41ac/duckdb-1.4.1-cp313-cp313-macosx_10_13_x86_64.whl", hash = "sha256:1c65ae7e9b541cea07d8075343bcfebdecc29a3c0481aa6078ee63d51951cfcd", size = 16167506, upload-time = "2025-10-07T10:37:02.24Z" },
-    { url = "https://files.pythonhosted.org/packages/38/46/267f4a570a0ee3ae6871ddc03435f9942884284e22a7ba9b7cb252ee69b6/duckdb-1.4.1-cp313-cp313-macosx_11_0_arm64.whl", hash = "sha256:598d1a314e34b65d9399ddd066ccce1eeab6a60a2ef5885a84ce5ed62dbaf729", size = 13762330, upload-time = "2025-10-07T10:37:04.581Z" },
-    { url = "https://files.pythonhosted.org/packages/15/7b/c4f272a40c36d82df20937d93a1780eb39ab0107fe42b62cba889151eab9/duckdb-1.4.1-cp313-cp313-manylinux_2_27_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:e2f16b8def782d484a9f035fc422bb6f06941ed0054b4511ddcdc514a7fb6a75", size = 18504687, upload-time = "2025-10-07T10:37:06.991Z" },
-    { url = "https://files.pythonhosted.org/packages/17/fc/9b958751f0116d7b0406406b07fa6f5a10c22d699be27826d0b896f9bf51/duckdb-1.4.1-cp313-cp313-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:a5a7d0aed068a5c33622a8848857947cab5cfb3f2a315b1251849bac2c74c492", size = 20513823, upload-time = "2025-10-07T10:37:09.349Z" },
-    { url = "https://files.pythonhosted.org/packages/30/79/4f544d73fcc0513b71296cb3ebb28a227d22e80dec27204977039b9fa875/duckdb-1.4.1-cp313-cp313-win_amd64.whl", hash = "sha256:280fd663dacdd12bb3c3bf41f3e5b2e5b95e00b88120afabb8b8befa5f335c6f", size = 12336460, upload-time = "2025-10-07T10:37:12.154Z" },
-]
-
 [[package]]
 name = "et-xmlfile"
 version = "2.0.0"
@@ -445,27 +307,6 @@ name = "google-crc32c"
 version = "1.7.1"
 source = { registry = "https://pypi.org/simple" }
 sdist = { url = "https://files.pythonhosted.org/packages/19/ae/87802e6d9f9d69adfaedfcfd599266bf386a54d0be058b532d04c794f76d/google_crc32c-1.7.1.tar.gz", hash = "sha256:2bff2305f98846f3e825dbeec9ee406f89da7962accdb29356e4eadc251bd472", size = 14495, upload-time = "2025-03-26T14:29:13.32Z" }
-wheels = [
-    { url = "https://files.pythonhosted.org/packages/f7/94/220139ea87822b6fdfdab4fb9ba81b3fff7ea2c82e2af34adc726085bffc/google_crc32c-1.7.1-cp311-cp311-macosx_12_0_arm64.whl", hash = "sha256:6fbab4b935989e2c3610371963ba1b86afb09537fd0c633049be82afe153ac06", size = 30468, upload-time = "2025-03-26T14:32:52.215Z" },
-    { url = "https://files.pythonhosted.org/packages/94/97/789b23bdeeb9d15dc2904660463ad539d0318286d7633fe2760c10ed0c1c/google_crc32c-1.7.1-cp311-cp311-macosx_12_0_x86_64.whl", hash = "sha256:ed66cbe1ed9cbaaad9392b5259b3eba4a9e565420d734e6238813c428c3336c9", size = 30313, upload-time = "2025-03-26T14:57:38.758Z" },
-    { url = "https://files.pythonhosted.org/packages/81/b8/976a2b843610c211e7ccb3e248996a61e87dbb2c09b1499847e295080aec/google_crc32c-1.7.1-cp311-cp311-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:ee6547b657621b6cbed3562ea7826c3e11cab01cd33b74e1f677690652883e77", size = 33048, upload-time = "2025-03-26T14:41:30.679Z" },
-    { url = "https://files.pythonhosted.org/packages/c9/16/a3842c2cf591093b111d4a5e2bfb478ac6692d02f1b386d2a33283a19dc9/google_crc32c-1.7.1-cp311-cp311-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:d68e17bad8f7dd9a49181a1f5a8f4b251c6dbc8cc96fb79f1d321dfd57d66f53", size = 32669, upload-time = "2025-03-26T14:41:31.432Z" },
-    { url = "https://files.pythonhosted.org/packages/04/17/ed9aba495916fcf5fe4ecb2267ceb851fc5f273c4e4625ae453350cfd564/google_crc32c-1.7.1-cp311-cp311-win_amd64.whl", hash = "sha256:6335de12921f06e1f774d0dd1fbea6bf610abe0887a1638f64d694013138be5d", size = 33476, upload-time = "2025-03-26T14:29:10.211Z" },
-    { url = "https://files.pythonhosted.org/packages/dd/b7/787e2453cf8639c94b3d06c9d61f512234a82e1d12d13d18584bd3049904/google_crc32c-1.7.1-cp312-cp312-macosx_12_0_arm64.whl", hash = "sha256:2d73a68a653c57281401871dd4aeebbb6af3191dcac751a76ce430df4d403194", size = 30470, upload-time = "2025-03-26T14:34:31.655Z" },
-    { url = "https://files.pythonhosted.org/packages/ed/b4/6042c2b0cbac3ec3a69bb4c49b28d2f517b7a0f4a0232603c42c58e22b44/google_crc32c-1.7.1-cp312-cp312-macosx_12_0_x86_64.whl", hash = "sha256:22beacf83baaf59f9d3ab2bbb4db0fb018da8e5aebdce07ef9f09fce8220285e", size = 30315, upload-time = "2025-03-26T15:01:54.634Z" },
-    { url = "https://files.pythonhosted.org/packages/29/ad/01e7a61a5d059bc57b702d9ff6a18b2585ad97f720bd0a0dbe215df1ab0e/google_crc32c-1.7.1-cp312-cp312-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:19eafa0e4af11b0a4eb3974483d55d2d77ad1911e6cf6f832e1574f6781fd337", size = 33180, upload-time = "2025-03-26T14:41:32.168Z" },
-    { url = "https://files.pythonhosted.org/packages/3b/a5/7279055cf004561894ed3a7bfdf5bf90a53f28fadd01af7cd166e88ddf16/google_crc32c-1.7.1-cp312-cp312-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:b6d86616faaea68101195c6bdc40c494e4d76f41e07a37ffdef270879c15fb65", size = 32794, upload-time = "2025-03-26T14:41:33.264Z" },
-    { url = "https://files.pythonhosted.org/packages/0f/d6/77060dbd140c624e42ae3ece3df53b9d811000729a5c821b9fd671ceaac6/google_crc32c-1.7.1-cp312-cp312-win_amd64.whl", hash = "sha256:b7491bdc0c7564fcf48c0179d2048ab2f7c7ba36b84ccd3a3e1c3f7a72d3bba6", size = 33477, upload-time = "2025-03-26T14:29:10.94Z" },
-    { url = "https://files.pythonhosted.org/packages/8b/72/b8d785e9184ba6297a8620c8a37cf6e39b81a8ca01bb0796d7cbb28b3386/google_crc32c-1.7.1-cp313-cp313-macosx_12_0_arm64.whl", hash = "sha256:df8b38bdaf1629d62d51be8bdd04888f37c451564c2042d36e5812da9eff3c35", size = 30467, upload-time = "2025-03-26T14:36:06.909Z" },
-    { url = "https://files.pythonhosted.org/packages/34/25/5f18076968212067c4e8ea95bf3b69669f9fc698476e5f5eb97d5b37999f/google_crc32c-1.7.1-cp313-cp313-macosx_12_0_x86_64.whl", hash = "sha256:e42e20a83a29aa2709a0cf271c7f8aefaa23b7ab52e53b322585297bb94d4638", size = 30309, upload-time = "2025-03-26T15:06:15.318Z" },
-    { url = "https://files.pythonhosted.org/packages/92/83/9228fe65bf70e93e419f38bdf6c5ca5083fc6d32886ee79b450ceefd1dbd/google_crc32c-1.7.1-cp313-cp313-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:905a385140bf492ac300026717af339790921f411c0dfd9aa5a9e69a08ed32eb", size = 33133, upload-time = "2025-03-26T14:41:34.388Z" },
-    { url = "https://files.pythonhosted.org/packages/c3/ca/1ea2fd13ff9f8955b85e7956872fdb7050c4ace8a2306a6d177edb9cf7fe/google_crc32c-1.7.1-cp313-cp313-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:6b211ddaf20f7ebeec5c333448582c224a7c90a9d98826fbab82c0ddc11348e6", size = 32773, upload-time = "2025-03-26T14:41:35.19Z" },
-    { url = "https://files.pythonhosted.org/packages/89/32/a22a281806e3ef21b72db16f948cad22ec68e4bdd384139291e00ff82fe2/google_crc32c-1.7.1-cp313-cp313-win_amd64.whl", hash = "sha256:0f99eaa09a9a7e642a61e06742856eec8b19fc0037832e03f941fe7cf0c8e4db", size = 33475, upload-time = "2025-03-26T14:29:11.771Z" },
-    { url = "https://files.pythonhosted.org/packages/b8/c5/002975aff514e57fc084ba155697a049b3f9b52225ec3bc0f542871dd524/google_crc32c-1.7.1-cp313-cp313t-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:32d1da0d74ec5634a05f53ef7df18fc646666a25efaaca9fc7dcfd4caf1d98c3", size = 33243, upload-time = "2025-03-26T14:41:35.975Z" },
-    { url = "https://files.pythonhosted.org/packages/61/cb/c585282a03a0cea70fcaa1bf55d5d702d0f2351094d663ec3be1c6c67c52/google_crc32c-1.7.1-cp313-cp313t-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:e10554d4abc5238823112c2ad7e4560f96c7bf3820b202660373d769d9e6e4c9", size = 32870, upload-time = "2025-03-26T14:41:37.08Z" },
-    { url = "https://files.pythonhosted.org/packages/16/1b/1693372bf423ada422f80fd88260dbfd140754adb15cbc4d7e9a68b1cb8e/google_crc32c-1.7.1-pp311-pypy311_pp73-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:85fef7fae11494e747c9fd1359a527e5970fc9603c90764843caabd3a16a0a48", size = 28241, upload-time = "2025-03-26T14:41:45.898Z" },
-    { url = "https://files.pythonhosted.org/packages/fd/3c/2a19a60a473de48717b4efb19398c3f914795b64a96cf3fbe82588044f78/google_crc32c-1.7.1-pp311-pypy311_pp73-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:6efb97eb4369d52593ad6f75e7e10d053cf00c48983f7a973105bc70b0ac4d82", size = 28048, upload-time = "2025-03-26T14:41:46.696Z" },
-]
 
 [[package]]
 name = "google-resumable-media"
@@ -500,36 +341,6 @@ dependencies = [
 ]
 sdist = { url = "https://files.pythonhosted.org/packages/9d/f7/8963848164c7604efb3a3e6ee457fdb3a469653e19002bd24742473254f8/grpcio-1.75.1.tar.gz", hash = "sha256:3e81d89ece99b9ace23a6916880baca613c03a799925afb2857887efa8b1b3d2", size = 12731327, upload-time = "2025-09-26T09:03:36.887Z" }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/0c/3c/35ca9747473a306bfad0cee04504953f7098527cd112a4ab55c55af9e7bd/grpcio-1.75.1-cp311-cp311-linux_armv7l.whl", hash = "sha256:573855ca2e58e35032aff30bfbd1ee103fbcf4472e4b28d4010757700918e326", size = 5709761, upload-time = "2025-09-26T09:01:28.528Z" },
-    { url = "https://files.pythonhosted.org/packages/c9/2c/ecbcb4241e4edbe85ac2663f885726fea0e947767401288b50d8fdcb9200/grpcio-1.75.1-cp311-cp311-macosx_11_0_universal2.whl", hash = "sha256:6a4996a2c8accc37976dc142d5991adf60733e223e5c9a2219e157dc6a8fd3a2", size = 11496691, upload-time = "2025-09-26T09:01:31.214Z" },
-    { url = "https://files.pythonhosted.org/packages/81/40/bc07aee2911f0d426fa53fe636216100c31a8ea65a400894f280274cb023/grpcio-1.75.1-cp311-cp311-manylinux2014_aarch64.manylinux_2_17_aarch64.whl", hash = "sha256:b1ea1bbe77ecbc1be00af2769f4ae4a88ce93be57a4f3eebd91087898ed749f9", size = 6296084, upload-time = "2025-09-26T09:01:34.596Z" },
-    { url = "https://files.pythonhosted.org/packages/b8/d1/10c067f6c67396cbf46448b80f27583b5e8c4b46cdfbe18a2a02c2c2f290/grpcio-1.75.1-cp311-cp311-manylinux2014_i686.manylinux_2_17_i686.whl", hash = "sha256:e5b425aee54cc5e3e3c58f00731e8a33f5567965d478d516d35ef99fd648ab68", size = 6950403, upload-time = "2025-09-26T09:01:36.736Z" },
-    { url = "https://files.pythonhosted.org/packages/3f/42/5f628abe360b84dfe8dd8f32be6b0606dc31dc04d3358eef27db791ea4d5/grpcio-1.75.1-cp311-cp311-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:0049a7bf547dafaeeb1db17079ce79596c298bfe308fc084d023c8907a845b9a", size = 6470166, upload-time = "2025-09-26T09:01:39.474Z" },
-    { url = "https://files.pythonhosted.org/packages/c3/93/a24035080251324019882ee2265cfde642d6476c0cf8eb207fc693fcebdc/grpcio-1.75.1-cp311-cp311-musllinux_1_2_aarch64.whl", hash = "sha256:5b8ea230c7f77c0a1a3208a04a1eda164633fb0767b4cefd65a01079b65e5b1f", size = 7107828, upload-time = "2025-09-26T09:01:41.782Z" },
-    { url = "https://files.pythonhosted.org/packages/e4/f8/d18b984c1c9ba0318e3628dbbeb6af77a5007f02abc378c845070f2d3edd/grpcio-1.75.1-cp311-cp311-musllinux_1_2_i686.whl", hash = "sha256:36990d629c3c9fb41e546414e5af52d0a7af37ce7113d9682c46d7e2919e4cca", size = 8045421, upload-time = "2025-09-26T09:01:45.835Z" },
-    { url = "https://files.pythonhosted.org/packages/7e/b6/4bf9aacff45deca5eac5562547ed212556b831064da77971a4e632917da3/grpcio-1.75.1-cp311-cp311-musllinux_1_2_x86_64.whl", hash = "sha256:b10ad908118d38c2453ade7ff790e5bce36580c3742919007a2a78e3a1e521ca", size = 7503290, upload-time = "2025-09-26T09:01:49.28Z" },
-    { url = "https://files.pythonhosted.org/packages/3b/15/d8d69d10223cb54c887a2180bd29fe5fa2aec1d4995c8821f7aa6eaf72e4/grpcio-1.75.1-cp311-cp311-win32.whl", hash = "sha256:d6be2b5ee7bea656c954dcf6aa8093c6f0e6a3ef9945c99d99fcbfc88c5c0bfe", size = 3950631, upload-time = "2025-09-26T09:01:51.23Z" },
-    { url = "https://files.pythonhosted.org/packages/8a/40/7b8642d45fff6f83300c24eaac0380a840e5e7fe0e8d80afd31b99d7134e/grpcio-1.75.1-cp311-cp311-win_amd64.whl", hash = "sha256:61c692fb05956b17dd6d1ab480f7f10ad0536dba3bc8fd4e3c7263dc244ed772", size = 4646131, upload-time = "2025-09-26T09:01:53.266Z" },
-    { url = "https://files.pythonhosted.org/packages/3a/81/42be79e73a50aaa20af66731c2defeb0e8c9008d9935a64dd8ea8e8c44eb/grpcio-1.75.1-cp312-cp312-linux_armv7l.whl", hash = "sha256:7b888b33cd14085d86176b1628ad2fcbff94cfbbe7809465097aa0132e58b018", size = 5668314, upload-time = "2025-09-26T09:01:55.424Z" },
-    { url = "https://files.pythonhosted.org/packages/c5/a7/3686ed15822fedc58c22f82b3a7403d9faf38d7c33de46d4de6f06e49426/grpcio-1.75.1-cp312-cp312-macosx_11_0_universal2.whl", hash = "sha256:8775036efe4ad2085975531d221535329f5dac99b6c2a854a995456098f99546", size = 11476125, upload-time = "2025-09-26T09:01:57.927Z" },
-    { url = "https://files.pythonhosted.org/packages/14/85/21c71d674f03345ab183c634ecd889d3330177e27baea8d5d247a89b6442/grpcio-1.75.1-cp312-cp312-manylinux2014_aarch64.manylinux_2_17_aarch64.whl", hash = "sha256:bb658f703468d7fbb5dcc4037c65391b7dc34f808ac46ed9136c24fc5eeb041d", size = 6246335, upload-time = "2025-09-26T09:02:00.76Z" },
-    { url = "https://files.pythonhosted.org/packages/fd/db/3beb661bc56a385ae4fa6b0e70f6b91ac99d47afb726fe76aaff87ebb116/grpcio-1.75.1-cp312-cp312-manylinux2014_i686.manylinux_2_17_i686.whl", hash = "sha256:4b7177a1cdb3c51b02b0c0a256b0a72fdab719600a693e0e9037949efffb200b", size = 6916309, upload-time = "2025-09-26T09:02:02.894Z" },
-    { url = "https://files.pythonhosted.org/packages/1e/9c/eda9fe57f2b84343d44c1b66cf3831c973ba29b078b16a27d4587a1fdd47/grpcio-1.75.1-cp312-cp312-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:7d4fa6ccc3ec2e68a04f7b883d354d7fea22a34c44ce535a2f0c0049cf626ddf", size = 6435419, upload-time = "2025-09-26T09:02:05.055Z" },
-    { url = "https://files.pythonhosted.org/packages/c3/b8/090c98983e0a9d602e3f919a6e2d4e470a8b489452905f9a0fa472cac059/grpcio-1.75.1-cp312-cp312-musllinux_1_2_aarch64.whl", hash = "sha256:3d86880ecaeb5b2f0a8afa63824de93adb8ebe4e49d0e51442532f4e08add7d6", size = 7064893, upload-time = "2025-09-26T09:02:07.275Z" },
-    { url = "https://files.pythonhosted.org/packages/ec/c0/6d53d4dbbd00f8bd81571f5478d8a95528b716e0eddb4217cc7cb45aae5f/grpcio-1.75.1-cp312-cp312-musllinux_1_2_i686.whl", hash = "sha256:a8041d2f9e8a742aeae96f4b047ee44e73619f4f9d24565e84d5446c623673b6", size = 8011922, upload-time = "2025-09-26T09:02:09.527Z" },
-    { url = "https://files.pythonhosted.org/packages/f2/7c/48455b2d0c5949678d6982c3e31ea4d89df4e16131b03f7d5c590811cbe9/grpcio-1.75.1-cp312-cp312-musllinux_1_2_x86_64.whl", hash = "sha256:3652516048bf4c314ce12be37423c79829f46efffb390ad64149a10c6071e8de", size = 7466181, upload-time = "2025-09-26T09:02:12.279Z" },
-    { url = "https://files.pythonhosted.org/packages/fd/12/04a0e79081e3170b6124f8cba9b6275871276be06c156ef981033f691880/grpcio-1.75.1-cp312-cp312-win32.whl", hash = "sha256:44b62345d8403975513af88da2f3d5cc76f73ca538ba46596f92a127c2aea945", size = 3938543, upload-time = "2025-09-26T09:02:14.77Z" },
-    { url = "https://files.pythonhosted.org/packages/5f/d7/11350d9d7fb5adc73d2b0ebf6ac1cc70135577701e607407fe6739a90021/grpcio-1.75.1-cp312-cp312-win_amd64.whl", hash = "sha256:b1e191c5c465fa777d4cafbaacf0c01e0d5278022082c0abbd2ee1d6454ed94d", size = 4641938, upload-time = "2025-09-26T09:02:16.927Z" },
-    { url = "https://files.pythonhosted.org/packages/46/74/bac4ab9f7722164afdf263ae31ba97b8174c667153510322a5eba4194c32/grpcio-1.75.1-cp313-cp313-linux_armv7l.whl", hash = "sha256:3bed22e750d91d53d9e31e0af35a7b0b51367e974e14a4ff229db5b207647884", size = 5672779, upload-time = "2025-09-26T09:02:19.11Z" },
-    { url = "https://files.pythonhosted.org/packages/a6/52/d0483cfa667cddaa294e3ab88fd2c2a6e9dc1a1928c0e5911e2e54bd5b50/grpcio-1.75.1-cp313-cp313-macosx_11_0_universal2.whl", hash = "sha256:5b8f381eadcd6ecaa143a21e9e80a26424c76a0a9b3d546febe6648f3a36a5ac", size = 11470623, upload-time = "2025-09-26T09:02:22.117Z" },
-    { url = "https://files.pythonhosted.org/packages/cf/e4/d1954dce2972e32384db6a30273275e8c8ea5a44b80347f9055589333b3f/grpcio-1.75.1-cp313-cp313-manylinux2014_aarch64.manylinux_2_17_aarch64.whl", hash = "sha256:5bf4001d3293e3414d0cf99ff9b1139106e57c3a66dfff0c5f60b2a6286ec133", size = 6248838, upload-time = "2025-09-26T09:02:26.426Z" },
-    { url = "https://files.pythonhosted.org/packages/06/43/073363bf63826ba8077c335d797a8d026f129dc0912b69c42feaf8f0cd26/grpcio-1.75.1-cp313-cp313-manylinux2014_i686.manylinux_2_17_i686.whl", hash = "sha256:9f82ff474103e26351dacfe8d50214e7c9322960d8d07ba7fa1d05ff981c8b2d", size = 6922663, upload-time = "2025-09-26T09:02:28.724Z" },
-    { url = "https://files.pythonhosted.org/packages/c2/6f/076ac0df6c359117676cacfa8a377e2abcecec6a6599a15a672d331f6680/grpcio-1.75.1-cp313-cp313-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:0ee119f4f88d9f75414217823d21d75bfe0e6ed40135b0cbbfc6376bc9f7757d", size = 6436149, upload-time = "2025-09-26T09:02:30.971Z" },
-    { url = "https://files.pythonhosted.org/packages/6b/27/1d08824f1d573fcb1fa35ede40d6020e68a04391709939e1c6f4193b445f/grpcio-1.75.1-cp313-cp313-musllinux_1_2_aarch64.whl", hash = "sha256:664eecc3abe6d916fa6cf8dd6b778e62fb264a70f3430a3180995bf2da935446", size = 7067989, upload-time = "2025-09-26T09:02:33.233Z" },
-    { url = "https://files.pythonhosted.org/packages/c6/98/98594cf97b8713feb06a8cb04eeef60b4757e3e2fb91aa0d9161da769843/grpcio-1.75.1-cp313-cp313-musllinux_1_2_i686.whl", hash = "sha256:c32193fa08b2fbebf08fe08e84f8a0aad32d87c3ad42999c65e9449871b1c66e", size = 8010717, upload-time = "2025-09-26T09:02:36.011Z" },
-    { url = "https://files.pythonhosted.org/packages/8c/7e/bb80b1bba03c12158f9254762cdf5cced4a9bc2e8ed51ed335915a5a06ef/grpcio-1.75.1-cp313-cp313-musllinux_1_2_x86_64.whl", hash = "sha256:5cebe13088b9254f6e615bcf1da9131d46cfa4e88039454aca9cb65f639bd3bc", size = 7463822, upload-time = "2025-09-26T09:02:38.26Z" },
-    { url = "https://files.pythonhosted.org/packages/23/1c/1ea57fdc06927eb5640f6750c697f596f26183573069189eeaf6ef86ba2d/grpcio-1.75.1-cp313-cp313-win32.whl", hash = "sha256:4b4c678e7ed50f8ae8b8dbad15a865ee73ce12668b6aaf411bf3258b5bc3f970", size = 3938490, upload-time = "2025-09-26T09:02:40.268Z" },
-    { url = "https://files.pythonhosted.org/packages/4b/24/fbb8ff1ccadfbf78ad2401c41aceaf02b0d782c084530d8871ddd69a2d49/grpcio-1.75.1-cp313-cp313-win_amd64.whl", hash = "sha256:5573f51e3f296a1bcf71e7a690c092845fb223072120f4bdb7a5b48e111def66", size = 4642538, upload-time = "2025-09-26T09:02:42.519Z" },
     { url = "https://files.pythonhosted.org/packages/f2/1b/9a0a5cecd24302b9fdbcd55d15ed6267e5f3d5b898ff9ac8cbe17ee76129/grpcio-1.75.1-cp314-cp314-linux_armv7l.whl", hash = "sha256:c05da79068dd96723793bffc8d0e64c45f316248417515f28d22204d9dae51c7", size = 5673319, upload-time = "2025-09-26T09:02:44.742Z" },
     { url = "https://files.pythonhosted.org/packages/c6/ec/9d6959429a83fbf5df8549c591a8a52bb313976f6646b79852c4884e3225/grpcio-1.75.1-cp314-cp314-macosx_11_0_universal2.whl", hash = "sha256:06373a94fd16ec287116a825161dca179a0402d0c60674ceeec8c9fba344fe66", size = 11480347, upload-time = "2025-09-26T09:02:47.539Z" },
     { url = "https://files.pythonhosted.org/packages/09/7a/26da709e42c4565c3d7bf999a9569da96243ce34a8271a968dee810a7cf1/grpcio-1.75.1-cp314-cp314-manylinux2014_aarch64.manylinux_2_17_aarch64.whl", hash = "sha256:4484f4b7287bdaa7a5b3980f3c7224c3c622669405d20f69549f5fb956ad0421", size = 6254706, upload-time = "2025-09-26T09:02:50.4Z" },
@@ -809,53 +620,6 @@ dependencies = [
 ]
 sdist = { url = "https://files.pythonhosted.org/packages/df/18/d0944e8eaaa3efd0a91b0f1fc537d3be55ad35091b6a87638211ba691964/pydantic_core-2.41.4.tar.gz", hash = "sha256:70e47929a9d4a1905a67e4b687d5946026390568a8e952b92824118063cee4d5", size = 457557, upload-time = "2025-10-14T10:23:47.909Z" }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/62/4c/f6cbfa1e8efacd00b846764e8484fe173d25b8dab881e277a619177f3384/pydantic_core-2.41.4-cp311-cp311-macosx_10_12_x86_64.whl", hash = "sha256:28ff11666443a1a8cf2a044d6a545ebffa8382b5f7973f22c36109205e65dc80", size = 2109062, upload-time = "2025-10-14T10:20:04.486Z" },
-    { url = "https://files.pythonhosted.org/packages/21/f8/40b72d3868896bfcd410e1bd7e516e762d326201c48e5b4a06446f6cf9e8/pydantic_core-2.41.4-cp311-cp311-macosx_11_0_arm64.whl", hash = "sha256:61760c3925d4633290292bad462e0f737b840508b4f722247d8729684f6539ae", size = 1916301, upload-time = "2025-10-14T10:20:06.857Z" },
-    { url = "https://files.pythonhosted.org/packages/94/4d/d203dce8bee7faeca791671c88519969d98d3b4e8f225da5b96dad226fc8/pydantic_core-2.41.4-cp311-cp311-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:eae547b7315d055b0de2ec3965643b0ab82ad0106a7ffd29615ee9f266a02827", size = 1968728, upload-time = "2025-10-14T10:20:08.353Z" },
-    { url = "https://files.pythonhosted.org/packages/65/f5/6a66187775df87c24d526985b3a5d78d861580ca466fbd9d4d0e792fcf6c/pydantic_core-2.41.4-cp311-cp311-manylinux_2_17_armv7l.manylinux2014_armv7l.whl", hash = "sha256:ef9ee5471edd58d1fcce1c80ffc8783a650e3e3a193fe90d52e43bb4d87bff1f", size = 2050238, upload-time = "2025-10-14T10:20:09.766Z" },
-    { url = "https://files.pythonhosted.org/packages/5e/b9/78336345de97298cf53236b2f271912ce11f32c1e59de25a374ce12f9cce/pydantic_core-2.41.4-cp311-cp311-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:15dd504af121caaf2c95cb90c0ebf71603c53de98305621b94da0f967e572def", size = 2249424, upload-time = "2025-10-14T10:20:11.732Z" },
-    { url = "https://files.pythonhosted.org/packages/99/bb/a4584888b70ee594c3d374a71af5075a68654d6c780369df269118af7402/pydantic_core-2.41.4-cp311-cp311-manylinux_2_17_s390x.manylinux2014_s390x.whl", hash = "sha256:3a926768ea49a8af4d36abd6a8968b8790f7f76dd7cbd5a4c180db2b4ac9a3a2", size = 2366047, upload-time = "2025-10-14T10:20:13.647Z" },
-    { url = "https://files.pythonhosted.org/packages/5f/8d/17fc5de9d6418e4d2ae8c675f905cdafdc59d3bf3bf9c946b7ab796a992a/pydantic_core-2.41.4-cp311-cp311-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:6916b9b7d134bff5440098a4deb80e4cb623e68974a87883299de9124126c2a8", size = 2071163, upload-time = "2025-10-14T10:20:15.307Z" },
-    { url = "https://files.pythonhosted.org/packages/54/e7/03d2c5c0b8ed37a4617430db68ec5e7dbba66358b629cd69e11b4d564367/pydantic_core-2.41.4-cp311-cp311-manylinux_2_5_i686.manylinux1_i686.whl", hash = "sha256:5cf90535979089df02e6f17ffd076f07237efa55b7343d98760bde8743c4b265", size = 2190585, upload-time = "2025-10-14T10:20:17.3Z" },
-    { url = "https://files.pythonhosted.org/packages/be/fc/15d1c9fe5ad9266a5897d9b932b7f53d7e5cfc800573917a2c5d6eea56ec/pydantic_core-2.41.4-cp311-cp311-musllinux_1_1_aarch64.whl", hash = "sha256:7533c76fa647fade2d7ec75ac5cc079ab3f34879626dae5689b27790a6cf5a5c", size = 2150109, upload-time = "2025-10-14T10:20:19.143Z" },
-    { url = "https://files.pythonhosted.org/packages/26/ef/e735dd008808226c83ba56972566138665b71477ad580fa5a21f0851df48/pydantic_core-2.41.4-cp311-cp311-musllinux_1_1_armv7l.whl", hash = "sha256:37e516bca9264cbf29612539801ca3cd5d1be465f940417b002905e6ed79d38a", size = 2315078, upload-time = "2025-10-14T10:20:20.742Z" },
-    { url = "https://files.pythonhosted.org/packages/90/00/806efdcf35ff2ac0f938362350cd9827b8afb116cc814b6b75cf23738c7c/pydantic_core-2.41.4-cp311-cp311-musllinux_1_1_x86_64.whl", hash = "sha256:0c19cb355224037c83642429b8ce261ae108e1c5fbf5c028bac63c77b0f8646e", size = 2318737, upload-time = "2025-10-14T10:20:22.306Z" },
-    { url = "https://files.pythonhosted.org/packages/41/7e/6ac90673fe6cb36621a2283552897838c020db343fa86e513d3f563b196f/pydantic_core-2.41.4-cp311-cp311-win32.whl", hash = "sha256:09c2a60e55b357284b5f31f5ab275ba9f7f70b7525e18a132ec1f9160b4f1f03", size = 1974160, upload-time = "2025-10-14T10:20:23.817Z" },
-    { url = "https://files.pythonhosted.org/packages/e0/9d/7c5e24ee585c1f8b6356e1d11d40ab807ffde44d2db3b7dfd6d20b09720e/pydantic_core-2.41.4-cp311-cp311-win_amd64.whl", hash = "sha256:711156b6afb5cb1cb7c14a2cc2c4a8b4c717b69046f13c6b332d8a0a8f41ca3e", size = 2021883, upload-time = "2025-10-14T10:20:25.48Z" },
-    { url = "https://files.pythonhosted.org/packages/33/90/5c172357460fc28b2871eb4a0fb3843b136b429c6fa827e4b588877bf115/pydantic_core-2.41.4-cp311-cp311-win_arm64.whl", hash = "sha256:6cb9cf7e761f4f8a8589a45e49ed3c0d92d1d696a45a6feaee8c904b26efc2db", size = 1968026, upload-time = "2025-10-14T10:20:27.039Z" },
-    { url = "https://files.pythonhosted.org/packages/e9/81/d3b3e95929c4369d30b2a66a91db63c8ed0a98381ae55a45da2cd1cc1288/pydantic_core-2.41.4-cp312-cp312-macosx_10_12_x86_64.whl", hash = "sha256:ab06d77e053d660a6faaf04894446df7b0a7e7aba70c2797465a0a1af00fc887", size = 2099043, upload-time = "2025-10-14T10:20:28.561Z" },
-    { url = "https://files.pythonhosted.org/packages/58/da/46fdac49e6717e3a94fc9201403e08d9d61aa7a770fab6190b8740749047/pydantic_core-2.41.4-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:c53ff33e603a9c1179a9364b0a24694f183717b2e0da2b5ad43c316c956901b2", size = 1910699, upload-time = "2025-10-14T10:20:30.217Z" },
-    { url = "https://files.pythonhosted.org/packages/1e/63/4d948f1b9dd8e991a5a98b77dd66c74641f5f2e5225fee37994b2e07d391/pydantic_core-2.41.4-cp312-cp312-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:304c54176af2c143bd181d82e77c15c41cbacea8872a2225dd37e6544dce9999", size = 1952121, upload-time = "2025-10-14T10:20:32.246Z" },
-    { url = "https://files.pythonhosted.org/packages/b2/a7/e5fc60a6f781fc634ecaa9ecc3c20171d238794cef69ae0af79ac11b89d7/pydantic_core-2.41.4-cp312-cp312-manylinux_2_17_armv7l.manylinux2014_armv7l.whl", hash = "sha256:025ba34a4cf4fb32f917d5d188ab5e702223d3ba603be4d8aca2f82bede432a4", size = 2041590, upload-time = "2025-10-14T10:20:34.332Z" },
-    { url = "https://files.pythonhosted.org/packages/70/69/dce747b1d21d59e85af433428978a1893c6f8a7068fa2bb4a927fba7a5ff/pydantic_core-2.41.4-cp312-cp312-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:b9f5f30c402ed58f90c70e12eff65547d3ab74685ffe8283c719e6bead8ef53f", size = 2219869, upload-time = "2025-10-14T10:20:35.965Z" },
-    { url = "https://files.pythonhosted.org/packages/83/6a/c070e30e295403bf29c4df1cb781317b6a9bac7cd07b8d3acc94d501a63c/pydantic_core-2.41.4-cp312-cp312-manylinux_2_17_s390x.manylinux2014_s390x.whl", hash = "sha256:dd96e5d15385d301733113bcaa324c8bcf111275b7675a9c6e88bfb19fc05e3b", size = 2345169, upload-time = "2025-10-14T10:20:37.627Z" },
-    { url = "https://files.pythonhosted.org/packages/f0/83/06d001f8043c336baea7fd202a9ac7ad71f87e1c55d8112c50b745c40324/pydantic_core-2.41.4-cp312-cp312-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:98f348cbb44fae6e9653c1055db7e29de67ea6a9ca03a5fa2c2e11a47cff0e47", size = 2070165, upload-time = "2025-10-14T10:20:39.246Z" },
-    { url = "https://files.pythonhosted.org/packages/14/0a/e567c2883588dd12bcbc110232d892cf385356f7c8a9910311ac997ab715/pydantic_core-2.41.4-cp312-cp312-manylinux_2_5_i686.manylinux1_i686.whl", hash = "sha256:ec22626a2d14620a83ca583c6f5a4080fa3155282718b6055c2ea48d3ef35970", size = 2189067, upload-time = "2025-10-14T10:20:41.015Z" },
-    { url = "https://files.pythonhosted.org/packages/f4/1d/3d9fca34273ba03c9b1c5289f7618bc4bd09c3ad2289b5420481aa051a99/pydantic_core-2.41.4-cp312-cp312-musllinux_1_1_aarch64.whl", hash = "sha256:3a95d4590b1f1a43bf33ca6d647b990a88f4a3824a8c4572c708f0b45a5290ed", size = 2132997, upload-time = "2025-10-14T10:20:43.106Z" },
-    { url = "https://files.pythonhosted.org/packages/52/70/d702ef7a6cd41a8afc61f3554922b3ed8d19dd54c3bd4bdbfe332e610827/pydantic_core-2.41.4-cp312-cp312-musllinux_1_1_armv7l.whl", hash = "sha256:f9672ab4d398e1b602feadcffcdd3af44d5f5e6ddc15bc7d15d376d47e8e19f8", size = 2307187, upload-time = "2025-10-14T10:20:44.849Z" },
-    { url = "https://files.pythonhosted.org/packages/68/4c/c06be6e27545d08b802127914156f38d10ca287a9e8489342793de8aae3c/pydantic_core-2.41.4-cp312-cp312-musllinux_1_1_x86_64.whl", hash = "sha256:84d8854db5f55fead3b579f04bda9a36461dab0730c5d570e1526483e7bb8431", size = 2305204, upload-time = "2025-10-14T10:20:46.781Z" },
-    { url = "https://files.pythonhosted.org/packages/b0/e5/35ae4919bcd9f18603419e23c5eaf32750224a89d41a8df1a3704b69f77e/pydantic_core-2.41.4-cp312-cp312-win32.whl", hash = "sha256:9be1c01adb2ecc4e464392c36d17f97e9110fbbc906bcbe1c943b5b87a74aabd", size = 1972536, upload-time = "2025-10-14T10:20:48.39Z" },
-    { url = "https://files.pythonhosted.org/packages/1e/c2/49c5bb6d2a49eb2ee3647a93e3dae7080c6409a8a7558b075027644e879c/pydantic_core-2.41.4-cp312-cp312-win_amd64.whl", hash = "sha256:d682cf1d22bab22a5be08539dca3d1593488a99998f9f412137bc323179067ff", size = 2031132, upload-time = "2025-10-14T10:20:50.421Z" },
-    { url = "https://files.pythonhosted.org/packages/06/23/936343dbcba6eec93f73e95eb346810fc732f71ba27967b287b66f7b7097/pydantic_core-2.41.4-cp312-cp312-win_arm64.whl", hash = "sha256:833eebfd75a26d17470b58768c1834dfc90141b7afc6eb0429c21fc5a21dcfb8", size = 1969483, upload-time = "2025-10-14T10:20:52.35Z" },
-    { url = "https://files.pythonhosted.org/packages/13/d0/c20adabd181a029a970738dfe23710b52a31f1258f591874fcdec7359845/pydantic_core-2.41.4-cp313-cp313-macosx_10_12_x86_64.whl", hash = "sha256:85e050ad9e5f6fe1004eec65c914332e52f429bc0ae12d6fa2092407a462c746", size = 2105688, upload-time = "2025-10-14T10:20:54.448Z" },
-    { url = "https://files.pythonhosted.org/packages/00/b6/0ce5c03cec5ae94cca220dfecddc453c077d71363b98a4bbdb3c0b22c783/pydantic_core-2.41.4-cp313-cp313-macosx_11_0_arm64.whl", hash = "sha256:e7393f1d64792763a48924ba31d1e44c2cfbc05e3b1c2c9abb4ceeadd912cced", size = 1910807, upload-time = "2025-10-14T10:20:56.115Z" },
-    { url = "https://files.pythonhosted.org/packages/68/3e/800d3d02c8beb0b5c069c870cbb83799d085debf43499c897bb4b4aaff0d/pydantic_core-2.41.4-cp313-cp313-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:94dab0940b0d1fb28bcab847adf887c66a27a40291eedf0b473be58761c9799a", size = 1956669, upload-time = "2025-10-14T10:20:57.874Z" },
-    { url = "https://files.pythonhosted.org/packages/60/a4/24271cc71a17f64589be49ab8bd0751f6a0a03046c690df60989f2f95c2c/pydantic_core-2.41.4-cp313-cp313-manylinux_2_17_armv7l.manylinux2014_armv7l.whl", hash = "sha256:de7c42f897e689ee6f9e93c4bec72b99ae3b32a2ade1c7e4798e690ff5246e02", size = 2051629, upload-time = "2025-10-14T10:21:00.006Z" },
-    { url = "https://files.pythonhosted.org/packages/68/de/45af3ca2f175d91b96bfb62e1f2d2f1f9f3b14a734afe0bfeff079f78181/pydantic_core-2.41.4-cp313-cp313-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:664b3199193262277b8b3cd1e754fb07f2c6023289c815a1e1e8fb415cb247b1", size = 2224049, upload-time = "2025-10-14T10:21:01.801Z" },
-    { url = "https://files.pythonhosted.org/packages/af/8f/ae4e1ff84672bf869d0a77af24fd78387850e9497753c432875066b5d622/pydantic_core-2.41.4-cp313-cp313-manylinux_2_17_s390x.manylinux2014_s390x.whl", hash = "sha256:d95b253b88f7d308b1c0b417c4624f44553ba4762816f94e6986819b9c273fb2", size = 2342409, upload-time = "2025-10-14T10:21:03.556Z" },
-    { url = "https://files.pythonhosted.org/packages/18/62/273dd70b0026a085c7b74b000394e1ef95719ea579c76ea2f0cc8893736d/pydantic_core-2.41.4-cp313-cp313-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:a1351f5bbdbbabc689727cb91649a00cb9ee7203e0a6e54e9f5ba9e22e384b84", size = 2069635, upload-time = "2025-10-14T10:21:05.385Z" },
-    { url = "https://files.pythonhosted.org/packages/30/03/cf485fff699b4cdaea469bc481719d3e49f023241b4abb656f8d422189fc/pydantic_core-2.41.4-cp313-cp313-manylinux_2_5_i686.manylinux1_i686.whl", hash = "sha256:1affa4798520b148d7182da0615d648e752de4ab1a9566b7471bc803d88a062d", size = 2194284, upload-time = "2025-10-14T10:21:07.122Z" },
-    { url = "https://files.pythonhosted.org/packages/f9/7e/c8e713db32405dfd97211f2fc0a15d6bf8adb7640f3d18544c1f39526619/pydantic_core-2.41.4-cp313-cp313-musllinux_1_1_aarch64.whl", hash = "sha256:7b74e18052fea4aa8dea2fb7dbc23d15439695da6cbe6cfc1b694af1115df09d", size = 2137566, upload-time = "2025-10-14T10:21:08.981Z" },
-    { url = "https://files.pythonhosted.org/packages/04/f7/db71fd4cdccc8b75990f79ccafbbd66757e19f6d5ee724a6252414483fb4/pydantic_core-2.41.4-cp313-cp313-musllinux_1_1_armv7l.whl", hash = "sha256:285b643d75c0e30abda9dc1077395624f314a37e3c09ca402d4015ef5979f1a2", size = 2316809, upload-time = "2025-10-14T10:21:10.805Z" },
-    { url = "https://files.pythonhosted.org/packages/76/63/a54973ddb945f1bca56742b48b144d85c9fc22f819ddeb9f861c249d5464/pydantic_core-2.41.4-cp313-cp313-musllinux_1_1_x86_64.whl", hash = "sha256:f52679ff4218d713b3b33f88c89ccbf3a5c2c12ba665fb80ccc4192b4608dbab", size = 2311119, upload-time = "2025-10-14T10:21:12.583Z" },
-    { url = "https://files.pythonhosted.org/packages/f8/03/5d12891e93c19218af74843a27e32b94922195ded2386f7b55382f904d2f/pydantic_core-2.41.4-cp313-cp313-win32.whl", hash = "sha256:ecde6dedd6fff127c273c76821bb754d793be1024bc33314a120f83a3c69460c", size = 1981398, upload-time = "2025-10-14T10:21:14.584Z" },
-    { url = "https://files.pythonhosted.org/packages/be/d8/fd0de71f39db91135b7a26996160de71c073d8635edfce8b3c3681be0d6d/pydantic_core-2.41.4-cp313-cp313-win_amd64.whl", hash = "sha256:d081a1f3800f05409ed868ebb2d74ac39dd0c1ff6c035b5162356d76030736d4", size = 2030735, upload-time = "2025-10-14T10:21:16.432Z" },
-    { url = "https://files.pythonhosted.org/packages/72/86/c99921c1cf6650023c08bfab6fe2d7057a5142628ef7ccfa9921f2dda1d5/pydantic_core-2.41.4-cp313-cp313-win_arm64.whl", hash = "sha256:f8e49c9c364a7edcbe2a310f12733aad95b022495ef2a8d653f645e5d20c1564", size = 1973209, upload-time = "2025-10-14T10:21:18.213Z" },
-    { url = "https://files.pythonhosted.org/packages/36/0d/b5706cacb70a8414396efdda3d72ae0542e050b591119e458e2490baf035/pydantic_core-2.41.4-cp313-cp313t-macosx_11_0_arm64.whl", hash = "sha256:ed97fd56a561f5eb5706cebe94f1ad7c13b84d98312a05546f2ad036bafe87f4", size = 1877324, upload-time = "2025-10-14T10:21:20.363Z" },
-    { url = "https://files.pythonhosted.org/packages/de/2d/cba1fa02cfdea72dfb3a9babb067c83b9dff0bbcb198368e000a6b756ea7/pydantic_core-2.41.4-cp313-cp313t-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:a870c307bf1ee91fc58a9a61338ff780d01bfae45922624816878dce784095d2", size = 1884515, upload-time = "2025-10-14T10:21:22.339Z" },
-    { url = "https://files.pythonhosted.org/packages/07/ea/3df927c4384ed9b503c9cc2d076cf983b4f2adb0c754578dfb1245c51e46/pydantic_core-2.41.4-cp313-cp313t-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:d25e97bc1f5f8f7985bdc2335ef9e73843bb561eb1fa6831fdfc295c1c2061cf", size = 2042819, upload-time = "2025-10-14T10:21:26.683Z" },
-    { url = "https://files.pythonhosted.org/packages/6a/ee/df8e871f07074250270a3b1b82aad4cd0026b588acd5d7d3eb2fcb1471a3/pydantic_core-2.41.4-cp313-cp313t-win_amd64.whl", hash = "sha256:d405d14bea042f166512add3091c1af40437c2e7f86988f3915fabd27b1e9cd2", size = 1995866, upload-time = "2025-10-14T10:21:28.951Z" },
-    { url = "https://files.pythonhosted.org/packages/fc/de/b20f4ab954d6d399499c33ec4fafc46d9551e11dc1858fb7f5dca0748ceb/pydantic_core-2.41.4-cp313-cp313t-win_arm64.whl", hash = "sha256:19f3684868309db5263a11bace3c45d93f6f24afa2ffe75a647583df22a2ff89", size = 1970034, upload-time = "2025-10-14T10:21:30.869Z" },
     { url = "https://files.pythonhosted.org/packages/54/28/d3325da57d413b9819365546eb9a6e8b7cbd9373d9380efd5f74326143e6/pydantic_core-2.41.4-cp314-cp314-macosx_10_12_x86_64.whl", hash = "sha256:e9205d97ed08a82ebb9a307e92914bb30e18cdf6f6b12ca4bedadb1588a0bfe1", size = 2102022, upload-time = "2025-10-14T10:21:32.809Z" },
     { url = "https://files.pythonhosted.org/packages/9e/24/b58a1bc0d834bf1acc4361e61233ee217169a42efbdc15a60296e13ce438/pydantic_core-2.41.4-cp314-cp314-macosx_11_0_arm64.whl", hash = "sha256:82df1f432b37d832709fbcc0e24394bba04a01b6ecf1ee87578145c19cde12ac", size = 1905495, upload-time = "2025-10-14T10:21:34.812Z" },
     { url = "https://files.pythonhosted.org/packages/fb/a4/71f759cc41b7043e8ecdaab81b985a9b6cad7cec077e0b92cff8b71ecf6b/pydantic_core-2.41.4-cp314-cp314-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:fc3b4cc4539e055cfa39a3763c939f9d409eb40e85813257dcd761985a108554", size = 1956131, upload-time = "2025-10-14T10:21:36.924Z" },
@@ -875,22 +639,6 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/1e/29/b53a9ca6cd366bfc928823679c6a76c7a4c69f8201c0ba7903ad18ebae2f/pydantic_core-2.41.4-cp314-cp314t-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:5729225de81fb65b70fdb1907fcf08c75d498f4a6f15af005aabb1fdadc19dfa", size = 2041183, upload-time = "2025-10-14T10:22:08.812Z" },
     { url = "https://files.pythonhosted.org/packages/c7/3d/f8c1a371ceebcaf94d6dd2d77c6cf4b1c078e13a5837aee83f760b4f7cfd/pydantic_core-2.41.4-cp314-cp314t-win_amd64.whl", hash = "sha256:de2cfbb09e88f0f795fd90cf955858fc2c691df65b1f21f0aa00b99f3fbc661d", size = 1993542, upload-time = "2025-10-14T10:22:11.332Z" },
     { url = "https://files.pythonhosted.org/packages/8a/ac/9fc61b4f9d079482a290afe8d206b8f490e9fd32d4fc03ed4fc698214e01/pydantic_core-2.41.4-cp314-cp314t-win_arm64.whl", hash = "sha256:d34f950ae05a83e0ede899c595f312ca976023ea1db100cd5aa188f7005e3ab0", size = 1973897, upload-time = "2025-10-14T10:22:13.444Z" },
-    { url = "https://files.pythonhosted.org/packages/b0/12/5ba58daa7f453454464f92b3ca7b9d7c657d8641c48e370c3ebc9a82dd78/pydantic_core-2.41.4-graalpy311-graalpy242_311_native-macosx_10_12_x86_64.whl", hash = "sha256:a1b2cfec3879afb742a7b0bcfa53e4f22ba96571c9e54d6a3afe1052d17d843b", size = 2122139, upload-time = "2025-10-14T10:22:47.288Z" },
-    { url = "https://files.pythonhosted.org/packages/21/fb/6860126a77725c3108baecd10fd3d75fec25191d6381b6eb2ac660228eac/pydantic_core-2.41.4-graalpy311-graalpy242_311_native-macosx_11_0_arm64.whl", hash = "sha256:d175600d975b7c244af6eb9c9041f10059f20b8bbffec9e33fdd5ee3f67cdc42", size = 1936674, upload-time = "2025-10-14T10:22:49.555Z" },
-    { url = "https://files.pythonhosted.org/packages/de/be/57dcaa3ed595d81f8757e2b44a38240ac5d37628bce25fb20d02c7018776/pydantic_core-2.41.4-graalpy311-graalpy242_311_native-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:0f184d657fa4947ae5ec9c47bd7e917730fa1cbb78195037e32dcbab50aca5ee", size = 1956398, upload-time = "2025-10-14T10:22:52.19Z" },
-    { url = "https://files.pythonhosted.org/packages/2f/1d/679a344fadb9695f1a6a294d739fbd21d71fa023286daeea8c0ed49e7c2b/pydantic_core-2.41.4-graalpy311-graalpy242_311_native-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:1ed810568aeffed3edc78910af32af911c835cc39ebbfacd1f0ab5dd53028e5c", size = 2138674, upload-time = "2025-10-14T10:22:54.499Z" },
-    { url = "https://files.pythonhosted.org/packages/c4/48/ae937e5a831b7c0dc646b2ef788c27cd003894882415300ed21927c21efa/pydantic_core-2.41.4-graalpy312-graalpy250_312_native-macosx_10_12_x86_64.whl", hash = "sha256:4f5d640aeebb438517150fdeec097739614421900e4a08db4a3ef38898798537", size = 2112087, upload-time = "2025-10-14T10:22:56.818Z" },
-    { url = "https://files.pythonhosted.org/packages/5e/db/6db8073e3d32dae017da7e0d16a9ecb897d0a4d92e00634916e486097961/pydantic_core-2.41.4-graalpy312-graalpy250_312_native-macosx_11_0_arm64.whl", hash = "sha256:4a9ab037b71927babc6d9e7fc01aea9e66dc2a4a34dff06ef0724a4049629f94", size = 1920387, upload-time = "2025-10-14T10:22:59.342Z" },
-    { url = "https://files.pythonhosted.org/packages/0d/c1/dd3542d072fcc336030d66834872f0328727e3b8de289c662faa04aa270e/pydantic_core-2.41.4-graalpy312-graalpy250_312_native-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:e4dab9484ec605c3016df9ad4fd4f9a390bc5d816a3b10c6550f8424bb80b18c", size = 1951495, upload-time = "2025-10-14T10:23:02.089Z" },
-    { url = "https://files.pythonhosted.org/packages/2b/c6/db8d13a1f8ab3f1eb08c88bd00fd62d44311e3456d1e85c0e59e0a0376e7/pydantic_core-2.41.4-graalpy312-graalpy250_312_native-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:bd8a5028425820731d8c6c098ab642d7b8b999758e24acae03ed38a66eca8335", size = 2139008, upload-time = "2025-10-14T10:23:04.539Z" },
-    { url = "https://files.pythonhosted.org/packages/7e/7d/138e902ed6399b866f7cfe4435d22445e16fff888a1c00560d9dc79a780f/pydantic_core-2.41.4-pp311-pypy311_pp73-macosx_10_12_x86_64.whl", hash = "sha256:491535d45cd7ad7e4a2af4a5169b0d07bebf1adfd164b0368da8aa41e19907a5", size = 2104721, upload-time = "2025-10-14T10:23:26.906Z" },
-    { url = "https://files.pythonhosted.org/packages/47/13/0525623cf94627f7b53b4c2034c81edc8491cbfc7c28d5447fa318791479/pydantic_core-2.41.4-pp311-pypy311_pp73-macosx_11_0_arm64.whl", hash = "sha256:54d86c0cada6aba4ec4c047d0e348cbad7063b87ae0f005d9f8c9ad04d4a92a2", size = 1931608, upload-time = "2025-10-14T10:23:29.306Z" },
-    { url = "https://files.pythonhosted.org/packages/d6/f9/744bc98137d6ef0a233f808bfc9b18cf94624bf30836a18d3b05d08bf418/pydantic_core-2.41.4-pp311-pypy311_pp73-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:eca1124aced216b2500dc2609eade086d718e8249cb9696660ab447d50a758bd", size = 2132986, upload-time = "2025-10-14T10:23:32.057Z" },
-    { url = "https://files.pythonhosted.org/packages/17/c8/629e88920171173f6049386cc71f893dff03209a9ef32b4d2f7e7c264bcf/pydantic_core-2.41.4-pp311-pypy311_pp73-manylinux_2_5_i686.manylinux1_i686.whl", hash = "sha256:6c9024169becccf0cb470ada03ee578d7348c119a0d42af3dcf9eda96e3a247c", size = 2187516, upload-time = "2025-10-14T10:23:34.871Z" },
-    { url = "https://files.pythonhosted.org/packages/2e/0f/4f2734688d98488782218ca61bcc118329bf5de05bb7fe3adc7dd79b0b86/pydantic_core-2.41.4-pp311-pypy311_pp73-musllinux_1_1_aarch64.whl", hash = "sha256:26895a4268ae5a2849269f4991cdc97236e4b9c010e51137becf25182daac405", size = 2146146, upload-time = "2025-10-14T10:23:37.342Z" },
-    { url = "https://files.pythonhosted.org/packages/ed/f2/ab385dbd94a052c62224b99cf99002eee99dbec40e10006c78575aead256/pydantic_core-2.41.4-pp311-pypy311_pp73-musllinux_1_1_armv7l.whl", hash = "sha256:ca4df25762cf71308c446e33c9b1fdca2923a3f13de616e2a949f38bf21ff5a8", size = 2311296, upload-time = "2025-10-14T10:23:40.145Z" },
-    { url = "https://files.pythonhosted.org/packages/fc/8e/e4f12afe1beeb9823bba5375f8f258df0cc61b056b0195fb1cf9f62a1a58/pydantic_core-2.41.4-pp311-pypy311_pp73-musllinux_1_1_x86_64.whl", hash = "sha256:5a28fcedd762349519276c36634e71853b4541079cab4acaaac60c4421827308", size = 2315386, upload-time = "2025-10-14T10:23:42.624Z" },
-    { url = "https://files.pythonhosted.org/packages/48/f7/925f65d930802e3ea2eb4d5afa4cb8730c8dc0d2cb89a59dc4ed2fcb2d74/pydantic_core-2.41.4-pp311-pypy311_pp73-win_amd64.whl", hash = "sha256:c173ddcd86afd2535e2b695217e82191580663a1d1928239f877f5a1649ef39f", size = 2147775, upload-time = "2025-10-14T10:23:45.406Z" },
 ]
 
 [[package]]
@@ -937,7 +685,7 @@ name = "pytest-cov"
 version = "7.0.0"
 source = { registry = "https://pypi.org/simple" }
 dependencies = [
-    { name = "coverage", extra = ["toml"] },
+    { name = "coverage" },
     { name = "pluggy" },
     { name = "pytest" },
 ]
@@ -985,35 +733,6 @@ version = "6.0.3"
 source = { registry = "https://pypi.org/simple" }
 sdist = { url = "https://files.pythonhosted.org/packages/05/8e/961c0007c59b8dd7729d542c61a4d537767a59645b82a0b521206e1e25c2/pyyaml-6.0.3.tar.gz", hash = "sha256:d76623373421df22fb4cf8817020cbb7ef15c725b9d5e45f17e189bfc384190f", size = 130960, upload-time = "2025-09-25T21:33:16.546Z" }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/6d/16/a95b6757765b7b031c9374925bb718d55e0a9ba8a1b6a12d25962ea44347/pyyaml-6.0.3-cp311-cp311-macosx_10_13_x86_64.whl", hash = "sha256:44edc647873928551a01e7a563d7452ccdebee747728c1080d881d68af7b997e", size = 185826, upload-time = "2025-09-25T21:31:58.655Z" },
-    { url = "https://files.pythonhosted.org/packages/16/19/13de8e4377ed53079ee996e1ab0a9c33ec2faf808a4647b7b4c0d46dd239/pyyaml-6.0.3-cp311-cp311-macosx_11_0_arm64.whl", hash = "sha256:652cb6edd41e718550aad172851962662ff2681490a8a711af6a4d288dd96824", size = 175577, upload-time = "2025-09-25T21:32:00.088Z" },
-    { url = "https://files.pythonhosted.org/packages/0c/62/d2eb46264d4b157dae1275b573017abec435397aa59cbcdab6fc978a8af4/pyyaml-6.0.3-cp311-cp311-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:10892704fc220243f5305762e276552a0395f7beb4dbf9b14ec8fd43b57f126c", size = 775556, upload-time = "2025-09-25T21:32:01.31Z" },
-    { url = "https://files.pythonhosted.org/packages/10/cb/16c3f2cf3266edd25aaa00d6c4350381c8b012ed6f5276675b9eba8d9ff4/pyyaml-6.0.3-cp311-cp311-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:850774a7879607d3a6f50d36d04f00ee69e7fc816450e5f7e58d7f17f1ae5c00", size = 882114, upload-time = "2025-09-25T21:32:03.376Z" },
-    { url = "https://files.pythonhosted.org/packages/71/60/917329f640924b18ff085ab889a11c763e0b573da888e8404ff486657602/pyyaml-6.0.3-cp311-cp311-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:b8bb0864c5a28024fac8a632c443c87c5aa6f215c0b126c449ae1a150412f31d", size = 806638, upload-time = "2025-09-25T21:32:04.553Z" },
-    { url = "https://files.pythonhosted.org/packages/dd/6f/529b0f316a9fd167281a6c3826b5583e6192dba792dd55e3203d3f8e655a/pyyaml-6.0.3-cp311-cp311-musllinux_1_2_aarch64.whl", hash = "sha256:1d37d57ad971609cf3c53ba6a7e365e40660e3be0e5175fa9f2365a379d6095a", size = 767463, upload-time = "2025-09-25T21:32:06.152Z" },
-    { url = "https://files.pythonhosted.org/packages/f2/6a/b627b4e0c1dd03718543519ffb2f1deea4a1e6d42fbab8021936a4d22589/pyyaml-6.0.3-cp311-cp311-musllinux_1_2_x86_64.whl", hash = "sha256:37503bfbfc9d2c40b344d06b2199cf0e96e97957ab1c1b546fd4f87e53e5d3e4", size = 794986, upload-time = "2025-09-25T21:32:07.367Z" },
-    { url = "https://files.pythonhosted.org/packages/45/91/47a6e1c42d9ee337c4839208f30d9f09caa9f720ec7582917b264defc875/pyyaml-6.0.3-cp311-cp311-win32.whl", hash = "sha256:8098f252adfa6c80ab48096053f512f2321f0b998f98150cea9bd23d83e1467b", size = 142543, upload-time = "2025-09-25T21:32:08.95Z" },
-    { url = "https://files.pythonhosted.org/packages/da/e3/ea007450a105ae919a72393cb06f122f288ef60bba2dc64b26e2646fa315/pyyaml-6.0.3-cp311-cp311-win_amd64.whl", hash = "sha256:9f3bfb4965eb874431221a3ff3fdcddc7e74e3b07799e0e84ca4a0f867d449bf", size = 158763, upload-time = "2025-09-25T21:32:09.96Z" },
-    { url = "https://files.pythonhosted.org/packages/d1/33/422b98d2195232ca1826284a76852ad5a86fe23e31b009c9886b2d0fb8b2/pyyaml-6.0.3-cp312-cp312-macosx_10_13_x86_64.whl", hash = "sha256:7f047e29dcae44602496db43be01ad42fc6f1cc0d8cd6c83d342306c32270196", size = 182063, upload-time = "2025-09-25T21:32:11.445Z" },
-    { url = "https://files.pythonhosted.org/packages/89/a0/6cf41a19a1f2f3feab0e9c0b74134aa2ce6849093d5517a0c550fe37a648/pyyaml-6.0.3-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:fc09d0aa354569bc501d4e787133afc08552722d3ab34836a80547331bb5d4a0", size = 173973, upload-time = "2025-09-25T21:32:12.492Z" },
-    { url = "https://files.pythonhosted.org/packages/ed/23/7a778b6bd0b9a8039df8b1b1d80e2e2ad78aa04171592c8a5c43a56a6af4/pyyaml-6.0.3-cp312-cp312-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:9149cad251584d5fb4981be1ecde53a1ca46c891a79788c0df828d2f166bda28", size = 775116, upload-time = "2025-09-25T21:32:13.652Z" },
-    { url = "https://files.pythonhosted.org/packages/65/30/d7353c338e12baef4ecc1b09e877c1970bd3382789c159b4f89d6a70dc09/pyyaml-6.0.3-cp312-cp312-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:5fdec68f91a0c6739b380c83b951e2c72ac0197ace422360e6d5a959d8d97b2c", size = 844011, upload-time = "2025-09-25T21:32:15.21Z" },
-    { url = "https://files.pythonhosted.org/packages/8b/9d/b3589d3877982d4f2329302ef98a8026e7f4443c765c46cfecc8858c6b4b/pyyaml-6.0.3-cp312-cp312-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:ba1cc08a7ccde2d2ec775841541641e4548226580ab850948cbfda66a1befcdc", size = 807870, upload-time = "2025-09-25T21:32:16.431Z" },
-    { url = "https://files.pythonhosted.org/packages/05/c0/b3be26a015601b822b97d9149ff8cb5ead58c66f981e04fedf4e762f4bd4/pyyaml-6.0.3-cp312-cp312-musllinux_1_2_aarch64.whl", hash = "sha256:8dc52c23056b9ddd46818a57b78404882310fb473d63f17b07d5c40421e47f8e", size = 761089, upload-time = "2025-09-25T21:32:17.56Z" },
-    { url = "https://files.pythonhosted.org/packages/be/8e/98435a21d1d4b46590d5459a22d88128103f8da4c2d4cb8f14f2a96504e1/pyyaml-6.0.3-cp312-cp312-musllinux_1_2_x86_64.whl", hash = "sha256:41715c910c881bc081f1e8872880d3c650acf13dfa8214bad49ed4cede7c34ea", size = 790181, upload-time = "2025-09-25T21:32:18.834Z" },
-    { url = "https://files.pythonhosted.org/packages/74/93/7baea19427dcfbe1e5a372d81473250b379f04b1bd3c4c5ff825e2327202/pyyaml-6.0.3-cp312-cp312-win32.whl", hash = "sha256:96b533f0e99f6579b3d4d4995707cf36df9100d67e0c8303a0c55b27b5f99bc5", size = 137658, upload-time = "2025-09-25T21:32:20.209Z" },
-    { url = "https://files.pythonhosted.org/packages/86/bf/899e81e4cce32febab4fb42bb97dcdf66bc135272882d1987881a4b519e9/pyyaml-6.0.3-cp312-cp312-win_amd64.whl", hash = "sha256:5fcd34e47f6e0b794d17de1b4ff496c00986e1c83f7ab2fb8fcfe9616ff7477b", size = 154003, upload-time = "2025-09-25T21:32:21.167Z" },
-    { url = "https://files.pythonhosted.org/packages/1a/08/67bd04656199bbb51dbed1439b7f27601dfb576fb864099c7ef0c3e55531/pyyaml-6.0.3-cp312-cp312-win_arm64.whl", hash = "sha256:64386e5e707d03a7e172c0701abfb7e10f0fb753ee1d773128192742712a98fd", size = 140344, upload-time = "2025-09-25T21:32:22.617Z" },
-    { url = "https://files.pythonhosted.org/packages/d1/11/0fd08f8192109f7169db964b5707a2f1e8b745d4e239b784a5a1dd80d1db/pyyaml-6.0.3-cp313-cp313-macosx_10_13_x86_64.whl", hash = "sha256:8da9669d359f02c0b91ccc01cac4a67f16afec0dac22c2ad09f46bee0697eba8", size = 181669, upload-time = "2025-09-25T21:32:23.673Z" },
-    { url = "https://files.pythonhosted.org/packages/b1/16/95309993f1d3748cd644e02e38b75d50cbc0d9561d21f390a76242ce073f/pyyaml-6.0.3-cp313-cp313-macosx_11_0_arm64.whl", hash = "sha256:2283a07e2c21a2aa78d9c4442724ec1eb15f5e42a723b99cb3d822d48f5f7ad1", size = 173252, upload-time = "2025-09-25T21:32:25.149Z" },
-    { url = "https://files.pythonhosted.org/packages/50/31/b20f376d3f810b9b2371e72ef5adb33879b25edb7a6d072cb7ca0c486398/pyyaml-6.0.3-cp313-cp313-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:ee2922902c45ae8ccada2c5b501ab86c36525b883eff4255313a253a3160861c", size = 767081, upload-time = "2025-09-25T21:32:26.575Z" },
-    { url = "https://files.pythonhosted.org/packages/49/1e/a55ca81e949270d5d4432fbbd19dfea5321eda7c41a849d443dc92fd1ff7/pyyaml-6.0.3-cp313-cp313-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:a33284e20b78bd4a18c8c2282d549d10bc8408a2a7ff57653c0cf0b9be0afce5", size = 841159, upload-time = "2025-09-25T21:32:27.727Z" },
-    { url = "https://files.pythonhosted.org/packages/74/27/e5b8f34d02d9995b80abcef563ea1f8b56d20134d8f4e5e81733b1feceb2/pyyaml-6.0.3-cp313-cp313-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:0f29edc409a6392443abf94b9cf89ce99889a1dd5376d94316ae5145dfedd5d6", size = 801626, upload-time = "2025-09-25T21:32:28.878Z" },
-    { url = "https://files.pythonhosted.org/packages/f9/11/ba845c23988798f40e52ba45f34849aa8a1f2d4af4b798588010792ebad6/pyyaml-6.0.3-cp313-cp313-musllinux_1_2_aarch64.whl", hash = "sha256:f7057c9a337546edc7973c0d3ba84ddcdf0daa14533c2065749c9075001090e6", size = 753613, upload-time = "2025-09-25T21:32:30.178Z" },
-    { url = "https://files.pythonhosted.org/packages/3d/e0/7966e1a7bfc0a45bf0a7fb6b98ea03fc9b8d84fa7f2229e9659680b69ee3/pyyaml-6.0.3-cp313-cp313-musllinux_1_2_x86_64.whl", hash = "sha256:eda16858a3cab07b80edaf74336ece1f986ba330fdb8ee0d6c0d68fe82bc96be", size = 794115, upload-time = "2025-09-25T21:32:31.353Z" },
-    { url = "https://files.pythonhosted.org/packages/de/94/980b50a6531b3019e45ddeada0626d45fa85cbe22300844a7983285bed3b/pyyaml-6.0.3-cp313-cp313-win32.whl", hash = "sha256:d0eae10f8159e8fdad514efdc92d74fd8d682c933a6dd088030f3834bc8e6b26", size = 137427, upload-time = "2025-09-25T21:32:32.58Z" },
-    { url = "https://files.pythonhosted.org/packages/97/c9/39d5b874e8b28845e4ec2202b5da735d0199dbe5b8fb85f91398814a9a46/pyyaml-6.0.3-cp313-cp313-win_amd64.whl", hash = "sha256:79005a0d97d5ddabfeeea4cf676af11e647e41d81c9a7722a193022accdb6b7c", size = 154090, upload-time = "2025-09-25T21:32:33.659Z" },
-    { url = "https://files.pythonhosted.org/packages/73/e8/2bdf3ca2090f68bb3d75b44da7bbc71843b19c9f2b9cb9b0f4ab7a5a4329/pyyaml-6.0.3-cp313-cp313-win_arm64.whl", hash = "sha256:5498cd1645aa724a7c71c8f378eb29ebe23da2fc0d7a08071d89469bf1d2defb", size = 140246, upload-time = "2025-09-25T21:32:34.663Z" },
     { url = "https://files.pythonhosted.org/packages/9d/8c/f4bd7f6465179953d3ac9bc44ac1a8a3e6122cf8ada906b4f96c60172d43/pyyaml-6.0.3-cp314-cp314-macosx_10_13_x86_64.whl", hash = "sha256:8d1fab6bb153a416f9aeb4b8763bc0f22a5586065f86f7664fc23339fc1c1fac", size = 181814, upload-time = "2025-09-25T21:32:35.712Z" },
     { url = "https://files.pythonhosted.org/packages/bd/9c/4d95bb87eb2063d20db7b60faa3840c1b18025517ae857371c4dd55a6b3a/pyyaml-6.0.3-cp314-cp314-macosx_11_0_arm64.whl", hash = "sha256:34d5fcd24b8445fadc33f9cf348c1047101756fd760b4dacb5c3e99755703310", size = 173809, upload-time = "2025-09-25T21:32:36.789Z" },
     { url = "https://files.pythonhosted.org/packages/92/b5/47e807c2623074914e29dabd16cbbdd4bf5e9b2db9f8090fa64411fc5382/pyyaml-6.0.3-cp314-cp314-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:501a031947e3a9025ed4405a168e6ef5ae3126c59f90ce0cd6f2bfc477be31b7", size = 766454, upload-time = "2025-09-25T21:32:37.966Z" },
@@ -1118,55 +837,6 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/b7/ce/149a00dd41f10bc29e5921b496af8b574d8413afcd5e30dfa0ed46c2cc5e/six-1.17.0-py2.py3-none-any.whl", hash = "sha256:4721f391ed90541fddacab5acf947aa0d3dc7d27b2e1e8eda2be8970586c3274", size = 11050, upload-time = "2024-12-04T17:35:26.475Z" },
 ]
 
-[[package]]
-name = "tomli"
-version = "2.3.0"
-source = { registry = "https://pypi.org/simple" }
-sdist = { url = "https://files.pythonhosted.org/packages/52/ed/3f73f72945444548f33eba9a87fc7a6e969915e7b1acc8260b30e1f76a2f/tomli-2.3.0.tar.gz", hash = "sha256:64be704a875d2a59753d80ee8a533c3fe183e3f06807ff7dc2232938ccb01549", size = 17392, upload-time = "2025-10-08T22:01:47.119Z" }
-wheels = [
-    { url = "https://files.pythonhosted.org/packages/b3/2e/299f62b401438d5fe1624119c723f5d877acc86a4c2492da405626665f12/tomli-2.3.0-cp311-cp311-macosx_10_9_x86_64.whl", hash = "sha256:88bd15eb972f3664f5ed4b57c1634a97153b4bac4479dcb6a495f41921eb7f45", size = 153236, upload-time = "2025-10-08T22:01:00.137Z" },
-    { url = "https://files.pythonhosted.org/packages/86/7f/d8fffe6a7aefdb61bced88fcb5e280cfd71e08939da5894161bd71bea022/tomli-2.3.0-cp311-cp311-macosx_11_0_arm64.whl", hash = "sha256:883b1c0d6398a6a9d29b508c331fa56adbcdff647f6ace4dfca0f50e90dfd0ba", size = 148084, upload-time = "2025-10-08T22:01:01.63Z" },
-    { url = "https://files.pythonhosted.org/packages/47/5c/24935fb6a2ee63e86d80e4d3b58b222dafaf438c416752c8b58537c8b89a/tomli-2.3.0-cp311-cp311-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:d1381caf13ab9f300e30dd8feadb3de072aeb86f1d34a8569453ff32a7dea4bf", size = 234832, upload-time = "2025-10-08T22:01:02.543Z" },
-    { url = "https://files.pythonhosted.org/packages/89/da/75dfd804fc11e6612846758a23f13271b76d577e299592b4371a4ca4cd09/tomli-2.3.0-cp311-cp311-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:a0e285d2649b78c0d9027570d4da3425bdb49830a6156121360b3f8511ea3441", size = 242052, upload-time = "2025-10-08T22:01:03.836Z" },
-    { url = "https://files.pythonhosted.org/packages/70/8c/f48ac899f7b3ca7eb13af73bacbc93aec37f9c954df3c08ad96991c8c373/tomli-2.3.0-cp311-cp311-musllinux_1_2_aarch64.whl", hash = "sha256:0a154a9ae14bfcf5d8917a59b51ffd5a3ac1fd149b71b47a3a104ca4edcfa845", size = 239555, upload-time = "2025-10-08T22:01:04.834Z" },
-    { url = "https://files.pythonhosted.org/packages/ba/28/72f8afd73f1d0e7829bfc093f4cb98ce0a40ffc0cc997009ee1ed94ba705/tomli-2.3.0-cp311-cp311-musllinux_1_2_x86_64.whl", hash = "sha256:74bf8464ff93e413514fefd2be591c3b0b23231a77f901db1eb30d6f712fc42c", size = 245128, upload-time = "2025-10-08T22:01:05.84Z" },
-    { url = "https://files.pythonhosted.org/packages/b6/eb/a7679c8ac85208706d27436e8d421dfa39d4c914dcf5fa8083a9305f58d9/tomli-2.3.0-cp311-cp311-win32.whl", hash = "sha256:00b5f5d95bbfc7d12f91ad8c593a1659b6387b43f054104cda404be6bda62456", size = 96445, upload-time = "2025-10-08T22:01:06.896Z" },
-    { url = "https://files.pythonhosted.org/packages/0a/fe/3d3420c4cb1ad9cb462fb52967080575f15898da97e21cb6f1361d505383/tomli-2.3.0-cp311-cp311-win_amd64.whl", hash = "sha256:4dc4ce8483a5d429ab602f111a93a6ab1ed425eae3122032db7e9acf449451be", size = 107165, upload-time = "2025-10-08T22:01:08.107Z" },
-    { url = "https://files.pythonhosted.org/packages/ff/b7/40f36368fcabc518bb11c8f06379a0fd631985046c038aca08c6d6a43c6e/tomli-2.3.0-cp312-cp312-macosx_10_13_x86_64.whl", hash = "sha256:d7d86942e56ded512a594786a5ba0a5e521d02529b3826e7761a05138341a2ac", size = 154891, upload-time = "2025-10-08T22:01:09.082Z" },
-    { url = "https://files.pythonhosted.org/packages/f9/3f/d9dd692199e3b3aab2e4e4dd948abd0f790d9ded8cd10cbaae276a898434/tomli-2.3.0-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:73ee0b47d4dad1c5e996e3cd33b8a76a50167ae5f96a2607cbe8cc773506ab22", size = 148796, upload-time = "2025-10-08T22:01:10.266Z" },
-    { url = "https://files.pythonhosted.org/packages/60/83/59bff4996c2cf9f9387a0f5a3394629c7efa5ef16142076a23a90f1955fa/tomli-2.3.0-cp312-cp312-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:792262b94d5d0a466afb5bc63c7daa9d75520110971ee269152083270998316f", size = 242121, upload-time = "2025-10-08T22:01:11.332Z" },
-    { url = "https://files.pythonhosted.org/packages/45/e5/7c5119ff39de8693d6baab6c0b6dcb556d192c165596e9fc231ea1052041/tomli-2.3.0-cp312-cp312-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:4f195fe57ecceac95a66a75ac24d9d5fbc98ef0962e09b2eddec5d39375aae52", size = 250070, upload-time = "2025-10-08T22:01:12.498Z" },
-    { url = "https://files.pythonhosted.org/packages/45/12/ad5126d3a278f27e6701abde51d342aa78d06e27ce2bb596a01f7709a5a2/tomli-2.3.0-cp312-cp312-musllinux_1_2_aarch64.whl", hash = "sha256:e31d432427dcbf4d86958c184b9bfd1e96b5b71f8eb17e6d02531f434fd335b8", size = 245859, upload-time = "2025-10-08T22:01:13.551Z" },
-    { url = "https://files.pythonhosted.org/packages/fb/a1/4d6865da6a71c603cfe6ad0e6556c73c76548557a8d658f9e3b142df245f/tomli-2.3.0-cp312-cp312-musllinux_1_2_x86_64.whl", hash = "sha256:7b0882799624980785240ab732537fcfc372601015c00f7fc367c55308c186f6", size = 250296, upload-time = "2025-10-08T22:01:14.614Z" },
-    { url = "https://files.pythonhosted.org/packages/a0/b7/a7a7042715d55c9ba6e8b196d65d2cb662578b4d8cd17d882d45322b0d78/tomli-2.3.0-cp312-cp312-win32.whl", hash = "sha256:ff72b71b5d10d22ecb084d345fc26f42b5143c5533db5e2eaba7d2d335358876", size = 97124, upload-time = "2025-10-08T22:01:15.629Z" },
-    { url = "https://files.pythonhosted.org/packages/06/1e/f22f100db15a68b520664eb3328fb0ae4e90530887928558112c8d1f4515/tomli-2.3.0-cp312-cp312-win_amd64.whl", hash = "sha256:1cb4ed918939151a03f33d4242ccd0aa5f11b3547d0cf30f7c74a408a5b99878", size = 107698, upload-time = "2025-10-08T22:01:16.51Z" },
-    { url = "https://files.pythonhosted.org/packages/89/48/06ee6eabe4fdd9ecd48bf488f4ac783844fd777f547b8d1b61c11939974e/tomli-2.3.0-cp313-cp313-macosx_10_13_x86_64.whl", hash = "sha256:5192f562738228945d7b13d4930baffda67b69425a7f0da96d360b0a3888136b", size = 154819, upload-time = "2025-10-08T22:01:17.964Z" },
-    { url = "https://files.pythonhosted.org/packages/f1/01/88793757d54d8937015c75dcdfb673c65471945f6be98e6a0410fba167ed/tomli-2.3.0-cp313-cp313-macosx_11_0_arm64.whl", hash = "sha256:be71c93a63d738597996be9528f4abe628d1adf5e6eb11607bc8fe1a510b5dae", size = 148766, upload-time = "2025-10-08T22:01:18.959Z" },
-    { url = "https://files.pythonhosted.org/packages/42/17/5e2c956f0144b812e7e107f94f1cc54af734eb17b5191c0bbfb72de5e93e/tomli-2.3.0-cp313-cp313-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:c4665508bcbac83a31ff8ab08f424b665200c0e1e645d2bd9ab3d3e557b6185b", size = 240771, upload-time = "2025-10-08T22:01:20.106Z" },
-    { url = "https://files.pythonhosted.org/packages/d5/f4/0fbd014909748706c01d16824eadb0307115f9562a15cbb012cd9b3512c5/tomli-2.3.0-cp313-cp313-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:4021923f97266babc6ccab9f5068642a0095faa0a51a246a6a02fccbb3514eaf", size = 248586, upload-time = "2025-10-08T22:01:21.164Z" },
-    { url = "https://files.pythonhosted.org/packages/30/77/fed85e114bde5e81ecf9bc5da0cc69f2914b38f4708c80ae67d0c10180c5/tomli-2.3.0-cp313-cp313-musllinux_1_2_aarch64.whl", hash = "sha256:a4ea38c40145a357d513bffad0ed869f13c1773716cf71ccaa83b0fa0cc4e42f", size = 244792, upload-time = "2025-10-08T22:01:22.417Z" },
-    { url = "https://files.pythonhosted.org/packages/55/92/afed3d497f7c186dc71e6ee6d4fcb0acfa5f7d0a1a2878f8beae379ae0cc/tomli-2.3.0-cp313-cp313-musllinux_1_2_x86_64.whl", hash = "sha256:ad805ea85eda330dbad64c7ea7a4556259665bdf9d2672f5dccc740eb9d3ca05", size = 248909, upload-time = "2025-10-08T22:01:23.859Z" },
-    { url = "https://files.pythonhosted.org/packages/f8/84/ef50c51b5a9472e7265ce1ffc7f24cd4023d289e109f669bdb1553f6a7c2/tomli-2.3.0-cp313-cp313-win32.whl", hash = "sha256:97d5eec30149fd3294270e889b4234023f2c69747e555a27bd708828353ab606", size = 96946, upload-time = "2025-10-08T22:01:24.893Z" },
-    { url = "https://files.pythonhosted.org/packages/b2/b7/718cd1da0884f281f95ccfa3a6cc572d30053cba64603f79d431d3c9b61b/tomli-2.3.0-cp313-cp313-win_amd64.whl", hash = "sha256:0c95ca56fbe89e065c6ead5b593ee64b84a26fca063b5d71a1122bf26e533999", size = 107705, upload-time = "2025-10-08T22:01:26.153Z" },
-    { url = "https://files.pythonhosted.org/packages/19/94/aeafa14a52e16163008060506fcb6aa1949d13548d13752171a755c65611/tomli-2.3.0-cp314-cp314-macosx_10_13_x86_64.whl", hash = "sha256:cebc6fe843e0733ee827a282aca4999b596241195f43b4cc371d64fc6639da9e", size = 154244, upload-time = "2025-10-08T22:01:27.06Z" },
-    { url = "https://files.pythonhosted.org/packages/db/e4/1e58409aa78eefa47ccd19779fc6f36787edbe7d4cd330eeeedb33a4515b/tomli-2.3.0-cp314-cp314-macosx_11_0_arm64.whl", hash = "sha256:4c2ef0244c75aba9355561272009d934953817c49f47d768070c3c94355c2aa3", size = 148637, upload-time = "2025-10-08T22:01:28.059Z" },
-    { url = "https://files.pythonhosted.org/packages/26/b6/d1eccb62f665e44359226811064596dd6a366ea1f985839c566cd61525ae/tomli-2.3.0-cp314-cp314-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:c22a8bf253bacc0cf11f35ad9808b6cb75ada2631c2d97c971122583b129afbc", size = 241925, upload-time = "2025-10-08T22:01:29.066Z" },
-    { url = "https://files.pythonhosted.org/packages/70/91/7cdab9a03e6d3d2bb11beae108da5bdc1c34bdeb06e21163482544ddcc90/tomli-2.3.0-cp314-cp314-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:0eea8cc5c5e9f89c9b90c4896a8deefc74f518db5927d0e0e8d4a80953d774d0", size = 249045, upload-time = "2025-10-08T22:01:31.98Z" },
-    { url = "https://files.pythonhosted.org/packages/15/1b/8c26874ed1f6e4f1fcfeb868db8a794cbe9f227299402db58cfcc858766c/tomli-2.3.0-cp314-cp314-musllinux_1_2_aarch64.whl", hash = "sha256:b74a0e59ec5d15127acdabd75ea17726ac4c5178ae51b85bfe39c4f8a278e879", size = 245835, upload-time = "2025-10-08T22:01:32.989Z" },
-    { url = "https://files.pythonhosted.org/packages/fd/42/8e3c6a9a4b1a1360c1a2a39f0b972cef2cc9ebd56025168c4137192a9321/tomli-2.3.0-cp314-cp314-musllinux_1_2_x86_64.whl", hash = "sha256:b5870b50c9db823c595983571d1296a6ff3e1b88f734a4c8f6fc6188397de005", size = 253109, upload-time = "2025-10-08T22:01:34.052Z" },
-    { url = "https://files.pythonhosted.org/packages/22/0c/b4da635000a71b5f80130937eeac12e686eefb376b8dee113b4a582bba42/tomli-2.3.0-cp314-cp314-win32.whl", hash = "sha256:feb0dacc61170ed7ab602d3d972a58f14ee3ee60494292d384649a3dc38ef463", size = 97930, upload-time = "2025-10-08T22:01:35.082Z" },
-    { url = "https://files.pythonhosted.org/packages/b9/74/cb1abc870a418ae99cd5c9547d6bce30701a954e0e721821df483ef7223c/tomli-2.3.0-cp314-cp314-win_amd64.whl", hash = "sha256:b273fcbd7fc64dc3600c098e39136522650c49bca95df2d11cf3b626422392c8", size = 107964, upload-time = "2025-10-08T22:01:36.057Z" },
-    { url = "https://files.pythonhosted.org/packages/54/78/5c46fff6432a712af9f792944f4fcd7067d8823157949f4e40c56b8b3c83/tomli-2.3.0-cp314-cp314t-macosx_10_13_x86_64.whl", hash = "sha256:940d56ee0410fa17ee1f12b817b37a4d4e4dc4d27340863cc67236c74f582e77", size = 163065, upload-time = "2025-10-08T22:01:37.27Z" },
-    { url = "https://files.pythonhosted.org/packages/39/67/f85d9bd23182f45eca8939cd2bc7050e1f90c41f4a2ecbbd5963a1d1c486/tomli-2.3.0-cp314-cp314t-macosx_11_0_arm64.whl", hash = "sha256:f85209946d1fe94416debbb88d00eb92ce9cd5266775424ff81bc959e001acaf", size = 159088, upload-time = "2025-10-08T22:01:38.235Z" },
-    { url = "https://files.pythonhosted.org/packages/26/5a/4b546a0405b9cc0659b399f12b6adb750757baf04250b148d3c5059fc4eb/tomli-2.3.0-cp314-cp314t-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:a56212bdcce682e56b0aaf79e869ba5d15a6163f88d5451cbde388d48b13f530", size = 268193, upload-time = "2025-10-08T22:01:39.712Z" },
-    { url = "https://files.pythonhosted.org/packages/42/4f/2c12a72ae22cf7b59a7fe75b3465b7aba40ea9145d026ba41cb382075b0e/tomli-2.3.0-cp314-cp314t-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:c5f3ffd1e098dfc032d4d3af5c0ac64f6d286d98bc148698356847b80fa4de1b", size = 275488, upload-time = "2025-10-08T22:01:40.773Z" },
-    { url = "https://files.pythonhosted.org/packages/92/04/a038d65dbe160c3aa5a624e93ad98111090f6804027d474ba9c37c8ae186/tomli-2.3.0-cp314-cp314t-musllinux_1_2_aarch64.whl", hash = "sha256:5e01decd096b1530d97d5d85cb4dff4af2d8347bd35686654a004f8dea20fc67", size = 272669, upload-time = "2025-10-08T22:01:41.824Z" },
-    { url = "https://files.pythonhosted.org/packages/be/2f/8b7c60a9d1612a7cbc39ffcca4f21a73bf368a80fc25bccf8253e2563267/tomli-2.3.0-cp314-cp314t-musllinux_1_2_x86_64.whl", hash = "sha256:8a35dd0e643bb2610f156cca8db95d213a90015c11fee76c946aa62b7ae7e02f", size = 279709, upload-time = "2025-10-08T22:01:43.177Z" },
-    { url = "https://files.pythonhosted.org/packages/7e/46/cc36c679f09f27ded940281c38607716c86cf8ba4a518d524e349c8b4874/tomli-2.3.0-cp314-cp314t-win32.whl", hash = "sha256:a1f7f282fe248311650081faafa5f4732bdbfef5d45fe3f2e702fbc6f2d496e0", size = 107563, upload-time = "2025-10-08T22:01:44.233Z" },
-    { url = "https://files.pythonhosted.org/packages/84/ff/426ca8683cf7b753614480484f6437f568fd2fda2edbdf57a2d3d8b27a0b/tomli-2.3.0-cp314-cp314t-win_amd64.whl", hash = "sha256:70a251f8d4ba2d9ac2542eecf008b3c8a9fc5c3f9f02c56a9d7952612be2fdba", size = 119756, upload-time = "2025-10-08T22:01:45.234Z" },
-    { url = "https://files.pythonhosted.org/packages/77/b8/0135fadc89e73be292b473cb820b4f5a08197779206b33191e801feeae40/tomli-2.3.0-py3-none-any.whl", hash = "sha256:e95b1af3c5b07d9e643909b5abbec77cd9f1217e6d0bca72b0234736b9fb1f1b", size = 14408, upload-time = "2025-10-08T22:01:46.04Z" },
-]
-
 [[package]]
 name = "tqdm"
 version = "4.67.1"