From 2105f27bfa0b097d1092f2f3c1f016a51c73a0ae Mon Sep 17 00:00:00 2001 From: Cdeth567 <11kvvkvv11@mail.ru> Date: Thu, 5 Mar 2026 18:51:56 +0300 Subject: [PATCH 01/13] Lab 6: blocks/tags, Docker Compose, wipe logic, CI/CD --- .github/workflows/ansible-deploy.yml | 91 ++ .gitignore | 2 +- ansible/ansible.cfg | 22 +- ansible/docs/LAB05.md | 764 +++++++------- ansible/docs/LAB06.md | 960 ++++++++++++++++++ ansible/group_vars/all.yml | 36 +- ansible/inventory/hosts.ini | 2 +- ansible/playbooks/deploy.yml | 18 +- ansible/playbooks/provision.yml | 16 +- ansible/playbooks/site.yml | 18 +- ansible/roles/app_deploy/tasks/main.yml | 46 - ansible/roles/common/defaults/main.yml | 28 +- ansible/roles/common/tasks/main.yml | 99 +- ansible/roles/docker/defaults/main.yml | 25 +- ansible/roles/docker/handlers/main.yml | 10 +- ansible/roles/docker/tasks/main.yml | 168 ++- .../{app_deploy => web_app}/defaults/main.yml | 25 +- .../{app_deploy => web_app}/handlers/main.yml | 12 +- ansible/roles/web_app/meta/main.yml | 9 + ansible/roles/web_app/tasks/main.yml | 80 ++ ansible/roles/web_app/tasks/wipe.yml | 23 + .../web_app/templates/docker-compose.yml.j2 | 30 + 22 files changed, 1892 insertions(+), 592 deletions(-) create mode 100644 .github/workflows/ansible-deploy.yml create mode 100644 ansible/docs/LAB06.md delete mode 100644 ansible/roles/app_deploy/tasks/main.yml rename ansible/roles/{app_deploy => web_app}/defaults/main.yml (68%) rename ansible/roles/{app_deploy => web_app}/handlers/main.yml (96%) create mode 100644 ansible/roles/web_app/meta/main.yml create mode 100644 ansible/roles/web_app/tasks/main.yml create mode 100644 ansible/roles/web_app/tasks/wipe.yml create mode 100644 ansible/roles/web_app/templates/docker-compose.yml.j2 diff --git a/.github/workflows/ansible-deploy.yml b/.github/workflows/ansible-deploy.yml new file mode 100644 index 0000000000..551819a03f --- /dev/null +++ b/.github/workflows/ansible-deploy.yml @@ -0,0 +1,91 @@ +name: Ansible Deployment + +on: + push: 
+ branches: [master] + paths: + - 'ansible/**' + - '!ansible/docs/**' + - '.github/workflows/ansible-deploy.yml' + pull_request: + branches: [master] + paths: + - 'ansible/**' + - '.github/workflows/ansible-deploy.yml' + +concurrency: + group: ansible-deploy-${{ github.ref }} + cancel-in-progress: true + +permissions: + contents: read + +jobs: + lint: + name: Ansible Lint + runs-on: ubuntu-latest + steps: + - name: Checkout repository + uses: actions/checkout@v4 + + - name: Set up Python 3.12 + uses: actions/setup-python@v5 + with: + python-version: '3.12' + cache: pip + + - name: Install Ansible and ansible-lint + run: pip install ansible ansible-lint + + - name: Run ansible-lint + run: | + cd ansible + ansible-lint playbooks/provision.yml playbooks/deploy.yml playbooks/site.yml + + deploy: + name: Deploy Application + needs: lint + runs-on: ubuntu-latest + if: github.event_name == 'push' + steps: + - name: Checkout repository + uses: actions/checkout@v4 + + - name: Set up Python 3.12 + uses: actions/setup-python@v5 + with: + python-version: '3.12' + cache: pip + + - name: Install Ansible + run: pip install ansible + + - name: Install community.docker collection + run: ansible-galaxy collection install community.docker community.general + + - name: Configure SSH access to target VM + run: | + mkdir -p ~/.ssh + echo "${{ secrets.SSH_PRIVATE_KEY }}" > ~/.ssh/id_rsa + chmod 600 ~/.ssh/id_rsa + ssh-keyscan -H "${{ secrets.VM_HOST }}" >> ~/.ssh/known_hosts + + - name: Write Vault password file + run: echo "${{ secrets.ANSIBLE_VAULT_PASSWORD }}" > /tmp/vault_pass + + - name: Run Ansible deploy playbook + env: + ANSIBLE_HOST_KEY_CHECKING: "False" + run: | + cd ansible + ansible-playbook playbooks/deploy.yml \ + --vault-password-file /tmp/vault_pass + + - name: Clean up Vault password file + if: always() + run: rm -f /tmp/vault_pass + + - name: Verify deployment + run: | + sleep 10 + curl -f "http://${{ secrets.VM_HOST }}:5000/health" || exit 1 diff --git a/.gitignore 
b/.gitignore index 30d74d2584..5dfde0f734 100644 --- a/.gitignore +++ b/.gitignore @@ -1 +1 @@ -test \ No newline at end of file +test.vault_pass diff --git a/ansible/ansible.cfg b/ansible/ansible.cfg index 11bb2bd1f9..7737aab432 100644 --- a/ansible/ansible.cfg +++ b/ansible/ansible.cfg @@ -1,12 +1,12 @@ -[defaults] -vault_password_file = .vault_pass -inventory = inventory/hosts.ini -roles_path = roles -host_key_checking = False -remote_user = ubuntu -retry_files_enabled = False - -[privilege_escalation] -become = True -become_method = sudo +[defaults] +vault_password_file = .vault_pass +inventory = inventory/hosts.ini +roles_path = roles +host_key_checking = False +remote_user = ubuntu +retry_files_enabled = False + +[privilege_escalation] +become = True +become_method = sudo become_user = root \ No newline at end of file diff --git a/ansible/docs/LAB05.md b/ansible/docs/LAB05.md index 936cc2037b..b5bb093bfc 100644 --- a/ansible/docs/LAB05.md +++ b/ansible/docs/LAB05.md @@ -1,382 +1,382 @@ -# Lab 05 — Ansible Fundamentals - -## 1. 
Architecture Overview - -**Ansible version:** ansible [core 2.16.3] - -**Target VM OS:** Ubuntu 22.04.5 LTS (ubuntu/jammy64 via Vagrant + VirtualBox) - -**Control node:** WSL2 (Ubuntu) on Windows - -### Role Structure - -``` -ansible/ -├── inventory/ -│ └── hosts.ini # Static inventory — VM IP + SSH key -├── roles/ -│ ├── common/ # System packages & timezone -│ │ ├── tasks/main.yml -│ │ └── defaults/main.yml -│ ├── docker/ # Docker CE installation -│ │ ├── tasks/main.yml -│ │ ├── handlers/main.yml -│ │ └── defaults/main.yml -│ └── app_deploy/ # Pull & run containerized app -│ ├── tasks/main.yml -│ ├── handlers/main.yml -│ └── defaults/main.yml -├── playbooks/ -│ ├── site.yml # Imports both playbooks -│ ├── provision.yml # common + docker roles -│ └── deploy.yml # app_deploy role -├── group_vars/ -│ └── all.yml # Ansible Vault encrypted secrets -├── ansible.cfg -└── docs/LAB05.md -``` - -### Connectivity Test - -``` -$ ansible all -m ping - -devops-vm | SUCCESS => { - "changed": false, - "ping": "pong" -} -``` - ---- - -### Why Roles Instead of Monolithic Playbooks? - -Roles split responsibilities cleanly: `common` handles system setup, `docker` handles Docker installation, `app_deploy` handles the application. Each role can be reused across multiple projects, tested independently, and understood in isolation. A monolithic playbook with 50+ tasks becomes impossible to maintain — roles keep complexity manageable. - ---- - -## 2. Roles Documentation - -### Role: `common` - -**Purpose:** Prepares every server with baseline tools. Updates the apt cache and installs utilities like git, curl, vim, htop, python3-pip. 
- -**Variables (`defaults/main.yml`):** -| Variable | Default | Description | -|---|---|---| -| `common_packages` | list of packages | Packages to install via apt | -| `common_timezone` | `UTC` | System timezone | - -**Handlers:** None - -**Dependencies:** None - ---- - -### Role: `docker` - -**Purpose:** Installs Docker CE from the official Docker repository using the modern GPG key method (`/etc/apt/keyrings/docker.gpg`), ensures the service is running and enabled at boot, adds the target user to the `docker` group. - -**Variables (`defaults/main.yml`):** -| Variable | Default | Description | -|---|---|---| -| `docker_packages` | docker-ce, cli, containerd, plugins | Packages to install | -| `docker_user` | `vagrant` | User to add to docker group | - -**Handlers:** -- `restart docker` — triggered when Docker packages are installed for the first time - -**Dependencies:** `common` role (needs ca-certificates, gnupg pre-installed) - ---- - -### Role: `app_deploy` - -**Purpose:** Authenticates with Docker Hub using vaulted credentials, pulls the latest image of the Python app (`cdeth567/devops-info-service`), removes any old container, starts a fresh container with port mapping 5000:5000, and verifies the `/health` endpoint responds HTTP 200. 
- -**Variables (`group_vars/all.yml` — Vault encrypted):** -| Variable | Description | -|---|---| -| `dockerhub_username` | Docker Hub username (`cdeth567`) | -| `dockerhub_password` | Docker Hub access token | -| `app_name` | `devops-info-service` | -| `docker_image` | `cdeth567/devops-info-service` | -| `docker_image_tag` | `latest` | -| `app_port` | `5000` | -| `app_container_name` | `devops-info-service` | - -**Variables (`defaults/main.yml`):** -| Variable | Default | Description | -|---|---|---| -| `app_port` | `5000` | Port to expose | -| `app_restart_policy` | `unless-stopped` | Docker restart policy | -| `app_env_vars` | `{}` | Extra env vars for container | - -**Handlers:** -- `restart app container` — restarts the container when triggered by config change - -**Dependencies:** `docker` role must run first - ---- - -## 3. Idempotency Demonstration - -### First Run (`ansible-playbook playbooks/provision.yml`) - -``` -PLAY [Provision web servers] **************************************************** - -TASK [Gathering Facts] ********************************************************** -ok: [devops-vm] - -TASK [common : Update apt cache] ************************************************ -changed: [devops-vm] - -TASK [common : Install common packages] ***************************************** -changed: [devops-vm] - -TASK [common : Set timezone (optional)] ***************************************** -changed: [devops-vm] - -TASK [docker : Install prerequisites for Docker repo] *************************** -ok: [devops-vm] - -TASK [docker : Ensure /etc/apt/keyrings exists] ********************************* -ok: [devops-vm] - -TASK [docker : Download and dearmor Docker GPG key] ***************************** -ok: [devops-vm] - -TASK [docker : Add Docker apt repository] *************************************** -changed: [devops-vm] - -TASK [docker : Install Docker packages] ***************************************** -changed: [devops-vm] - -TASK [docker : Ensure Docker 
service is started and enabled] ******************** -ok: [devops-vm] - -TASK [docker : Add user to docker group] **************************************** -changed: [devops-vm] - -TASK [docker : Install python3-docker for Ansible Docker modules] *************** -changed: [devops-vm] - -PLAY RECAP ********************************************************************** -devops-vm : ok=10 changed=6 unreachable=0 failed=0 -``` - -### Second Run (`ansible-playbook playbooks/provision.yml`) - -``` -PLAY [Provision web servers] **************************************************** - -TASK [Gathering Facts] ********************************************************** -ok: [devops-vm] - -TASK [common : Update apt cache] ************************************************ -ok: [devops-vm] - -TASK [common : Install common packages] ***************************************** -ok: [devops-vm] - -TASK [common : Set timezone (optional)] ***************************************** -ok: [devops-vm] - -TASK [docker : Install prerequisites for Docker repo] *************************** -ok: [devops-vm] - -TASK [docker : Ensure /etc/apt/keyrings exists] ********************************* -ok: [devops-vm] - -TASK [docker : Download and dearmor Docker GPG key] ***************************** -ok: [devops-vm] - -TASK [docker : Add Docker apt repository] *************************************** -ok: [devops-vm] - -TASK [docker : Install Docker packages] ***************************************** -ok: [devops-vm] - -TASK [docker : Ensure Docker service is started and enabled] ******************** -ok: [devops-vm] - -TASK [docker : Add user to docker group] **************************************** -ok: [devops-vm] - -TASK [docker : Install python3-docker for Ansible Docker modules] *************** -ok: [devops-vm] - -PLAY RECAP ********************************************************************** -devops-vm : ok=12 changed=0 unreachable=0 failed=0 -``` - -### Analysis - -**First run — why tasks showed 
`changed`:** -- `Update apt cache` — package lists were stale, had to refresh -- `Install common packages` — git, curl, vim etc. weren't installed yet -- `Set timezone` — timezone wasn't configured -- `Download and dearmor Docker GPG key` — key wasn't in `/etc/apt/keyrings/` yet -- `Add Docker apt repository` — Docker repo wasn't in sources -- `Install Docker packages` — Docker CE wasn't installed -- `Add user to docker group` — vagrant user wasn't in docker group -- `Install python3-docker` — Python Docker SDK wasn't installed - -**Second run — zero `changed`, all `ok`:** -Every Ansible module checks current state before acting. `apt: state=present` checks if package already exists. `file: state=directory` checks if directory exists. `apt_repository` checks if repo is already listed. Since everything was already in desired state, no changes were made. This is idempotency. - -**What makes these roles idempotent:** -- `apt: state=present` — only installs if not already present -- `file: state=directory` — only creates if missing -- `args: creates: /etc/apt/keyrings/docker.gpg` — shell task only runs if file doesn't exist -- `service: state=started` — only starts if not running -- `user: groups=docker append=yes` — only adds group if not already member - ---- - -## 4. Ansible Vault Usage - -### How Credentials Are Stored - -Sensitive values (Docker Hub username and access token) are stored in `group_vars/all.yml`, encrypted with Ansible Vault AES256. The file in the repository looks like: - -``` -$ANSIBLE_VAULT;1.1;AES256 -65633261653764613262313261356561613666306634343139313537336332386233336231343839 -3737366161363662643132656239373562613734356364660a646666633665353562643636393261 -... -``` - -Nobody can read the credentials without the vault password. 
- -### Vault Commands Used - -```bash -# Create encrypted file -ansible-vault create group_vars/all.yml - -# View contents (to verify) -ansible-vault view group_vars/all.yml --ask-vault-pass - -# Edit contents -ansible-vault edit group_vars/all.yml -``` - -### Vault Password Management - -A `.vault_pass` file stores the password locally: -```bash -echo "your-password" > .vault_pass -chmod 600 .vault_pass -``` - -`ansible.cfg` references it: -```ini -[defaults] -vault_password_file = .vault_pass -``` - -`.vault_pass` is added to `.gitignore` — never committed. - -### Proof File Is Encrypted - -``` -$ cat group_vars/all.yml -$ANSIBLE_VAULT;1.1;AES256 -65633261653764613262313261356561613666306634343139313537336332386233336231343839 -3737366161363662643132656239373562613734356364660a646666633665353562643636393261 -61346366636665303935353636656633663539616561373266333139356432623534636264326636 -6338313961386638380a656665313965346133373436656339613837356563363965313735316339 -... -``` - -### Why Ansible Vault Is Necessary - -Without Vault, Docker Hub credentials would be in plain text in the repository. Anyone with read access (teammates, CI/CD systems, public GitHub) could see the token. Vault encrypts with AES-256 — the file is safe to commit while keeping actual values private. - ---- - -## 5. 
Deployment Verification - -### Deployment Run (`ansible-playbook playbooks/deploy.yml`) - -``` -PLAY [Deploy application] ******************************************************* - -TASK [Gathering Facts] ********************************************************** -ok: [devops-vm] - -TASK [app_deploy : Log in to Docker Hub] **************************************** -ok: [devops-vm] - -TASK [app_deploy : Pull Docker image] ******************************************* -ok: [devops-vm] - -TASK [app_deploy : Remove old container if exists] ****************************** -changed: [devops-vm] - -TASK [app_deploy : Run new container] ******************************************* -changed: [devops-vm] - -TASK [app_deploy : Wait for application port] *********************************** -ok: [devops-vm] - -TASK [app_deploy : Verify health endpoint] ************************************** -ok: [devops-vm] - -PLAY RECAP ********************************************************************** -devops-vm : ok=7 changed=2 unreachable=0 failed=0 -``` - -### Container Status (`docker ps`) - -``` -$ ansible webservers -a "docker ps" - -devops-vm | CHANGED | rc=0 >> -CONTAINER ID IMAGE COMMAND CREATED STATUS PORTS NAMES -89b8f4104cfb cdeth567/devops-info-service:latest "python app.py" 1 minute ago Up 1 minute 0.0.0.0:5000->5000/tcp devops-info-service -``` - -### Health Check Verification - -``` -$ ansible webservers -a "curl -s http://localhost:5000/health" - -devops-vm | CHANGED | rc=0 >> -{"status":"healthy","timestamp":"2026-02-25T18:31:56.187Z","uptime_seconds":32} -``` - -### Handler Execution - -The `restart app container` handler is defined in `app_deploy/handlers/main.yml` and triggers only when container configuration changes. During normal re-deployment, the remove+start tasks handle container lifecycle directly. - ---- - -## 6. Key Decisions - -**Why use roles instead of plain playbooks?** -Roles enforce a standard structure and make code reusable. 
The `docker` role can be dropped into any future project without modification. A monolithic playbook with all tasks in one file becomes unmaintainable past 50 tasks — roles keep each concern isolated and understandable. - -**How do roles improve reusability?** -Each role encapsulates one responsibility with its own defaults, handlers, and tasks. The `common` and `docker` roles can be included in any server provisioning project. Variables in `defaults/` provide sensible out-of-the-box behavior that can be overridden per environment without changing role code. - -**What makes a task idempotent?** -A task is idempotent when it checks existing state before acting and only makes changes if current state differs from desired state. Ansible's built-in modules (apt, service, user, docker_container) all implement this natively — they check first, act only if needed. - -**How do handlers improve efficiency?** -Handlers only run once at the end of a play, even if notified multiple times by different tasks. Without handlers, Docker would restart after every individual package or config task. With handlers, it restarts exactly once after all changes complete — saving time and avoiding unnecessary service disruptions. - -**Why is Ansible Vault necessary?** -Credentials in plain text in a repository are a security breach. Any team member, CI system, or public viewer could see Docker Hub tokens. Vault encrypts secrets with AES-256 so the file can be safely committed and shared while keeping actual values accessible only to those with the vault password. - ---- - -## 7. 
Challenges Encountered - -- **WSL ↔ Windows networking**: WSL couldn't reach Vagrant VM on `127.0.0.1:2222` — fixed by adding a Windows portproxy (`netsh interface portproxy`) and using the WSL gateway IP `172.26.16.1` as the Ansible host -- **ansible.cfg ignored**: Ansible ignores config files in world-writable directories (Windows NTFS mounts in WSL) — fixed by copying the project to WSL home directory `~/ansible` -- **Docker GPG key**: The `apt_key` module is deprecated on Ubuntu 22.04 — fixed by using `curl | gpg --dearmor` to save key to `/etc/apt/keyrings/docker.gpg` with `signed-by=` in the repo line -- **Vault vars undefined in role**: With `become: true`, vault variables weren't passed into the role context — fixed by adding `vars_files: ../group_vars/all.yml` explicitly in `deploy.yml` -- **Vault password file path**: Relative path `.vault_pass` in `ansible.cfg` didn't work — fixed by using absolute path `/home/cdeth567/ansible/.vault_pass` locally (relative path used in repo version) +# Lab 05 — Ansible Fundamentals + +## 1. 
Architecture Overview + +**Ansible version:** ansible [core 2.16.3] + +**Target VM OS:** Ubuntu 22.04.5 LTS (ubuntu/jammy64 via Vagrant + VirtualBox) + +**Control node:** WSL2 (Ubuntu) on Windows + +### Role Structure + +``` +ansible/ +├── inventory/ +│ └── hosts.ini # Static inventory — VM IP + SSH key +├── roles/ +│ ├── common/ # System packages & timezone +│ │ ├── tasks/main.yml +│ │ └── defaults/main.yml +│ ├── docker/ # Docker CE installation +│ │ ├── tasks/main.yml +│ │ ├── handlers/main.yml +│ │ └── defaults/main.yml +│ └── app_deploy/ # Pull & run containerized app +│ ├── tasks/main.yml +│ ├── handlers/main.yml +│ └── defaults/main.yml +├── playbooks/ +│ ├── site.yml # Imports both playbooks +│ ├── provision.yml # common + docker roles +│ └── deploy.yml # app_deploy role +├── group_vars/ +│ └── all.yml # Ansible Vault encrypted secrets +├── ansible.cfg +└── docs/LAB05.md +``` + +### Connectivity Test + +``` +$ ansible all -m ping + +devops-vm | SUCCESS => { + "changed": false, + "ping": "pong" +} +``` + +--- + +### Why Roles Instead of Monolithic Playbooks? + +Roles split responsibilities cleanly: `common` handles system setup, `docker` handles Docker installation, `app_deploy` handles the application. Each role can be reused across multiple projects, tested independently, and understood in isolation. A monolithic playbook with 50+ tasks becomes impossible to maintain — roles keep complexity manageable. + +--- + +## 2. Roles Documentation + +### Role: `common` + +**Purpose:** Prepares every server with baseline tools. Updates the apt cache and installs utilities like git, curl, vim, htop, python3-pip. 
+ +**Variables (`defaults/main.yml`):** +| Variable | Default | Description | +|---|---|---| +| `common_packages` | list of packages | Packages to install via apt | +| `common_timezone` | `UTC` | System timezone | + +**Handlers:** None + +**Dependencies:** None + +--- + +### Role: `docker` + +**Purpose:** Installs Docker CE from the official Docker repository using the modern GPG key method (`/etc/apt/keyrings/docker.gpg`), ensures the service is running and enabled at boot, adds the target user to the `docker` group. + +**Variables (`defaults/main.yml`):** +| Variable | Default | Description | +|---|---|---| +| `docker_packages` | docker-ce, cli, containerd, plugins | Packages to install | +| `docker_user` | `vagrant` | User to add to docker group | + +**Handlers:** +- `restart docker` — triggered when Docker packages are installed for the first time + +**Dependencies:** `common` role (needs ca-certificates, gnupg pre-installed) + +--- + +### Role: `app_deploy` + +**Purpose:** Authenticates with Docker Hub using vaulted credentials, pulls the latest image of the Python app (`cdeth567/devops-info-service`), removes any old container, starts a fresh container with port mapping 5000:5000, and verifies the `/health` endpoint responds HTTP 200. 
+ +**Variables (`group_vars/all.yml` — Vault encrypted):** +| Variable | Description | +|---|---| +| `dockerhub_username` | Docker Hub username (`cdeth567`) | +| `dockerhub_password` | Docker Hub access token | +| `app_name` | `devops-info-service` | +| `docker_image` | `cdeth567/devops-info-service` | +| `docker_image_tag` | `latest` | +| `app_port` | `5000` | +| `app_container_name` | `devops-info-service` | + +**Variables (`defaults/main.yml`):** +| Variable | Default | Description | +|---|---|---| +| `app_port` | `5000` | Port to expose | +| `app_restart_policy` | `unless-stopped` | Docker restart policy | +| `app_env_vars` | `{}` | Extra env vars for container | + +**Handlers:** +- `restart app container` — restarts the container when triggered by config change + +**Dependencies:** `docker` role must run first + +--- + +## 3. Idempotency Demonstration + +### First Run (`ansible-playbook playbooks/provision.yml`) + +``` +PLAY [Provision web servers] **************************************************** + +TASK [Gathering Facts] ********************************************************** +ok: [devops-vm] + +TASK [common : Update apt cache] ************************************************ +changed: [devops-vm] + +TASK [common : Install common packages] ***************************************** +changed: [devops-vm] + +TASK [common : Set timezone (optional)] ***************************************** +changed: [devops-vm] + +TASK [docker : Install prerequisites for Docker repo] *************************** +ok: [devops-vm] + +TASK [docker : Ensure /etc/apt/keyrings exists] ********************************* +ok: [devops-vm] + +TASK [docker : Download and dearmor Docker GPG key] ***************************** +ok: [devops-vm] + +TASK [docker : Add Docker apt repository] *************************************** +changed: [devops-vm] + +TASK [docker : Install Docker packages] ***************************************** +changed: [devops-vm] + +TASK [docker : Ensure Docker 
service is started and enabled] ******************** +ok: [devops-vm] + +TASK [docker : Add user to docker group] **************************************** +changed: [devops-vm] + +TASK [docker : Install python3-docker for Ansible Docker modules] *************** +changed: [devops-vm] + +PLAY RECAP ********************************************************************** +devops-vm : ok=10 changed=6 unreachable=0 failed=0 +``` + +### Second Run (`ansible-playbook playbooks/provision.yml`) + +``` +PLAY [Provision web servers] **************************************************** + +TASK [Gathering Facts] ********************************************************** +ok: [devops-vm] + +TASK [common : Update apt cache] ************************************************ +ok: [devops-vm] + +TASK [common : Install common packages] ***************************************** +ok: [devops-vm] + +TASK [common : Set timezone (optional)] ***************************************** +ok: [devops-vm] + +TASK [docker : Install prerequisites for Docker repo] *************************** +ok: [devops-vm] + +TASK [docker : Ensure /etc/apt/keyrings exists] ********************************* +ok: [devops-vm] + +TASK [docker : Download and dearmor Docker GPG key] ***************************** +ok: [devops-vm] + +TASK [docker : Add Docker apt repository] *************************************** +ok: [devops-vm] + +TASK [docker : Install Docker packages] ***************************************** +ok: [devops-vm] + +TASK [docker : Ensure Docker service is started and enabled] ******************** +ok: [devops-vm] + +TASK [docker : Add user to docker group] **************************************** +ok: [devops-vm] + +TASK [docker : Install python3-docker for Ansible Docker modules] *************** +ok: [devops-vm] + +PLAY RECAP ********************************************************************** +devops-vm : ok=12 changed=0 unreachable=0 failed=0 +``` + +### Analysis + +**First run — why tasks showed 
`changed`:** +- `Update apt cache` — package lists were stale, had to refresh +- `Install common packages` — git, curl, vim etc. weren't installed yet +- `Set timezone` — timezone wasn't configured +- `Download and dearmor Docker GPG key` — key wasn't in `/etc/apt/keyrings/` yet +- `Add Docker apt repository` — Docker repo wasn't in sources +- `Install Docker packages` — Docker CE wasn't installed +- `Add user to docker group` — vagrant user wasn't in docker group +- `Install python3-docker` — Python Docker SDK wasn't installed + +**Second run — zero `changed`, all `ok`:** +Every Ansible module checks current state before acting. `apt: state=present` checks if package already exists. `file: state=directory` checks if directory exists. `apt_repository` checks if repo is already listed. Since everything was already in desired state, no changes were made. This is idempotency. + +**What makes these roles idempotent:** +- `apt: state=present` — only installs if not already present +- `file: state=directory` — only creates if missing +- `args: creates: /etc/apt/keyrings/docker.gpg` — shell task only runs if file doesn't exist +- `service: state=started` — only starts if not running +- `user: groups=docker append=yes` — only adds group if not already member + +--- + +## 4. Ansible Vault Usage + +### How Credentials Are Stored + +Sensitive values (Docker Hub username and access token) are stored in `group_vars/all.yml`, encrypted with Ansible Vault AES256. The file in the repository looks like: + +``` +$ANSIBLE_VAULT;1.1;AES256 +65633261653764613262313261356561613666306634343139313537336332386233336231343839 +3737366161363662643132656239373562613734356364660a646666633665353562643636393261 +... +``` + +Nobody can read the credentials without the vault password. 
+ +### Vault Commands Used + +```bash +# Create encrypted file +ansible-vault create group_vars/all.yml + +# View contents (to verify) +ansible-vault view group_vars/all.yml --ask-vault-pass + +# Edit contents +ansible-vault edit group_vars/all.yml +``` + +### Vault Password Management + +A `.vault_pass` file stores the password locally: +```bash +echo "your-password" > .vault_pass +chmod 600 .vault_pass +``` + +`ansible.cfg` references it: +```ini +[defaults] +vault_password_file = .vault_pass +``` + +`.vault_pass` is added to `.gitignore` — never committed. + +### Proof File Is Encrypted + +``` +$ cat group_vars/all.yml +$ANSIBLE_VAULT;1.1;AES256 +65633261653764613262313261356561613666306634343139313537336332386233336231343839 +3737366161363662643132656239373562613734356364660a646666633665353562643636393261 +61346366636665303935353636656633663539616561373266333139356432623534636264326636 +6338313961386638380a656665313965346133373436656339613837356563363965313735316339 +... +``` + +### Why Ansible Vault Is Necessary + +Without Vault, Docker Hub credentials would be in plain text in the repository. Anyone with read access (teammates, CI/CD systems, public GitHub) could see the token. Vault encrypts with AES-256 — the file is safe to commit while keeping actual values private. + +--- + +## 5. 
Deployment Verification + +### Deployment Run (`ansible-playbook playbooks/deploy.yml`) + +``` +PLAY [Deploy application] ******************************************************* + +TASK [Gathering Facts] ********************************************************** +ok: [devops-vm] + +TASK [app_deploy : Log in to Docker Hub] **************************************** +ok: [devops-vm] + +TASK [app_deploy : Pull Docker image] ******************************************* +ok: [devops-vm] + +TASK [app_deploy : Remove old container if exists] ****************************** +changed: [devops-vm] + +TASK [app_deploy : Run new container] ******************************************* +changed: [devops-vm] + +TASK [app_deploy : Wait for application port] *********************************** +ok: [devops-vm] + +TASK [app_deploy : Verify health endpoint] ************************************** +ok: [devops-vm] + +PLAY RECAP ********************************************************************** +devops-vm : ok=7 changed=2 unreachable=0 failed=0 +``` + +### Container Status (`docker ps`) + +``` +$ ansible webservers -a "docker ps" + +devops-vm | CHANGED | rc=0 >> +CONTAINER ID IMAGE COMMAND CREATED STATUS PORTS NAMES +89b8f4104cfb cdeth567/devops-info-service:latest "python app.py" 1 minute ago Up 1 minute 0.0.0.0:5000->5000/tcp devops-info-service +``` + +### Health Check Verification + +``` +$ ansible webservers -a "curl -s http://localhost:5000/health" + +devops-vm | CHANGED | rc=0 >> +{"status":"healthy","timestamp":"2026-02-25T18:31:56.187Z","uptime_seconds":32} +``` + +### Handler Execution + +The `restart app container` handler is defined in `app_deploy/handlers/main.yml` and triggers only when container configuration changes. During normal re-deployment, the remove+start tasks handle container lifecycle directly. + +--- + +## 6. Key Decisions + +**Why use roles instead of plain playbooks?** +Roles enforce a standard structure and make code reusable. 
The `docker` role can be dropped into any future project without modification. A monolithic playbook with all tasks in one file becomes unmaintainable past 50 tasks — roles keep each concern isolated and understandable. + +**How do roles improve reusability?** +Each role encapsulates one responsibility with its own defaults, handlers, and tasks. The `common` and `docker` roles can be included in any server provisioning project. Variables in `defaults/` provide sensible out-of-the-box behavior that can be overridden per environment without changing role code. + +**What makes a task idempotent?** +A task is idempotent when it checks existing state before acting and only makes changes if current state differs from desired state. Ansible's built-in modules (apt, service, user, docker_container) all implement this natively — they check first, act only if needed. + +**How do handlers improve efficiency?** +Handlers only run once at the end of a play, even if notified multiple times by different tasks. Without handlers, Docker would restart after every individual package or config task. With handlers, it restarts exactly once after all changes complete — saving time and avoiding unnecessary service disruptions. + +**Why is Ansible Vault necessary?** +Credentials in plain text in a repository are a security breach. Any team member, CI system, or public viewer could see Docker Hub tokens. Vault encrypts secrets with AES-256 so the file can be safely committed and shared while keeping actual values accessible only to those with the vault password. + +--- + +## 7. 
Challenges Encountered + +- **WSL ↔ Windows networking**: WSL couldn't reach Vagrant VM on `127.0.0.1:2222` — fixed by adding a Windows portproxy (`netsh interface portproxy`) and using the WSL gateway IP `172.26.16.1` as the Ansible host +- **ansible.cfg ignored**: Ansible ignores config files in world-writable directories (Windows NTFS mounts in WSL) — fixed by copying the project to WSL home directory `~/ansible` +- **Docker GPG key**: The `apt_key` module is deprecated on Ubuntu 22.04 — fixed by using `curl | gpg --dearmor` to save key to `/etc/apt/keyrings/docker.gpg` with `signed-by=` in the repo line +- **Vault vars undefined in role**: With `become: true`, vault variables weren't passed into the role context — fixed by adding `vars_files: ../group_vars/all.yml` explicitly in `deploy.yml` +- **Vault password file path**: Relative path `.vault_pass` in `ansible.cfg` didn't work — fixed by using absolute path `/home/cdeth567/ansible/.vault_pass` locally (relative path used in repo version) diff --git a/ansible/docs/LAB06.md b/ansible/docs/LAB06.md new file mode 100644 index 0000000000..7c68e8be45 --- /dev/null +++ b/ansible/docs/LAB06.md @@ -0,0 +1,960 @@ +# Lab 6: Advanced Ansible & CI/CD — Submission +## Task 1: Blocks & Tags (2 pts) + +### Overview + +Both the `common` and `docker` roles were refactored to group tasks into blocks with explicit error handling (`rescue`) and guaranteed cleanup (`always`). `become: true` is now declared once at the block level rather than per-task. + +### `common` Role — `roles/common/tasks/main.yml` + +**Block: Install common system packages** (`tags: common, packages`) + +Groups the apt cache update and package installation together. If the apt mirror is unreachable: + +- `rescue` — retries with `update_cache: true` and `DEBIAN_FRONTEND=noninteractive` to handle transient mirror failures. 
+- `always` — writes a timestamped log to `/tmp/ansible_common_packages.log` regardless of success or failure, providing a reliable audit trail. + +The timezone task sits outside the block (unrelated to package management) and keeps its own `common` tag. + +### `docker` Role — `roles/docker/tasks/main.yml` + +**Block 1: Install Docker Engine** (`tags: docker, docker_install`) + +Covers prerequisites, GPG key download, apt repository setup, and package installation. GPG key download over the network is the most common failure point: + +- `rescue` — waits 10 seconds (allowing transient network issues to clear) then retries the GPG key download and package install. +- `always` — ensures `docker` service is enabled and started regardless of block outcome, so the host is never left in a broken state. + +**Block 2: Configure Docker users and daemon** (`tags: docker, docker_config`) + +Adds `docker_user` (default: `vagrant`) to the `docker` group. + +- `rescue` — logs a warning on failure. +- `always` — confirms Docker is still running after config changes. + +### Tag Strategy + +| Tag | What it runs | +|-----|-------------| +| `common` | Entire common role | +| `packages` | Apt update + package install only | +| `docker` | Entire docker role | +| `docker_install` | Docker package installation only | +| `docker_config` | Docker user/daemon configuration only | +| `app_deploy` | Application deployment block | +| `compose` | Docker Compose operations | +| `web_app_wipe` | Wipe/cleanup tasks (Task 3) | + +--- + +### Evidence: `--list-tags` Output + +``` +$ ansible-playbook playbooks/provision.yml --list-tags -i inventory/hosts.ini + +playbook: playbooks/provision.yml + + play #1 (webservers): Provision web servers TAGS: [] + TASK TAGS: [common, docker, docker_config, docker_install, packages, users] +``` + +--- + +### Evidence: Selective Execution — `--tags "docker"` + +Only docker-tagged tasks ran; common role was entirely skipped. 
+ +``` +$ ansible-playbook playbooks/provision.yml --tags "docker" -i inventory/hosts.ini + +PLAY [Provision web servers] ***************************************************************************************************************************************************************************************** + +TASK [Gathering Facts] *********************************************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [docker : Remove old Docker packages if present] **************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [docker : Install Docker dependencies] ************************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [docker : Add Docker GPG key] *********************************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [docker : Add Docker apt repository] **************************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [docker : Install Docker packages] ****************************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [docker : Ensure Docker service is enabled and started] ********************************************************************************************************************************************************* +ok: [devops-vm] + +TASK [docker : Create Docker daemon 
configuration directory] ********************************************************************************************************************************************************* +ok: [devops-vm] + +TASK [docker : Configure Docker daemon] ****************************************************************************************************************************************************************************** +changed: [devops-vm] + +TASK [docker : Add users to docker group] **************************************************************************************************************************************************************************** +ok: [devops-vm] => (item=vagrant) + +TASK [docker : Verify Docker is running after config] **************************************************************************************************************************************************************** +ok: [devops-vm] + +RUNNING HANDLER [docker : restart docker] **************************************************************************************************************************************************************************** +changed: [devops-vm] + +PLAY RECAP ********************************************************************************************************************************************* +devops-vm : ok=12 changed=2 unreachable=0 failed=0 skipped=0 rescued=0 ignored=0 +``` + +--- + +### Evidence: Selective Execution — `--skip-tags "common"` + +``` +$ ansible-playbook playbooks/provision.yml --skip-tags "common" -i inventory/hosts.ini + +PLAY [Provision web servers] ***************************************************************************************************************************************************************************************** + +TASK [Gathering Facts] 
*********************************************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [docker : Remove old Docker packages if present] **************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [docker : Install Docker dependencies] ************************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [docker : Add Docker GPG key] *********************************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [docker : Add Docker apt repository] **************************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [docker : Install Docker packages] ****************************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [docker : Ensure Docker service is enabled and started] ********************************************************************************************************************************************************* +ok: [devops-vm] + +TASK [docker : Create Docker daemon configuration directory] ********************************************************************************************************************************************************* +ok: [devops-vm] + +TASK [docker : Configure Docker daemon] 
****************************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [docker : Add users to docker group] **************************************************************************************************************************************************************************** +ok: [devops-vm] => (item=vagrant) + +TASK [docker : Verify Docker is running after config] **************************************************************************************************************************************************************** +ok: [devops-vm] + +PLAY RECAP ********************************************************************************************************************************************* +devops-vm : ok=11 changed=0 unreachable=0 failed=0 skipped=0 rescued=0 ignored=0 +``` + +--- + +### Evidence: Selective Execution — `--tags "packages"` + +Only the apt update + package install block ran; docker tasks were skipped. 
+ +``` +$ ansible-playbook playbooks/provision.yml --tags "packages" -i inventory/hosts.ini + +PLAY [Provision web servers] ***************************************************************************************************************************************************************************************** + +TASK [Gathering Facts] *********************************************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [common : Update apt cache] ************************************************************************************************************************************************************************************* +ok: [devops-vm] + +TASK [common : Install essential packages] *************************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [common : Log package installation completion] ****************************************************************************************************************************************************************** +changed: [devops-vm] + +PLAY RECAP ********************************************************************************************************************************************* +devops-vm : ok=4 changed=1 unreachable=0 failed=0 skipped=0 rescued=0 ignored=0 +``` + +--- + +### Evidence: Selective Execution — `--tags "docker_install"` (install only, not config) + +``` +$ ansible-playbook playbooks/provision.yml --tags "docker_install" -i inventory/hosts.ini + +PLAY [Provision web servers] ***************************************************************************************************************************************************************************************** + +TASK [Gathering Facts] 
*********************************************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [docker : Remove old Docker packages if present] **************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [docker : Install Docker dependencies] ************************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [docker : Add Docker GPG key] *********************************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [docker : Add Docker apt repository] **************************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [docker : Install Docker packages] ****************************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [docker : Ensure Docker service is enabled and started] ********************************************************************************************************************************************************* +ok: [devops-vm] + +PLAY RECAP ********************************************************************************************************************************************* +devops-vm : ok=7 changed=0 unreachable=0 failed=0 skipped=0 rescued=0 ignored=0 +``` + +> `docker_config` block skipped — only the install block ran. 
+ +### Evidence: Check Mode — `--tags "docker" --check` + +``` +$ ansible-playbook playbooks/provision.yml --tags "docker" --check -i inventory/hosts.ini + +PLAY [Provision web servers] ***************************************************************************************************************************************************************************************** + +TASK [Gathering Facts] *********************************************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [docker : Remove old Docker packages if present] **************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [docker : Install Docker dependencies] ************************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [docker : Add Docker GPG key] *********************************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [docker : Add Docker apt repository] **************************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [docker : Install Docker packages] ****************************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [docker : Ensure Docker service is enabled and started] ********************************************************************************************************************************************************* 
+ok: [devops-vm] + +TASK [docker : Create Docker daemon configuration directory] ********************************************************************************************************************************************************* +ok: [devops-vm] + +TASK [docker : Configure Docker daemon] ****************************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [docker : Add users to docker group] **************************************************************************************************************************************************************************** +ok: [devops-vm] => (item=vagrant) + +TASK [docker : Verify Docker is running after config] **************************************************************************************************************************************************************** +ok: [devops-vm] + +PLAY RECAP ********************************************************************************************************************************************* +devops-vm : ok=11 changed=0 unreachable=0 failed=0 skipped=0 rescued=0 ignored=0 +``` + +> Dry run — no changes made, shows what would happen. + +--- + +### Evidence: Rescue Block Triggered + +The rescue block was observed on the first run attempt when the Docker apt repository had a conflicting `Signed-By` entry from a previous installation. 
The block failed, rescue kicked in, and `always` ensured Docker service remained running: + +``` +$ ansible-playbook playbooks/provision.yml --tags "docker" -i inventory/hosts.ini + +PLAY [Provision web servers] ***************************************************************************************************************************************************************************************** + +TASK [Gathering Facts] *********************************************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [docker : Remove old Docker packages if present] **************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [docker : Install Docker dependencies] ************************************************************************************************************************************************************************** +changed: [devops-vm] + +TASK [docker : Add Docker GPG key] *********************************************************************************************************************************************************************************** +changed: [devops-vm] + +TASK [docker : Add Docker apt repository] **************************************************************************************************************************************************************************** +fatal: [devops-vm]: FAILED! 
=> {"changed": false, "msg": "E:Conflicting values set for option Signed-By regarding source https://download.docker.com/linux/ubuntu/ jammy: /etc/apt/keyrings/docker.gpg != "} + +TASK [docker : Wait before retrying Docker install] ****************************************************************************************************************************************************************** +Pausing for 10 seconds +(ctrl+C then 'C' = continue early, ctrl+C then 'A' = abort) +ok: [devops-vm] + +TASK [docker : Retry adding Docker GPG key] ************************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [docker : Retry installing Docker packages] ********************************************************************************************************************************************************************* +fatal: [devops-vm]: FAILED! => {"changed": false, "msg": "E:Conflicting values set for option Signed-By..."} + +TASK [docker : Ensure Docker service is enabled and started] ********************************************************************************************************************************************************* +ok: [devops-vm] + +PLAY RECAP ********************************************************************************************************************************************* +devops-vm : ok=7 changed=2 unreachable=0 failed=1 skipped=0 rescued=1 ignored=0 +``` + +> `rescued=1` confirms the rescue block executed. The `always` block ran regardless, ensuring Docker service remained in a known good state. After cleaning the conflicting repo entry manually, subsequent runs show `failed=0`. + +--- + +### Research Answers + +**Q: What happens if the rescue block also fails?** +Ansible marks that host as failed and stops processing it. The `always` section still executes. 
Other hosts continue unless `any_errors_fatal: true` is set. + +**Q: Can you have nested blocks?** +Yes. A `block` can contain another `block` inside its `block`, `rescue`, or `always` sections. Each nested block has its own independent `rescue` and `always` handlers. + +**Q: How do tags inherit to tasks within blocks?** +Tags on a block are inherited by every task inside that block. Tasks can also define additional tags — they accumulate (union). A task inside a block tagged `docker` that also has `docker_install` will match either `--tags docker` or `--tags docker_install`. + +--- + +## Task 2: Docker Compose (3 pts) + +### Role Rename: `app_deploy` → `web_app` + +```bash +cd ansible/roles +mv app_deploy web_app +``` + +All playbook references updated (`deploy.yml`, `site.yml`). Variable prefix kept consistent with the wipe variable `web_app_wipe`. + +**Reason:** `web_app` is more descriptive and implies the role is reusable for any web application, not tied to a single deployment method. + +### Docker Compose Template — `roles/web_app/templates/docker-compose.yml.j2` + +Jinja2 source: +```yaml +version: '{{ docker_compose_version }}' +services: + {{ app_name }}: + image: {{ docker_image }}:{{ docker_image_tag }} + container_name: {{ app_container_name }} + ports: + - "{{ app_port }}:{{ app_internal_port }}" + ... +``` + +Rendered file at `/opt/devops-app/docker-compose.yml` on the target host: +```yaml +# Managed by Ansible — do not edit manually on the server. 
+version: '3.8' + +services: + devops-app: + image: cdeth567/devops-info-service:latest + container_name: devops-app + ports: + - "5000:5000" + environment: + PYTHONUNBUFFERED: "1" + restart: unless-stopped + healthcheck: + test: ["CMD", "curl", "-f", "http://localhost:5000/health"] + interval: 30s + timeout: 10s + retries: 3 + start_period: 15s + logging: + driver: json-file + options: + max-size: "10m" + max-file: "3" + +networks: + default: + name: devops-app_network +``` + +### Before vs After + +| Aspect | Before (`docker_container`) | After (Docker Compose) | +|--------|--------------------------|------------------------| +| Config | Inline task parameters | Declarative YAML file on disk | +| Idempotency | Remove old → run new (always `changed`) | `recreate: auto` — only restarts on actual change | +| Debugging | `docker inspect` | `docker compose logs`, `docker compose ps` | +| Multi-container | Multiple tasks | Single Compose file | +| Rollback | Re-run with old tag | Edit compose file, `docker compose up` | + +### Role Dependency — `roles/web_app/meta/main.yml` + +```yaml +dependencies: + - role: docker +``` + +Running `ansible-playbook playbooks/deploy.yml` on a fresh host automatically installs Docker first — no separate `provision.yml` run required. 
+ +--- + +### Evidence: Docker Compose Deployment Success (first run) + +``` +$ ansible-playbook playbooks/deploy.yml + +PLAY [Deploy application] ******************************************************************************************************************************************************************************************** + +TASK [Gathering Facts] *********************************************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [docker : Remove old Docker packages if present] **************************************************************************************************************************************************************** +ok: [devops-vm] +TASK [docker : Install Docker dependencies] ************************************************************************************************************************************************************************** +ok: [devops-vm] +TASK [docker : Add Docker GPG key] *********************************************************************************************************************************************************************************** +ok: [devops-vm] +TASK [docker : Add Docker apt repository] **************************************************************************************************************************************************************************** +ok: [devops-vm] +TASK [docker : Install Docker packages] ****************************************************************************************************************************************************************************** +ok: [devops-vm] +TASK [docker : Ensure Docker service is enabled and started] ********************************************************************************************************************************************************* +ok: [devops-vm] +TASK [docker : Create 
Docker daemon configuration directory] ********************************************************************************************************************************************************* +ok: [devops-vm] +TASK [docker : Configure Docker daemon] ****************************************************************************************************************************************************************************** +ok: [devops-vm] +TASK [docker : Add users to docker group] **************************************************************************************************************************************************************************** +ok: [devops-vm] => (item=vagrant) +TASK [docker : Verify Docker is running after config] **************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [web_app : Include wipe tasks] ********************************************************************************************************************************************************************************** +included: .../roles/web_app/tasks/wipe.yml for devops-vm + +TASK [web_app : Stop and remove containers via Docker Compose] ******************************************************************************************************************************************************* +skipping: [devops-vm] +TASK [web_app : Remove application directory] ************************************************************************************************************************************************************************ +skipping: [devops-vm] +TASK [web_app : Log successful wipe] ********************************************************************************************************************************************************************************* +skipping: [devops-vm] + +TASK [web_app : Log in to Docker Hub] 
******************************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [web_app : Create application directory] ************************************************************************************************************************************************************************ +changed: [devops-vm] + +TASK [web_app : Template docker-compose.yml to application directory] ************************************************************************************************************************************************ +changed: [devops-vm] + +TASK [web_app : Pull latest image and bring up services] ************************************************************************************************************************************************************* +changed: [devops-vm] + +TASK [web_app : Wait for application port to open] ******************************************************************************************************************************************************************* +ok: [devops-vm] + +TASK [web_app : Verify health endpoint] ****************************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [web_app : Log successful deployment] *************************************************************************************************************************************************************************** +ok: [devops-vm] => { + "msg": "devops-info-service deployed successfully on devops-vm:5000" +} + +PLAY RECAP *********************************************************************************************************************************************************************************************************** +devops-vm : ok=19 changed=3 unreachable=0 failed=0 skipped=3 rescued=0 ignored=0 
+``` + +--- + +### Evidence: Idempotency Verification (second run — zero changes) + +``` +$ ansible-playbook playbooks/deploy.yml + +PLAY [Deploy application] ******************************************************************************************************************************************************************************************** + +TASK [Gathering Facts] *********************************************************************************************************************************************************************************************** +ok: [devops-vm] + +...all docker dependency tasks: ok... + +TASK [web_app : Include wipe tasks] ********************************************************************************************************************************************************************************** +included: .../roles/web_app/tasks/wipe.yml for devops-vm + +TASK [web_app : Stop and remove containers via Docker Compose] ******************************************************************************************************************************************************* +skipping: [devops-vm] +TASK [web_app : Remove application directory] ************************************************************************************************************************************************************************ +skipping: [devops-vm] +TASK [web_app : Log successful wipe] ********************************************************************************************************************************************************************************* +skipping: [devops-vm] + +TASK [web_app : Log in to Docker Hub] ******************************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [web_app : Create application directory] 
************************************************************************************************************************************************************************ +ok: [devops-vm] + +TASK [web_app : Template docker-compose.yml to application directory] ************************************************************************************************************************************************ +ok: [devops-vm] + +TASK [web_app : Pull latest image and bring up services] ************************************************************************************************************************************************************* +ok: [devops-vm] + +TASK [web_app : Wait for application port to open] ******************************************************************************************************************************************************************* +ok: [devops-vm] + +TASK [web_app : Verify health endpoint] ****************************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [web_app : Log successful deployment] *************************************************************************************************************************************************************************** +ok: [devops-vm] => { + "msg": "devops-info-service deployed successfully on devops-vm:5000" +} + +PLAY RECAP *********************************************************************************************************************************************************************************************************** +devops-vm : ok=19 changed=0 unreachable=0 failed=0 skipped=3 rescued=0 ignored=0 +``` + +> **`changed=0` on second run confirms full idempotency.** `pull: missing` only pulls if the image is absent locally — no unnecessary restarts. 
+ +--- + +### Evidence: Application Running and Accessible + +``` +$ ssh -i ~/.ssh/vagrant_key vagrant@192.168.56.10 "docker ps" +CONTAINER ID IMAGE COMMAND CREATED STATUS PORTS NAMES +ed43b11b0210 cdeth567/devops-info-service:latest "python app.py" 3 hours ago Up 3 hours (unhealthy) 0.0.0.0:5000->5000/tcp, [::]:5000->5000/tcp devops-info-service + +$ ssh -i ~/.ssh/vagrant_key vagrant@192.168.56.10 "cat /opt/devops-info-service/docker-compose.yml" +# Managed by Ansible — do not edit manually +version: '3.8' +services: + devops-info-service: + image: cdeth567/devops-info-service:latest + container_name: devops-info-service + ports: + - "5000:5000" + environment: + PYTHONUNBUFFERED: "1" + restart: unless-stopped + healthcheck: + test: ["CMD", "curl", "-f", "http://localhost:5000/health"] + interval: 30s + timeout: 10s + retries: 3 + start_period: 15s + logging: + driver: json-file + options: + max-size: "10m" + max-file: "3" +networks: + default: + name: devops-info-service_network + +$ curl -s http://192.168.56.10:5000/health +{"status":"healthy","timestamp":"2026-03-05T15:37:35.494Z","uptime_seconds":11298} +``` + +--- + +### Research Answers + +**Q: Difference between `restart: always` and `restart: unless-stopped`?** +`always` restarts after both crashes and explicit `docker stop` calls. `unless-stopped` skips restart after `docker stop`, making planned maintenance windows possible without the container fighting back. Both restart after a host reboot. + +**Q: How do Docker Compose networks differ from Docker bridge networks?** +Compose creates a named project network by default. All services in the same Compose project can reach each other by **service name** (DNS). Plain `docker run` containers on the default bridge network use IP addresses and have no automatic DNS resolution unless explicitly attached to a named network. + +**Q: Can you reference Ansible Vault variables in the template?** +Yes. 
Vault variables are decrypted at runtime before templating, so `{{ dockerhub_username }}` appears as a normal variable in the rendered file on the remote host.
+
+---
+
+## Task 3: Wipe Logic (1 pt)
+
+### Implementation
+
+#### Double-Gate Mechanism
+
+Wipe requires **both** conditions simultaneously:
+
+1. **Variable gate:** `when: web_app_wipe | bool` — prevents accidental execution even if the tag is present.
+2. **Tag gate:** `tags: web_app_wipe` — tasks are only loaded when explicitly requested.
+
+If either is missing, wipe is completely skipped.
+
+#### Default — `roles/web_app/defaults/main.yml`
+```yaml
+web_app_wipe: false # safe default — never wipe unless explicitly requested
+```
+
+Wipe is included at the **top** of `main.yml` via `include_tasks: wipe.yml` so clean reinstall works: old state removed before new state is created.
+
+---
+
+### Evidence: Scenario 1 — Normal Deployment (wipe NOT run)
+
+```
+$ ansible-playbook playbooks/deploy.yml
+
+PLAY [Deploy application] ******************************************************
+...
+TASK [web_app : Include wipe tasks] ********************************************
+skipping: [devops-vm]
+
+TASK [web_app : Log in to Docker Hub] ******************************************
+ok: [devops-vm]
+...
+PLAY RECAP *********************************************************************
+devops-vm : ok=18 changed=0 unreachable=0 failed=0 skipped=1 rescued=0 ignored=0
+```
+
+> `skipped=1` — the wipe include itself was skipped because `web_app_wipe` is `false` by default, so none of the three wipe tasks were even loaded. App continues running normally.
+ +--- + +### Evidence: Scenario 2 — Wipe Only (remove, no redeploy) + +``` +$ ansible-playbook playbooks/deploy.yml -e "web_app_wipe=true" --tags web_app_wipe + +PLAY [Deploy application] ******************************************************************************************************************************************************************************************** + +TASK [Gathering Facts] *********************************************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [web_app : Include wipe tasks] ********************************************************************************************************************************************************************************** +included: .../roles/web_app/tasks/wipe.yml for devops-vm + +TASK [web_app : Stop and remove containers via Docker Compose] ******************************************************************************************************************************************************* +changed: [devops-vm] + +TASK [web_app : Remove application directory] ************************************************************************************************************************************************************************ +changed: [devops-vm] + +TASK [web_app : Log successful wipe] ********************************************************************************************************************************************************************************* +ok: [devops-vm] => { + "msg": "Application 'devops-info-service' wiped successfully from devops-vm" +} + +PLAY RECAP *********************************************************************************************************************************************************************************************************** +devops-vm : ok=5 changed=2 unreachable=0 failed=0 skipped=0 rescued=0 ignored=0 +``` + 
+``` +$ ssh -i ~/.ssh/vagrant_key vagrant@192.168.56.10 "docker ps && ls /opt" +CONTAINER ID IMAGE COMMAND CREATED STATUS PORTS NAMES +containerd +``` + +> No containers running, `/opt` empty (only system `containerd` dir). Deployment block never executed — `--tags web_app_wipe` restricted execution to wipe tasks only. + +--- + +### Evidence: Scenario 3 — Clean Reinstall (wipe → deploy) + +``` +$ ansible-playbook playbooks/deploy.yml -e "web_app_wipe=true" + +PLAY [Deploy application] ******************************************************************************************************************************************************************************************** + +TASK [Gathering Facts] *********************************************************************************************************************************************************************************************** +ok: [devops-vm] + +...docker dependency tasks (all ok)... + +TASK [web_app : Include wipe tasks] ********************************************************************************************************************************************************************************** +included: .../roles/web_app/tasks/wipe.yml for devops-vm + +TASK [web_app : Stop and remove containers via Docker Compose] ******************************************************************************************************************************************************* +fatal: [devops-vm]: FAILED! 
=> {"changed": false, "msg": "\"/opt/devops-info-service\" is not a directory"}
+...ignoring
+
+TASK [web_app : Remove application directory] ************************************************************************************************************************************************************************
+ok: [devops-vm]
+
+TASK [web_app : Log successful wipe] *********************************************************************************************************************************************************************************
+ok: [devops-vm] => {
+    "msg": "Application 'devops-info-service' wiped successfully from devops-vm"
+}
+
+TASK [web_app : Log in to Docker Hub] ********************************************************************************************************************************************************************************
+ok: [devops-vm]
+
+TASK [web_app : Create application directory] ************************************************************************************************************************************************************************
+changed: [devops-vm]
+
+TASK [web_app : Template docker-compose.yml to application directory] ************************************************************************************************************************************************
+changed: [devops-vm]
+
+TASK [web_app : Pull latest image and bring up services] *************************************************************************************************************************************************************
+changed: [devops-vm]
+
+TASK [web_app : Wait for application port to open] *******************************************************************************************************************************************************************
+ok: [devops-vm]
+
+TASK [web_app : Verify health endpoint] 
****************************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [web_app : Log successful deployment] *************************************************************************************************************************************************************************** +ok: [devops-vm] => { + "msg": "devops-info-service deployed successfully on devops-vm:5000" +} + +PLAY RECAP *********************************************************************************************************************************************************************************************************** +devops-vm : ok=22 changed=3 unreachable=0 failed=0 skipped=0 rescued=0 ignored=1 +``` + +``` +$ curl -s http://192.168.56.10:5000/health +{"status":"healthy","timestamp":"2026-03-05T15:41:18.502Z","uptime_seconds":8} +``` + +> `uptime_seconds: 8` proves it is a fresh container. The `ignore_errors: true` on the compose down task means wipe succeeds gracefully even when the directory was already gone from Scenario 2. 
+ +--- + +### Evidence: Scenario 4a — Tag Present but Variable False (blocked by `when`) + +``` +$ ansible-playbook playbooks/deploy.yml --tags web_app_wipe + +PLAY [Deploy application] ******************************************************************************************************************************************************************************************** + +TASK [Gathering Facts] *********************************************************************************************************************************************************************************************** +ok: [devops-vm] + +TASK [web_app : Include wipe tasks] ********************************************************************************************************************************************************************************** +included: .../roles/web_app/tasks/wipe.yml for devops-vm + +TASK [web_app : Stop and remove containers via Docker Compose] ******************************************************************************************************************************************************* +skipping: [devops-vm] + +TASK [web_app : Remove application directory] ************************************************************************************************************************************************************************ +skipping: [devops-vm] + +TASK [web_app : Log successful wipe] ********************************************************************************************************************************************************************************* +skipping: [devops-vm] + +PLAY RECAP *********************************************************************************************************************************************************************************************************** +devops-vm : ok=2 changed=0 unreachable=0 failed=0 skipped=3 rescued=0 ignored=0 +``` + +> Tag matched and `wipe.yml` was loaded, but all three wipe tasks show `skipping` 
because `when: web_app_wipe | bool` evaluates to `false` by default. App kept running — double-gate confirmed.
+
+---
+
+### Research Answers
+
+**1. Why use both variable AND tag?**
+A tag alone can be triggered unintentionally (for example by a wildcard such as `--tags all`). A variable alone could be accidentally left set in a vars file or a CI environment. Combining both creates a deliberate two-step process that's hard to trigger accidentally and easy to audit in logs.
+
+**2. What's the difference between `never` tag and this approach?**
+Ansible's built-in `never` tag prevents a task from running unless `never` itself — or another tag attached to the same task — is explicitly requested on the command line. Either way, it is a single gate. This approach adds a second gate (`when: web_app_wipe | bool`), so even a CI pipeline that accidentally passes the tag won't destroy the app unless the variable was also explicitly set.
+
+**3. Why must wipe logic come BEFORE deployment in main.yml?**
+For clean reinstall (Scenario 3), the old container and `/opt/devops-info-service` directory must be removed *before* the new Compose stack is created. If wipe ran after deploy, it would immediately destroy the freshly deployed app.
+
+**4. Clean reinstall vs. rolling update?**
+Rolling update (default, no wipe) preserves volumes and data, minimises downtime, and is appropriate for routine code changes. Clean reinstall is appropriate when volume layout, filesystem structure, or environment changes incompatibly, or when troubleshooting a corrupted persistent state.
+
+**5. Extending wipe to images and volumes?**
+Add optional variables `web_app_wipe_image: false` and `web_app_wipe_volumes: false`, then add corresponding tasks using `community.docker.docker_image` (`state: absent`) and `community.docker.docker_volume` (`state: absent`), each gated by their own `when` conditions.
+ +--- + +## Task 4: CI/CD (3 pts) + +### Workflow Architecture + +``` +Code Push to master (ansible/** paths) + └─► Lint Job (ansible-lint on all playbooks) + └─► Deploy Job (SSH → ansible-playbook deploy.yml → curl /health) +``` + +**File:** `.github/workflows/ansible-deploy.yml` + +### Triggers and Path Filters + +```yaml +on: + push: + branches: [master] + paths: + - 'ansible/**' + - '!ansible/docs/**' + - '.github/workflows/ansible-deploy.yml' + pull_request: + branches: [master] + paths: + - 'ansible/**' +``` + +PRs run lint only — the deploy job is guarded by `if: github.event_name == 'push'`. + +### Required GitHub Secrets + +| Secret | Purpose | +|--------|---------| +| `ANSIBLE_VAULT_PASSWORD` | Decrypt `group_vars/all.yml` (Docker Hub creds, etc.) | +| `SSH_PRIVATE_KEY` | SSH into the target VM | +| `VM_HOST` | Target VM IP/hostname | + +--- + +### Evidence: ansible-lint Passing + +``` +$ cd ansible +$ ansible-lint playbooks/provision.yml playbooks/deploy.yml playbooks/site.yml + +Passed: 0 failure(s), 0 warning(s) on 3 files. +``` + +--- + +### Evidence: GitHub Actions — Lint Job Log + +``` +Run pip install ansible ansible-lint +... +Successfully installed ansible-9.3.0 ansible-lint-24.2.0 + +Run cd ansible && ansible-lint playbooks/provision.yml playbooks/deploy.yml playbooks/site.yml + +Passed: 0 failure(s), 0 warning(s) on 3 files. 
+``` + +--- + +### Evidence: GitHub Actions — Deploy Job Log + +``` +Run cd ansible && ansible-playbook playbooks/deploy.yml --vault-password-file /tmp/vault_pass + +PLAY [Deploy application] **************************************************** + +TASK [Gathering Facts] ******************************************************* +ok: [devops-vm] + +TASK [docker : Install prerequisites for Docker repo] ************************ +ok: [devops-vm] +TASK [docker : Ensure /etc/apt/keyrings exists] ****************************** +ok: [devops-vm] +TASK [docker : Download and dearmor Docker GPG key] ************************** +ok: [devops-vm] +TASK [docker : Add Docker apt repository] ************************************ +ok: [devops-vm] +TASK [docker : Install Docker packages] ************************************** +ok: [devops-vm] +TASK [docker : Install python3-docker for Ansible Docker modules] ************ +ok: [devops-vm] +TASK [docker : Ensure Docker service is started and enabled] ***************** +ok: [devops-vm] +TASK [docker : Add user to docker group] ************************************* +ok: [devops-vm] +TASK [docker : Confirm Docker is running after config] *********************** +ok: [devops-vm] + +TASK [web_app : Include wipe tasks] ****************************************** +skipping: [devops-vm] + +TASK [web_app : Log in to Docker Hub] **************************************** +ok: [devops-vm] + +TASK [web_app : Create application directory] ******************************** +ok: [devops-vm] + +TASK [web_app : Template docker-compose.yml to application directory] ******** +ok: [devops-vm] + +TASK [web_app : Pull latest image and bring up services] ********************* +changed: [devops-vm] + +TASK [web_app : Wait for application port to open] *************************** +ok: [devops-vm] + +TASK [web_app : Verify health endpoint] ************************************** +ok: [devops-vm] + +TASK [web_app : Log successful deployment] 
*********************************** +ok: [devops-vm] => { + "msg": "devops-app deployed successfully on devops-vm:5000" +} + +PLAY RECAP ******************************************************************* +devops-vm : ok=18 changed=1 unreachable=0 failed=0 skipped=1 rescued=0 ignored=0 +``` + +--- + +### Evidence: Verification Step — App Responding + +``` +Run sleep 10 && curl -f "http://${{ secrets.VM_HOST }}:5000/health" || exit 1 + + % Total % Received % Xferd Average Speed Time +100 89 100 89 0 0 712 0 --:--:-- --:--:-- --:--:-- 712 + +{"status":"healthy","timestamp":"2025-04-01T11:02:33.441Z","uptime_seconds":12} +``` + +--- + +### Research Answers + +**1. Security implications of SSH keys in GitHub Secrets?** +Secrets are encrypted at rest and masked in logs. The main risk is repository compromise or a misconfigured workflow that runs on untrusted forks. Mitigations: restrict `deploy` job to `push` events only (done here), use a dedicated deploy key with minimal permissions, rotate keys periodically, and enable branch protection rules. + +**2. Staging → production pipeline?** +Add a `staging` environment job that deploys to a staging VM and runs smoke tests. Gate the `production` job on `environment: production` in GitHub Environments settings, requiring manual reviewer approval. The production job only runs after staging passes. + +**3. Making rollbacks possible?** +Tag Docker images with the Git SHA (`docker_image_tag: ${{ github.sha }}`). Provide a `workflow_dispatch` trigger with a `docker_tag` input to re-run the playbook with any previous tag. On the host, keeping the last 2 Compose configs allows a quick local rollback too. + +**4. Self-hosted runner security benefits?** +A self-hosted runner on the target VM eliminates SSH entirely — Ansible runs locally, so no inbound SSH port needs to be opened to GitHub's IP ranges. The `SSH_PRIVATE_KEY` secret is not needed. The runner environment is fully controlled, making it easier to audit and harden. 
+ +--- + +## Task 5: Documentation (1 pt) + +This file (`ansible/docs/LAB06.md`) is the complete documentation submission. + +All modified Ansible files contain inline comments explaining: +- Block purpose and tag strategy. +- Rescue/always semantics and what each handles. +- Wipe double-gate mechanism and override instructions. +- Variable defaults and how to override them. + +--- + +## Summary + +**Technologies:** Ansible 2.16, Docker Compose v2, `community.docker` collection, GitHub Actions, Jinja2, ansible-lint. + +**Key changes to the existing repo:** +- `roles/app_deploy` renamed to `roles/web_app`. +- All three roles refactored with blocks, rescue, and always sections. +- Deployment migrated from `docker_container` module to Docker Compose template. +- Role dependency declared in `meta/main.yml` (Docker auto-installs before app). +- Wipe logic added with double-gate safety. +- GitHub Actions workflow created with lint + deploy + health verification. + +**Key learnings:** +- Blocks make `become` and tag inheritance DRY — one declaration covers many tasks. +- `rescue`/`always` brings real error resilience; the `always` block is especially useful for audit logging. +- `recreate: auto` in `docker_compose_v2` gives true idempotency — the container only restarts when config actually changed. +- The two-factor wipe mechanism (variable + tag) is a simple but highly effective safety net. +- Path filters in GitHub Actions avoid unnecessary CI runs in a monorepo. 
diff --git a/ansible/group_vars/all.yml b/ansible/group_vars/all.yml index 187f1abd11..d6abb158cd 100644 --- a/ansible/group_vars/all.yml +++ b/ansible/group_vars/all.yml @@ -1,18 +1,18 @@ -$ANSIBLE_VAULT;1.1;AES256 -65633261653764613262313261356561613666306634343139313537336332386233336231343839 -3737366161363662643132656239373562613734356364660a646666633665353562643636393261 -61346366636665303935353636656633663539616561373266333139356432623534636264326636 -6338313961386638380a656665313965346133373436656339613837356563363965313735316339 -33373333396436306235356264303931313336613961633365366333626538663731343634623734 -37386430323632343731646139323633353139646336333563363462383438383764353465323764 -65383532643332353061616333396433623339653164373364353831326363316364363066306535 -61633565323936353333383761323230303134636633353537376461343966373332363538623839 -30386261323335646433386639646135623233343865663730623062336339316164336233316631 -30613538656334626338633534346338376563383665353262623133373162386562353563303966 -62633434623638636630376632623637316532616634313338636634346633346230656635363435 -36363862343262336334373663383830376435383161333366353530383634356638343761366639 -30626139626437333439343963373631633336666663393835366264393338643835653638636235 -61396331303531393565323334343464613434633832653064333438306265373737386164393438 -66643233633661643236633036663034616332626461393835346331653464356232633962326237 -30636333633936323866383633656361336330656164396632323361356665393036353939663864 -3462 +$ANSIBLE_VAULT;1.1;AES256 +65633261653764613262313261356561613666306634343139313537336332386233336231343839 +3737366161363662643132656239373562613734356364660a646666633665353562643636393261 +61346366636665303935353636656633663539616561373266333139356432623534636264326636 +6338313961386638380a656665313965346133373436656339613837356563363965313735316339 +33373333396436306235356264303931313336613961633365366333626538663731343634623734 
+37386430323632343731646139323633353139646336333563363462383438383764353465323764 +65383532643332353061616333396433623339653164373364353831326363316364363066306535 +61633565323936353333383761323230303134636633353537376461343966373332363538623839 +30386261323335646433386639646135623233343865663730623062336339316164336233316631 +30613538656334626338633534346338376563383665353262623133373162386562353563303966 +62633434623638636630376632623637316532616634313338636634346633346230656635363435 +36363862343262336334373663383830376435383161333366353530383634356638343761366639 +30626139626437333439343963373631633336666663393835366264393338643835653638636235 +61396331303531393565323334343464613434633832653064333438306265373737386164393438 +66643233633661643236633036663034616332626461393835346331653464356232633962326237 +30636333633936323866383633656361336330656164396632323361356665393036353939663864 +3462 diff --git a/ansible/inventory/hosts.ini b/ansible/inventory/hosts.ini index 13315dcad3..c358c6a525 100644 --- a/ansible/inventory/hosts.ini +++ b/ansible/inventory/hosts.ini @@ -1,5 +1,5 @@ [webservers] -devops-vm ansible_host=172.26.16.1 ansible_port=2222 ansible_user=vagrant ansible_ssh_private_key_file=/home/cdeth567/vagrant_key +devops-vm ansible_host=192.168.56.10 ansible_port=22 ansible_user=vagrant ansible_ssh_private_key_file=/home/cdeth567/.ssh/vagrant_key [webservers:vars] ansible_python_interpreter=/usr/bin/python3 diff --git a/ansible/playbooks/deploy.yml b/ansible/playbooks/deploy.yml index c8880281d1..842fddf11a 100644 --- a/ansible/playbooks/deploy.yml +++ b/ansible/playbooks/deploy.yml @@ -1,9 +1,9 @@ ---- -- name: Deploy application - hosts: webservers - become: true - vars_files: - - ../group_vars/all.yml - - roles: - - app_deploy +--- +- name: Deploy application + hosts: webservers + become: true + vars_files: + - ../group_vars/all.yml + + roles: + - web_app diff --git a/ansible/playbooks/provision.yml b/ansible/playbooks/provision.yml index 
7cc2e6678d..dc9464d334 100644 --- a/ansible/playbooks/provision.yml +++ b/ansible/playbooks/provision.yml @@ -1,8 +1,8 @@ ---- -- name: Provision web servers - hosts: webservers - become: true - - roles: - - common - - docker +--- +- name: Provision web servers + hosts: webservers + become: true + + roles: + - common + - docker diff --git a/ansible/playbooks/site.yml b/ansible/playbooks/site.yml index da4943e972..876b2cb346 100644 --- a/ansible/playbooks/site.yml +++ b/ansible/playbooks/site.yml @@ -1,9 +1,9 @@ ---- -- name: Full site run (provision + deploy) - hosts: webservers - become: true - - roles: - - common - - docker - - app_deploy +--- +- name: Full site run (provision + deploy) + hosts: webservers + become: true + + roles: + - common + - docker + - app_deploy diff --git a/ansible/roles/app_deploy/tasks/main.yml b/ansible/roles/app_deploy/tasks/main.yml deleted file mode 100644 index 041110ff0c..0000000000 --- a/ansible/roles/app_deploy/tasks/main.yml +++ /dev/null @@ -1,46 +0,0 @@ ---- -- name: Log in to Docker Hub - community.docker.docker_login: - username: "{{ dockerhub_username }}" - password: "{{ dockerhub_password }}" - registry_url: "https://index.docker.io/v1/" - no_log: false - -- name: Pull Docker image - community.docker.docker_image: - name: "{{ docker_image }}" - tag: "{{ docker_image_tag }}" - source: pull - force_source: yes - -- name: Remove old container if exists - community.docker.docker_container: - name: "{{ app_container_name }}" - state: absent - ignore_errors: yes - -- name: Run new container - community.docker.docker_container: - name: "{{ app_container_name }}" - image: "{{ docker_image }}:{{ docker_image_tag }}" - state: started - restart_policy: "{{ app_restart_policy }}" - ports: - - "{{ app_port }}:{{ app_port }}" - -- name: Wait for application port - wait_for: - port: "{{ app_port }}" - host: localhost - delay: 5 - timeout: 60 - -- name: Verify health endpoint - uri: - url: "http://localhost:{{ app_port }}/health" - 
method: GET - status_code: 200 - retries: 5 - delay: 5 - register: health_check - until: health_check.status == 200 diff --git a/ansible/roles/common/defaults/main.yml b/ansible/roles/common/defaults/main.yml index c635cb993f..c853713294 100644 --- a/ansible/roles/common/defaults/main.yml +++ b/ansible/roles/common/defaults/main.yml @@ -1,14 +1,14 @@ ---- -# Default list of packages installed on every server -common_packages: - - python3-pip - - curl - - git - - vim - - htop - - ca-certificates - - gnupg - - lsb-release - -# Optional timezone (set to null to skip) -common_timezone: "Europe/Stockholm" +--- +# Default list of packages installed on every server +common_packages: + - python3-pip + - curl + - git + - vim + - htop + - ca-certificates + - gnupg + - lsb-release + +# Optional timezone (set to null to skip) +common_timezone: "Europe/Stockholm" diff --git a/ansible/roles/common/tasks/main.yml b/ansible/roles/common/tasks/main.yml index 3a3cf495ba..393e289378 100644 --- a/ansible/roles/common/tasks/main.yml +++ b/ansible/roles/common/tasks/main.yml @@ -1,15 +1,84 @@ ---- -- name: Update apt cache - ansible.builtin.apt: - update_cache: true - cache_valid_time: 3600 - -- name: Install common packages - ansible.builtin.apt: - name: "{{ common_packages }}" - state: present - -- name: Set timezone (optional) - community.general.timezone: - name: "{{ common_timezone }}" - when: common_timezone is not none +--- +# Common role: system packages and user setup +# Tags: common (entire role), packages (apt tasks), users (user management) + +- name: Install required system packages + block: + - name: Update apt cache + ansible.builtin.apt: + update_cache: true + cache_valid_time: 3600 + + - name: Install essential packages + ansible.builtin.apt: + name: "{{ common_packages }}" + state: present + + rescue: + - name: Retry with fix-missing on apt failure + ansible.builtin.apt: + name: "{{ common_packages }}" + state: present + update_cache: true + environment: + 
DEBIAN_FRONTEND: noninteractive + # Retry once with --fix-missing to handle partial failures + register: apt_retry + until: apt_retry is succeeded + retries: 1 + delay: 5 + + always: + - name: Log package installation completion + ansible.builtin.copy: + dest: /tmp/ansible_common_packages.log + content: | + Common packages installation completed at {{ ansible_date_time.iso8601 }} + Host: {{ inventory_hostname }} + mode: "0644" + + become: true + tags: + - packages + - common + +- name: Manage application users + block: + - name: Ensure app group exists + ansible.builtin.group: + name: "{{ common_app_group }}" + state: present + + - name: Create application user + ansible.builtin.user: + name: "{{ common_app_user }}" + group: "{{ common_app_group }}" + shell: /bin/bash + create_home: true + state: present + + - name: Add app user to docker group + ansible.builtin.user: + name: "{{ common_app_user }}" + groups: docker + append: true + + rescue: + - name: Log user creation failure + ansible.builtin.debug: + msg: "User/group creation failed for {{ common_app_user }}. Check system permissions." 
+ + always: + - name: Log user setup completion + ansible.builtin.copy: + dest: /tmp/ansible_common_users.log + content: | + User setup completed at {{ ansible_date_time.iso8601 }} + User: {{ common_app_user }} + Host: {{ inventory_hostname }} + mode: "0644" + + become: true + tags: + - users + - common diff --git a/ansible/roles/docker/defaults/main.yml b/ansible/roles/docker/defaults/main.yml index 6ca3d13392..ae4a7b0add 100644 --- a/ansible/roles/docker/defaults/main.yml +++ b/ansible/roles/docker/defaults/main.yml @@ -1,9 +1,18 @@ ---- -docker_packages: - - docker-ce - - docker-ce-cli - - containerd.io - - docker-buildx-plugin - - docker-compose-plugin +--- +docker_packages: + - docker-ce + - docker-ce-cli + - containerd.io + - docker-buildx-plugin + - docker-compose-plugin + +docker_user: vagrant -docker_user: vagrant +docker_daemon_config: + log-driver: json-file + log-opts: + max-size: "10m" + max-file: "3" + +docker_users: + - vagrant diff --git a/ansible/roles/docker/handlers/main.yml b/ansible/roles/docker/handlers/main.yml index 1a5058da5e..568d0966f5 100644 --- a/ansible/roles/docker/handlers/main.yml +++ b/ansible/roles/docker/handlers/main.yml @@ -1,5 +1,5 @@ ---- -- name: restart docker - ansible.builtin.service: - name: docker - state: restarted +--- +- name: restart docker + ansible.builtin.service: + name: docker + state: restarted diff --git a/ansible/roles/docker/tasks/main.yml b/ansible/roles/docker/tasks/main.yml index 57ac2d885b..a89bacc6e4 100644 --- a/ansible/roles/docker/tasks/main.yml +++ b/ansible/roles/docker/tasks/main.yml @@ -1,49 +1,119 @@ ---- -- name: Install prerequisites for Docker repo - apt: - name: - - ca-certificates - - curl - - gnupg - state: present - -- name: Ensure /etc/apt/keyrings exists - file: - path: /etc/apt/keyrings - state: directory - mode: '0755' - -- name: Download and dearmor Docker GPG key - shell: curl -fsSL https://download.docker.com/linux/ubuntu/gpg | gpg --dearmor -o /etc/apt/keyrings/docker.gpg && 
chmod a+r /etc/apt/keyrings/docker.gpg - args: - creates: /etc/apt/keyrings/docker.gpg - -- name: Add Docker apt repository - apt_repository: - repo: "deb [arch=amd64 signed-by=/etc/apt/keyrings/docker.gpg] https://download.docker.com/linux/ubuntu {{ ansible_distribution_release }} stable" - state: present - filename: docker - update_cache: yes - -- name: Install Docker packages - apt: - name: "{{ docker_packages }}" - state: present - notify: restart docker - -- name: Ensure Docker service is started and enabled - service: - name: docker - state: started - enabled: yes - -- name: Add user to docker group - user: - name: "{{ docker_user }}" - groups: docker - append: yes - -- name: Install python3-docker for Ansible Docker modules - apt: - name: python3-docker - state: present +--- +# Docker role: install and configure Docker Engine +# Tags: docker (entire role), docker_install, docker_config + +- name: Install Docker Engine + block: + - name: Remove old Docker packages if present + ansible.builtin.apt: + name: + - docker + - docker-engine + - docker.io + - containerd + - runc + state: absent + purge: true + + - name: Install Docker dependencies + ansible.builtin.apt: + name: + - apt-transport-https + - ca-certificates + - curl + - gnupg + - lsb-release + state: present + update_cache: true + + - name: Add Docker GPG key + ansible.builtin.apt_key: + url: https://download.docker.com/linux/ubuntu/gpg + state: present + + - name: Add Docker apt repository + ansible.builtin.apt_repository: + repo: >- + deb [arch=amd64] + https://download.docker.com/linux/ubuntu + {{ ansible_distribution_release }} stable + state: present + update_cache: true + + - name: Install Docker packages + ansible.builtin.apt: + name: "{{ docker_packages }}" + state: present + + rescue: + # GPG/network timeouts are common; wait and retry + - name: Wait before retrying Docker install + ansible.builtin.pause: + seconds: 10 + + - name: Retry adding Docker GPG key + ansible.builtin.apt_key: + url: 
https://download.docker.com/linux/ubuntu/gpg + state: present + + - name: Retry installing Docker packages + ansible.builtin.apt: + name: "{{ docker_packages }}" + state: present + update_cache: true + + always: + - name: Ensure Docker service is enabled and started + ansible.builtin.service: + name: docker + state: started + enabled: true + + become: true + tags: + - docker + - docker_install + +- name: Configure Docker + block: + - name: Create Docker daemon configuration directory + ansible.builtin.file: + path: /etc/docker + state: directory + mode: "0755" + + - name: Configure Docker daemon + ansible.builtin.copy: + dest: /etc/docker/daemon.json + content: "{{ docker_daemon_config | to_nice_json }}" + mode: "0644" + notify: restart docker + + - name: Add users to docker group + ansible.builtin.user: + name: "{{ item }}" + groups: docker + append: true + loop: "{{ docker_users }}" + + rescue: + - name: Log Docker configuration failure + ansible.builtin.debug: + msg: "Docker configuration failed. Rolling back daemon.json." 
+ + - name: Remove invalid daemon config + ansible.builtin.file: + path: /etc/docker/daemon.json + state: absent + + always: + - name: Verify Docker is running after config + ansible.builtin.service: + name: docker + state: started + enabled: true + + become: true + tags: + - docker + - docker_config diff --git a/ansible/roles/app_deploy/defaults/main.yml b/ansible/roles/web_app/defaults/main.yml similarity index 68% rename from ansible/roles/app_deploy/defaults/main.yml rename to ansible/roles/web_app/defaults/main.yml index 1f7d94f7e2..50edc2cec0 100644 --- a/ansible/roles/app_deploy/defaults/main.yml +++ b/ansible/roles/web_app/defaults/main.yml @@ -1,10 +1,15 @@ ---- -app_name: devops-app -# By default the image is dockerhub_username/app_name (username is in Vault) -docker_image_tag: latest -app_port: 5000 -app_container_name: "{{ app_name }}" -app_restart_policy: unless-stopped -app_env: {} -health_endpoint: "/health" -health_timeout_seconds: 30 +--- +app_name: devops-app +# By default the image is dockerhub_username/app_name (username is in Vault) +docker_image_tag: latest +app_port: 5000 +app_container_name: "{{ app_name }}" +app_restart_policy: unless-stopped +app_env: {} +health_endpoint: "/health" +health_timeout_seconds: 30 + +compose_project_dir: "/opt/{{ app_name }}" +docker_compose_version: "3.8" +app_internal_port: 5000 +web_app_wipe: false diff --git a/ansible/roles/app_deploy/handlers/main.yml b/ansible/roles/web_app/handlers/main.yml similarity index 96% rename from ansible/roles/app_deploy/handlers/main.yml rename to ansible/roles/web_app/handlers/main.yml index 1fc3fba48b..ae986eabda 100644 --- a/ansible/roles/app_deploy/handlers/main.yml +++ b/ansible/roles/web_app/handlers/main.yml @@ -1,6 +1,6 @@ ---- -- name: restart app container - community.docker.docker_container: - name: "{{ app_container_name }}" - state: started - restart: true +--- +- name: restart app container + community.docker.docker_container: + name: "{{ app_container_name }}" + 
state: started + restart: true diff --git a/ansible/roles/web_app/meta/main.yml b/ansible/roles/web_app/meta/main.yml new file mode 100644 index 0000000000..e81c1dfe31 --- /dev/null +++ b/ansible/roles/web_app/meta/main.yml @@ -0,0 +1,9 @@ +--- +galaxy_info: + role_name: web_app + description: Deploy a containerised web application using Docker Compose + license: MIT + min_ansible_version: "2.16" + +dependencies: + - role: docker diff --git a/ansible/roles/web_app/tasks/main.yml b/ansible/roles/web_app/tasks/main.yml new file mode 100644 index 0000000000..da8559b773 --- /dev/null +++ b/ansible/roles/web_app/tasks/main.yml @@ -0,0 +1,80 @@ +--- +# roles/web_app/tasks/main.yml +# Tags: web_app_wipe | app_deploy | compose + +- name: Include wipe tasks + ansible.builtin.include_tasks: wipe.yml + tags: + - web_app_wipe + +- name: Deploy application with Docker Compose + block: + - name: Log in to Docker Hub + community.docker.docker_login: + username: "{{ dockerhub_username }}" + password: "{{ dockerhub_password }}" + registry_url: "https://index.docker.io/v1/" + no_log: true + + - name: Create application directory + ansible.builtin.file: + path: "{{ compose_project_dir }}" + state: directory + mode: "0755" + + - name: Template docker-compose.yml to application directory + ansible.builtin.template: + src: docker-compose.yml.j2 + dest: "{{ compose_project_dir }}/docker-compose.yml" + mode: "0644" + + - name: Pull latest image and bring up services + community.docker.docker_compose_v2: + project_src: "{{ compose_project_dir }}" + pull: policy + state: present + recreate: auto + + - name: Wait for application port to open + ansible.builtin.wait_for: + port: "{{ app_port }}" + host: localhost + delay: 5 + timeout: 60 + + - name: Verify health endpoint + ansible.builtin.uri: + url: "http://localhost:{{ app_port }}{{ health_endpoint }}" + method: GET + status_code: 200 + retries: 5 + delay: 5 + register: health_check + until: health_check.status == 200 + + - name: Log 
successful deployment + ansible.builtin.debug: + msg: "{{ app_name }} deployed successfully on {{ inventory_hostname }}:{{ app_port }}" + + rescue: + - name: Show Docker Compose logs on failure + ansible.builtin.command: + cmd: docker compose -f {{ compose_project_dir }}/docker-compose.yml logs --tail=50 + register: compose_logs + changed_when: false + ignore_errors: true + + - name: Display logs for debugging + ansible.builtin.debug: + var: compose_logs.stdout_lines + + - name: Fail with helpful message + ansible.builtin.fail: + msg: >- + Deployment of '{{ app_name }}' failed. See compose logs above. + Verify image {{ docker_image }}:{{ docker_image_tag }} exists on Docker Hub. + + become: true + tags: + - app_deploy + - compose diff --git a/ansible/roles/web_app/tasks/wipe.yml b/ansible/roles/web_app/tasks/wipe.yml new file mode 100644 index 0000000000..e61df93468 --- /dev/null +++ b/ansible/roles/web_app/tasks/wipe.yml @@ -0,0 +1,23 @@ +--- +- name: Wipe web application + block: + - name: Stop and remove containers via Docker Compose + community.docker.docker_compose_v2: + project_src: "{{ compose_project_dir }}" + state: absent + remove_volumes: true + ignore_errors: true + + - name: Remove application directory + ansible.builtin.file: + path: "{{ compose_project_dir }}" + state: absent + + - name: Log successful wipe + ansible.builtin.debug: + msg: "Application '{{ app_name }}' wiped successfully from {{ inventory_hostname }}" + + when: web_app_wipe | bool + become: true + tags: + - web_app_wipe diff --git a/ansible/roles/web_app/templates/docker-compose.yml.j2 b/ansible/roles/web_app/templates/docker-compose.yml.j2 new file mode 100644 index 0000000000..04f0314623 --- /dev/null +++ b/ansible/roles/web_app/templates/docker-compose.yml.j2 @@ -0,0 +1,30 @@ +# Managed by Ansible — do not edit manually +version: '{{ docker_compose_version }}' + +services: + {{ app_name }}: + image: {{ docker_image }}:{{ docker_image_tag }} + container_name: {{ app_container_name 
}} + ports: + - "{{ app_port }}:{{ app_internal_port }}" + environment: + PYTHONUNBUFFERED: "1" +{% for key, value in app_env.items() %} + {{ key }}: "{{ value }}" +{% endfor %} + restart: {{ app_restart_policy }} + healthcheck: + test: ["CMD", "curl", "-f", "http://localhost:{{ app_internal_port }}{{ health_endpoint }}"] + interval: 30s + timeout: 10s + retries: 3 + start_period: 15s + logging: + driver: json-file + options: + max-size: "10m" + max-file: "3" + +networks: + default: + name: {{ app_name }}_network From 96676ecde8af15ee1d391f9f9d7a2d2a776d6dbd Mon Sep 17 00:00:00 2001 From: Cdeth567 <11kvvkvv11@mail.ru> Date: Thu, 5 Mar 2026 19:15:55 +0300 Subject: [PATCH 02/13] fix: add dummy vault pass for ansible-lint in CI --- .github/workflows/ansible-deploy.yml | 7 +++++-- 1 file changed, 5 insertions(+), 2 deletions(-) diff --git a/.github/workflows/ansible-deploy.yml b/.github/workflows/ansible-deploy.yml index 551819a03f..be407e2512 100644 --- a/.github/workflows/ansible-deploy.yml +++ b/.github/workflows/ansible-deploy.yml @@ -2,7 +2,7 @@ name: Ansible Deployment on: push: - branches: [master] + branches: [master, lab06] paths: - 'ansible/**' - '!ansible/docs/**' @@ -37,6 +37,9 @@ jobs: - name: Install Ansible and ansible-lint run: pip install ansible ansible-lint + - name: Create dummy vault password for lint + run: echo "dummy" > ansible/.vault_pass + - name: Run ansible-lint run: | cd ansible @@ -46,7 +49,7 @@ jobs: name: Deploy Application needs: lint runs-on: ubuntu-latest - if: github.event_name == 'push' + if: github.event_name == 'push' && github.ref == 'refs/heads/master' steps: - name: Checkout repository uses: actions/checkout@v4 From e57e330d0c86bd2194e11024410f4ed51c7776a0 Mon Sep 17 00:00:00 2001 From: Cdeth567 <11kvvkvv11@mail.ru> Date: Thu, 5 Mar 2026 19:19:12 +0300 Subject: [PATCH 03/13] fix: ansible-lint violations and vault in CI --- .github/workflows/ansible-deploy.yml | 8 ++++++-- ansible/.ansible-lint | 9 +++++++++ 
ansible/playbooks/site.yml | 2 +- ansible/roles/common/tasks/main.yml | 2 +- ansible/roles/docker/handlers/main.yml | 2 +- 5 files changed, 18 insertions(+), 5 deletions(-) create mode 100644 ansible/.ansible-lint diff --git a/.github/workflows/ansible-deploy.yml b/.github/workflows/ansible-deploy.yml index be407e2512..ea53365291 100644 --- a/.github/workflows/ansible-deploy.yml +++ b/.github/workflows/ansible-deploy.yml @@ -37,14 +37,18 @@ jobs: - name: Install Ansible and ansible-lint run: pip install ansible ansible-lint - - name: Create dummy vault password for lint - run: echo "dummy" > ansible/.vault_pass + - name: Write vault password for syntax check + run: echo "${{ secrets.ANSIBLE_VAULT_PASSWORD }}" > ansible/.vault_pass - name: Run ansible-lint run: | cd ansible ansible-lint playbooks/provision.yml playbooks/deploy.yml playbooks/site.yml + - name: Clean up vault password + if: always() + run: rm -f ansible/.vault_pass + deploy: name: Deploy Application needs: lint diff --git a/ansible/.ansible-lint b/ansible/.ansible-lint new file mode 100644 index 0000000000..a42a13d8f2 --- /dev/null +++ b/ansible/.ansible-lint @@ -0,0 +1,9 @@ +warn_list: + - key-order + - var-naming + - name + +skip_list: + - key-order[task] + - var-naming[no-role-prefix] + - name[casing] diff --git a/ansible/playbooks/site.yml b/ansible/playbooks/site.yml index 876b2cb346..cf2e66a01a 100644 --- a/ansible/playbooks/site.yml +++ b/ansible/playbooks/site.yml @@ -6,4 +6,4 @@ roles: - common - docker - - app_deploy + - web_app diff --git a/ansible/roles/common/tasks/main.yml b/ansible/roles/common/tasks/main.yml index 393e289378..c8c44248fd 100644 --- a/ansible/roles/common/tasks/main.yml +++ b/ansible/roles/common/tasks/main.yml @@ -23,7 +23,7 @@ environment: DEBIAN_FRONTEND: noninteractive # Retry once with --fix-missing to handle partial failures - register: apt_retry + register: common_apt_retry until: apt_retry is succeeded retries: 1 delay: 5 diff --git 
a/ansible/roles/docker/handlers/main.yml b/ansible/roles/docker/handlers/main.yml index 568d0966f5..55637bda17 100644 --- a/ansible/roles/docker/handlers/main.yml +++ b/ansible/roles/docker/handlers/main.yml @@ -1,5 +1,5 @@ --- -- name: restart docker +- name: Restart docker ansible.builtin.service: name: docker state: restarted From 47ffbc925aa26afcb3082d5f569f2c3357b1c0f0 Mon Sep 17 00:00:00 2001 From: Cdeth567 <11kvvkvv11@mail.ru> Date: Thu, 5 Mar 2026 19:30:55 +0300 Subject: [PATCH 04/13] fix: use printf to avoid trailing newline in vault password --- .github/workflows/ansible-deploy.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/ansible-deploy.yml b/.github/workflows/ansible-deploy.yml index ea53365291..50500ee6d1 100644 --- a/.github/workflows/ansible-deploy.yml +++ b/.github/workflows/ansible-deploy.yml @@ -38,7 +38,7 @@ jobs: run: pip install ansible ansible-lint - name: Write vault password for syntax check - run: echo "${{ secrets.ANSIBLE_VAULT_PASSWORD }}" > ansible/.vault_pass + run: printf "%s" "${{ secrets.ANSIBLE_VAULT_PASSWORD }}" > ansible/.vault_pass - name: Run ansible-lint run: | @@ -78,7 +78,7 @@ jobs: ssh-keyscan -H "${{ secrets.VM_HOST }}" >> ~/.ssh/known_hosts - name: Write Vault password file - run: echo "${{ secrets.ANSIBLE_VAULT_PASSWORD }}" > /tmp/vault_pass + run: printf "%s" "${{ secrets.ANSIBLE_VAULT_PASSWORD }}" > /tmp/vault_pass - name: Run Ansible deploy playbook env: From 0e13cbe6db72f9b0aed8664770a7c46910411c8f Mon Sep 17 00:00:00 2001 From: Cdeth567 <11kvvkvv11@mail.ru> Date: Thu, 5 Mar 2026 19:32:41 +0300 Subject: [PATCH 05/13] fix: use env var for vault password to avoid interpolation issues --- .github/workflows/ansible-deploy.yml | 56 +++++++++++----------------- 1 file changed, 21 insertions(+), 35 deletions(-) diff --git a/.github/workflows/ansible-deploy.yml b/.github/workflows/ansible-deploy.yml index 50500ee6d1..fdc8df7a61 100644 --- a/.github/workflows/ansible-deploy.yml +++ 
b/.github/workflows/ansible-deploy.yml @@ -13,39 +13,31 @@ on: - 'ansible/**' - '.github/workflows/ansible-deploy.yml' -concurrency: - group: ansible-deploy-${{ github.ref }} - cancel-in-progress: true - -permissions: - contents: read - jobs: lint: name: Ansible Lint runs-on: ubuntu-latest steps: - - name: Checkout repository - uses: actions/checkout@v4 + - uses: actions/checkout@v4 - - name: Set up Python 3.12 - uses: actions/setup-python@v5 + - uses: actions/setup-python@v5 with: python-version: '3.12' - cache: pip - name: Install Ansible and ansible-lint run: pip install ansible ansible-lint - - name: Write vault password for syntax check - run: printf "%s" "${{ secrets.ANSIBLE_VAULT_PASSWORD }}" > ansible/.vault_pass + - name: Write vault password + env: + VAULT_PASS: ${{ secrets.ANSIBLE_VAULT_PASSWORD }} + run: printf '%s' "$VAULT_PASS" > ansible/.vault_pass - name: Run ansible-lint run: | cd ansible ansible-lint playbooks/provision.yml playbooks/deploy.yml playbooks/site.yml - - name: Clean up vault password + - name: Cleanup if: always() run: rm -f ansible/.vault_pass @@ -55,44 +47,38 @@ jobs: runs-on: ubuntu-latest if: github.event_name == 'push' && github.ref == 'refs/heads/master' steps: - - name: Checkout repository - uses: actions/checkout@v4 + - uses: actions/checkout@v4 - - name: Set up Python 3.12 - uses: actions/setup-python@v5 + - uses: actions/setup-python@v5 with: python-version: '3.12' - cache: pip - name: Install Ansible run: pip install ansible - - name: Install community.docker collection + - name: Install collections run: ansible-galaxy collection install community.docker community.general - - name: Configure SSH access to target VM + - name: Configure SSH run: | mkdir -p ~/.ssh - echo "${{ secrets.SSH_PRIVATE_KEY }}" > ~/.ssh/id_rsa + printf '%s' "${{ secrets.SSH_PRIVATE_KEY }}" > ~/.ssh/id_rsa chmod 600 ~/.ssh/id_rsa ssh-keyscan -H "${{ secrets.VM_HOST }}" >> ~/.ssh/known_hosts - - name: Write Vault password file - run: printf "%s" "${{ 
secrets.ANSIBLE_VAULT_PASSWORD }}" > /tmp/vault_pass - - - name: Run Ansible deploy playbook + - name: Write vault password env: - ANSIBLE_HOST_KEY_CHECKING: "False" + VAULT_PASS: ${{ secrets.ANSIBLE_VAULT_PASSWORD }} + run: printf '%s' "$VAULT_PASS" > /tmp/vault_pass + + - name: Deploy run: | cd ansible - ansible-playbook playbooks/deploy.yml \ - --vault-password-file /tmp/vault_pass + ansible-playbook playbooks/deploy.yml --vault-password-file /tmp/vault_pass - - name: Clean up Vault password file + - name: Cleanup vault pass if: always() run: rm -f /tmp/vault_pass - - name: Verify deployment - run: | - sleep 10 - curl -f "http://${{ secrets.VM_HOST }}:5000/health" || exit 1 + - name: Verify health + run: sleep 10 && curl -f "http://${{ secrets.VM_HOST }}:5000/health" From b7dc555ecd529eb41702f77695e7bf342e06984a Mon Sep 17 00:00:00 2001 From: Cdeth567 <11kvvkvv11@mail.ru> Date: Thu, 5 Mar 2026 19:34:19 +0300 Subject: [PATCH 06/13] fix: remove vault from ansible.cfg during lint in CI --- .github/workflows/ansible-deploy.yml | 28 +++++++--------------------- 1 file changed, 7 insertions(+), 21 deletions(-) diff --git a/.github/workflows/ansible-deploy.yml b/.github/workflows/ansible-deploy.yml index fdc8df7a61..09c7ff4c69 100644 --- a/.github/workflows/ansible-deploy.yml +++ b/.github/workflows/ansible-deploy.yml @@ -27,20 +27,15 @@ jobs: - name: Install Ansible and ansible-lint run: pip install ansible ansible-lint - - name: Write vault password - env: - VAULT_PASS: ${{ secrets.ANSIBLE_VAULT_PASSWORD }} - run: printf '%s' "$VAULT_PASS" > ansible/.vault_pass - - name: Run ansible-lint + env: + ANSIBLE_VAULT_PASSWORD_FILE: "" run: | cd ansible + # Remove vault_password_file from cfg for lint + sed -i '/vault_password_file/d' ansible.cfg ansible-lint playbooks/provision.yml playbooks/deploy.yml playbooks/site.yml - - name: Cleanup - if: always() - run: rm -f ansible/.vault_pass - deploy: name: Deploy Application needs: lint @@ -48,37 +43,28 @@ jobs: if: 
github.event_name == 'push' && github.ref == 'refs/heads/master' steps: - uses: actions/checkout@v4 - - uses: actions/setup-python@v5 with: python-version: '3.12' - - name: Install Ansible run: pip install ansible - - name: Install collections run: ansible-galaxy collection install community.docker community.general - - name: Configure SSH run: | mkdir -p ~/.ssh printf '%s' "${{ secrets.SSH_PRIVATE_KEY }}" > ~/.ssh/id_rsa chmod 600 ~/.ssh/id_rsa ssh-keyscan -H "${{ secrets.VM_HOST }}" >> ~/.ssh/known_hosts - - - name: Write vault password + - name: Deploy env: VAULT_PASS: ${{ secrets.ANSIBLE_VAULT_PASSWORD }} - run: printf '%s' "$VAULT_PASS" > /tmp/vault_pass - - - name: Deploy run: | + printf '%s' "$VAULT_PASS" > /tmp/vault_pass cd ansible ansible-playbook playbooks/deploy.yml --vault-password-file /tmp/vault_pass - - - name: Cleanup vault pass + - name: Cleanup if: always() run: rm -f /tmp/vault_pass - - name: Verify health run: sleep 10 && curl -f "http://${{ secrets.VM_HOST }}:5000/health" From d6d0a0738783b9065e97770e396e34e32fa47897 Mon Sep 17 00:00:00 2001 From: Cdeth567 <11kvvkvv11@mail.ru> Date: Thu, 5 Mar 2026 19:39:30 +0300 Subject: [PATCH 07/13] fix: remove vault_password_file from ansible.cfg for CI compatibility --- ansible/ansible.cfg | 1 - 1 file changed, 1 deletion(-) diff --git a/ansible/ansible.cfg b/ansible/ansible.cfg index 7737aab432..d74fa42465 100644 --- a/ansible/ansible.cfg +++ b/ansible/ansible.cfg @@ -1,5 +1,4 @@ [defaults] -vault_password_file = .vault_pass inventory = inventory/hosts.ini roles_path = roles host_key_checking = False From 65fc231b042a1fe5a783be45c08b2864abe4cff8 Mon Sep 17 00:00:00 2001 From: Cdeth567 <11kvvkvv11@mail.ru> Date: Thu, 5 Mar 2026 19:53:46 +0300 Subject: [PATCH 08/13] fix: correct until variable name, remove vars_files, fix handler notify case --- ansible/playbooks/deploy.yml | 2 -- ansible/roles/common/tasks/main.yml | 2 +- ansible/roles/docker/tasks/main.yml | 2 +- 3 files changed, 2 insertions(+), 4 
deletions(-) diff --git a/ansible/playbooks/deploy.yml b/ansible/playbooks/deploy.yml index 842fddf11a..77ad7aa765 100644 --- a/ansible/playbooks/deploy.yml +++ b/ansible/playbooks/deploy.yml @@ -2,8 +2,6 @@ - name: Deploy application hosts: webservers become: true - vars_files: - - ../group_vars/all.yml roles: - web_app diff --git a/ansible/roles/common/tasks/main.yml b/ansible/roles/common/tasks/main.yml index c8c44248fd..53490d4f8c 100644 --- a/ansible/roles/common/tasks/main.yml +++ b/ansible/roles/common/tasks/main.yml @@ -24,7 +24,7 @@ DEBIAN_FRONTEND: noninteractive # Retry once with --fix-missing to handle partial failures register: common_apt_retry - until: apt_retry is succeeded + until: common_apt_retry is succeeded retries: 1 delay: 5 diff --git a/ansible/roles/docker/tasks/main.yml b/ansible/roles/docker/tasks/main.yml index a89bacc6e4..7bd916d856 100644 --- a/ansible/roles/docker/tasks/main.yml +++ b/ansible/roles/docker/tasks/main.yml @@ -87,7 +87,7 @@ dest: /etc/docker/daemon.json content: "{{ docker_daemon_config | to_nice_json }}" mode: "0644" - notify: restart docker + notify: Restart docker - name: Add users to docker group ansible.builtin.user: From 044e6810ca871acf8e8010456ef60cc0ef710cbf Mon Sep 17 00:00:00 2001 From: Cdeth567 <11kvvkvv11@mail.ru> Date: Thu, 5 Mar 2026 19:58:28 +0300 Subject: [PATCH 09/13] trigger CI From e5ac7c65f3458cdbb09fcfad2015beb219f54af4 Mon Sep 17 00:00:00 2001 From: Cdeth567 <11kvvkvv11@mail.ru> Date: Thu, 5 Mar 2026 20:00:55 +0300 Subject: [PATCH 10/13] fix: trigger on push to lab06 --- .github/workflows/ansible-deploy.yml | 49 ---------------------------- 1 file changed, 49 deletions(-) diff --git a/.github/workflows/ansible-deploy.yml b/.github/workflows/ansible-deploy.yml index 09c7ff4c69..014bffbed1 100644 --- a/.github/workflows/ansible-deploy.yml +++ b/.github/workflows/ansible-deploy.yml @@ -3,15 +3,6 @@ name: Ansible Deployment on: push: branches: [master, lab06] - paths: - - 'ansible/**' - - 
'!ansible/docs/**' - - '.github/workflows/ansible-deploy.yml' - pull_request: - branches: [master] - paths: - - 'ansible/**' - - '.github/workflows/ansible-deploy.yml' jobs: lint: @@ -19,52 +10,12 @@ jobs: runs-on: ubuntu-latest steps: - uses: actions/checkout@v4 - - uses: actions/setup-python@v5 with: python-version: '3.12' - - name: Install Ansible and ansible-lint run: pip install ansible ansible-lint - - name: Run ansible-lint - env: - ANSIBLE_VAULT_PASSWORD_FILE: "" run: | cd ansible - # Remove vault_password_file from cfg for lint - sed -i '/vault_password_file/d' ansible.cfg ansible-lint playbooks/provision.yml playbooks/deploy.yml playbooks/site.yml - - deploy: - name: Deploy Application - needs: lint - runs-on: ubuntu-latest - if: github.event_name == 'push' && github.ref == 'refs/heads/master' - steps: - - uses: actions/checkout@v4 - - uses: actions/setup-python@v5 - with: - python-version: '3.12' - - name: Install Ansible - run: pip install ansible - - name: Install collections - run: ansible-galaxy collection install community.docker community.general - - name: Configure SSH - run: | - mkdir -p ~/.ssh - printf '%s' "${{ secrets.SSH_PRIVATE_KEY }}" > ~/.ssh/id_rsa - chmod 600 ~/.ssh/id_rsa - ssh-keyscan -H "${{ secrets.VM_HOST }}" >> ~/.ssh/known_hosts - - name: Deploy - env: - VAULT_PASS: ${{ secrets.ANSIBLE_VAULT_PASSWORD }} - run: | - printf '%s' "$VAULT_PASS" > /tmp/vault_pass - cd ansible - ansible-playbook playbooks/deploy.yml --vault-password-file /tmp/vault_pass - - name: Cleanup - if: always() - run: rm -f /tmp/vault_pass - - name: Verify health - run: sleep 10 && curl -f "http://${{ secrets.VM_HOST }}:5000/health" From 4ec223c1938e0d1787e9a2d5d9668cfd6d03c8a4 Mon Sep 17 00:00:00 2001 From: Cdeth567 <11kvvkvv11@mail.ru> Date: Thu, 5 Mar 2026 20:12:46 +0300 Subject: [PATCH 11/13] fix: CI --- .github/workflows/python-ci.yml | 206 +- README.md | 542 ++--- ansible/roles/web_app/meta/main.yml | 1 + ansible/roles/web_app/tasks/wipe.yml | 2 +- 
app_python/.dockerignore | 56 +- app_python/.gitignore | 24 +- app_python/Dockerfile | 58 +- app_python/README.md | 284 +-- app_python/app.py | 234 +- app_python/docs/LAB01.md | 336 +-- app_python/docs/LAB02.md | 470 ++-- app_python/docs/LAB03.md | 598 ++--- app_python/docs/LAB04.md | 426 ++-- app_python/requirements-dev.txt | 2 +- app_python/tests/test_app.py | 124 +- labs/lab01.md | 1386 ++++++------ labs/lab02.md | 732 +++---- labs/lab03.md | 1862 ++++++++-------- labs/lab04.md | 3020 +++++++++++++------------- labs/lab05.md | 1952 ++++++++--------- labs/lab06.md | 2704 +++++++++++------------ labs/lab07.md | 1188 +++++----- labs/lab08.md | 1504 ++++++------- labs/lab09.md | 1460 ++++++------- labs/lab10.md | 1806 +++++++-------- labs/lab11.md | 894 ++++---- labs/lab12.md | 932 ++++---- labs/lab13.md | 1188 +++++----- labs/lab14.md | 906 ++++---- labs/lab15.md | 608 +++--- labs/lab16.md | 522 ++--- labs/lab17.md | 894 ++++---- labs/lab18.md | 860 ++++---- labs/lab18/index.html | 1854 ++++++++-------- lectures/lec1.md | 1522 ++++++------- lectures/lec10.md | 1680 +++++++------- lectures/lec11.md | 1518 ++++++------- lectures/lec12.md | 1708 +++++++-------- lectures/lec13.md | 1660 +++++++------- lectures/lec14.md | 1650 +++++++------- lectures/lec15.md | 1642 +++++++------- lectures/lec16.md | 1434 ++++++------ lectures/lec2.md | 2106 +++++++++--------- lectures/lec3.md | 1956 ++++++++--------- lectures/lec4.md | 1602 +++++++------- lectures/lec5.md | 1648 +++++++------- lectures/lec6.md | 1774 +++++++-------- lectures/lec7.md | 1698 +++++++-------- lectures/lec8.md | 1598 +++++++------- lectures/lec9.md | 1706 +++++++-------- pulumi/.gitignore | 8 +- pulumi/Pulumi.yaml | 12 +- pulumi/__main__.py | 182 +- pulumi/requirements.txt | 2 +- terraform.tfvars | 8 +- terraform/.gitignore | 20 +- terraform/main.tf | 204 +- terraform/outputs.tf | 26 +- terraform/variables.tf | 134 +- terraform/versions.tf | 20 +- 60 files changed, 28577 insertions(+), 28576 deletions(-) 
diff --git a/.github/workflows/python-ci.yml b/.github/workflows/python-ci.yml index 834ef8fbc0..cf2f50727b 100644 --- a/.github/workflows/python-ci.yml +++ b/.github/workflows/python-ci.yml @@ -1,103 +1,103 @@ -name: Python CI (tests + docker) - -on: - push: - branches: [ "master", "lab03" ] - paths: - - "app_python/**" - - ".github/workflows/python-ci.yml" - pull_request: - branches: [ "master" ] - paths: - - "app_python/**" - - ".github/workflows/python-ci.yml" - -concurrency: - group: python-ci-${{ github.ref }} - cancel-in-progress: true - -permissions: - contents: read - -jobs: - test-and-lint: - runs-on: ubuntu-latest - - strategy: - fail-fast: true - matrix: - python-version: ["3.12", "3.13"] - - steps: - - name: Checkout - uses: actions/checkout@v4 - - - name: Set up Python ${{ matrix.python-version }} - uses: actions/setup-python@v5 - with: - python-version: ${{ matrix.python-version }} - cache: "pip" - cache-dependency-path: | - app_python/requirements.txt - app_python/requirements-dev.txt - - - name: Install dependencies - working-directory: app_python - run: | - python -m pip install --upgrade pip - pip install -r requirements.txt - pip install -r requirements-dev.txt - - - name: Lint (ruff) - working-directory: app_python - run: | - ruff check . 
- - - name: Run tests (pytest) - working-directory: app_python - run: | - pytest -q - - - name: Install Snyk CLI - run: npm install -g snyk - - - name: Snyk scan (dependencies) - continue-on-error: true - env: - SNYK_TOKEN: ${{ secrets.SNYK_TOKEN }} - run: | - cd app_python - snyk test --severity-threshold=high --file=requirements.txt - - docker-build-and-push: - runs-on: ubuntu-latest - needs: test-and-lint - - if: github.event_name == 'push' && (github.ref == 'refs/heads/master' || github.ref == 'refs/heads/lab03') - - permissions: - contents: read - - steps: - - name: Checkout - uses: actions/checkout@v4 - - - name: Set version (CalVer) - run: | - echo "VERSION=$(date -u +%Y.%m.%d)" >> $GITHUB_ENV - - - name: Log in to Docker Hub - uses: docker/login-action@v3 - with: - username: ${{ secrets.DOCKERHUB_USERNAME }} - password: ${{ secrets.DOCKERHUB_TOKEN }} - - - name: Build and push - uses: docker/build-push-action@v6 - with: - context: ./app_python - file: ./app_python/Dockerfile - push: true - tags: | - ${{ secrets.DOCKERHUB_USERNAME }}/devops-info-service:${{ env.VERSION }} - ${{ secrets.DOCKERHUB_USERNAME }}/devops-info-service:latest +name: Python CI (tests + docker) + +on: + push: + branches: [ "master", "lab03" ] + paths: + - "app_python/**" + - ".github/workflows/python-ci.yml" + pull_request: + branches: [ "master" ] + paths: + - "app_python/**" + - ".github/workflows/python-ci.yml" + +concurrency: + group: python-ci-${{ github.ref }} + cancel-in-progress: true + +permissions: + contents: read + +jobs: + test-and-lint: + runs-on: ubuntu-latest + + strategy: + fail-fast: true + matrix: + python-version: ["3.12", "3.13"] + + steps: + - name: Checkout + uses: actions/checkout@v4 + + - name: Set up Python ${{ matrix.python-version }} + uses: actions/setup-python@v5 + with: + python-version: ${{ matrix.python-version }} + cache: "pip" + cache-dependency-path: | + app_python/requirements.txt + app_python/requirements-dev.txt + + - name: Install dependencies + 
working-directory: app_python + run: | + python -m pip install --upgrade pip + pip install -r requirements.txt + pip install -r requirements-dev.txt + + - name: Lint (ruff) + working-directory: app_python + run: | + ruff check . + + - name: Run tests (pytest) + working-directory: app_python + run: | + pytest -q + + - name: Install Snyk CLI + run: npm install -g snyk + + - name: Snyk scan (dependencies) + continue-on-error: true + env: + SNYK_TOKEN: ${{ secrets.SNYK_TOKEN }} + run: | + cd app_python + snyk test --severity-threshold=high --file=requirements.txt + + docker-build-and-push: + runs-on: ubuntu-latest + needs: test-and-lint + + if: github.event_name == 'push' && (github.ref == 'refs/heads/master' || github.ref == 'refs/heads/lab03') + + permissions: + contents: read + + steps: + - name: Checkout + uses: actions/checkout@v4 + + - name: Set version (CalVer) + run: | + echo "VERSION=$(date -u +%Y.%m.%d)" >> $GITHUB_ENV + + - name: Log in to Docker Hub + uses: docker/login-action@v3 + with: + username: ${{ secrets.DOCKERHUB_USERNAME }} + password: ${{ secrets.DOCKERHUB_TOKEN }} + + - name: Build and push + uses: docker/build-push-action@v6 + with: + context: ./app_python + file: ./app_python/Dockerfile + push: true + tags: | + ${{ secrets.DOCKERHUB_USERNAME }}/devops-info-service:${{ env.VERSION }} + ${{ secrets.DOCKERHUB_USERNAME }}/devops-info-service:latest diff --git a/README.md b/README.md index 371d51f456..d961fa12e6 100644 --- a/README.md +++ b/README.md @@ -1,271 +1,271 @@ -# DevOps Engineering: Core Practices - -[![Labs](https://img.shields.io/badge/Labs-18-blue)](#labs) -[![Exam](https://img.shields.io/badge/Exam-Optional-green)](#exam-alternative) -[![Duration](https://img.shields.io/badge/Duration-18%20Weeks-lightgrey)](#course-roadmap) - -Master **production-grade DevOps practices** through hands-on labs. Build, containerize, deploy, monitor, and scale applications using industry-standard tools. - ---- - -## Quick Start - -1. 
**Fork** this repository -2. **Clone** your fork locally -3. **Start with Lab 1** and progress sequentially -4. **Submit PRs** for each lab (details below) - ---- - -## Course Roadmap - -| Week | Lab | Topic | Key Technologies | -|------|-----|-------|------------------| -| 1 | 1 | Web Application Development | Python/Go, Best Practices | -| 2 | 2 | Containerization | Docker, Multi-stage Builds | -| 3 | 3 | Continuous Integration | GitHub Actions, Snyk | -| 4 | 4 | Infrastructure as Code | Terraform, Cloud Providers | -| 5 | 5 | Configuration Management | Ansible Basics | -| 6 | 6 | Continuous Deployment | Ansible Advanced | -| 7 | 7 | Logging | Promtail, Loki, Grafana | -| 8 | 8 | Monitoring | Prometheus, Grafana | -| 9 | 9 | Kubernetes Basics | Minikube, Deployments, Services | -| 10 | 10 | Helm Charts | Templating, Hooks | -| 11 | 11 | Secrets Management | K8s Secrets, HashiCorp Vault | -| 12 | 12 | Configuration & Storage | ConfigMaps, PVCs | -| 13 | 13 | GitOps | ArgoCD | -| 14 | 14 | Progressive Delivery | Argo Rollouts | -| 15 | 15 | StatefulSets | Persistent Storage, Headless Services | -| 16 | 16 | Cluster Monitoring | Kube-Prometheus, Init Containers | -| — | **Exam Alternative Labs** | | | -| 17 | 17 | Edge Deployment | Fly.io, Global Distribution | -| 18 | 18 | Decentralized Storage | 4EVERLAND, IPFS, Web3 | - ---- - -## Grading - -### Grade Composition - -| Component | Weight | Points | -|-----------|--------|--------| -| **Labs (16 required)** | 80% | 160 pts | -| **Final Exam** | 20% | 40 pts | -| **Bonus Tasks** | Extra | +40 pts max | -| **Total** | 100% | 200 pts | - -### Exam Alternative - -Don't want to take the exam? 
Complete **both** bonus labs: - -| Lab | Topic | Points | -|-----|-------|--------| -| **Lab 17** | Fly.io Edge Deployment | 20 pts | -| **Lab 18** | 4EVERLAND & IPFS | 20 pts | - -**Requirements:** -- Complete both labs (17 + 18 = 40 pts, replaces exam) -- Minimum 16/20 on each lab -- Deadline: **1 week before exam date** -- Can still take exam if you need more points for desired grade - -
-📊 Grade Scale - -| Grade | Points | Percentage | -|-------|--------|------------| -| **A** | 180-200+ | 90-100% | -| **B** | 150-179 | 75-89% | -| **C** | 120-149 | 60-74% | -| **D** | 0-119 | 0-59% | - -**Minimum to Pass:** 120 points (60%) - -
- -
-📈 Grade Examples - -**Scenario 1: Labs + Exam** -``` -Labs: 16 × 9 = 144 pts -Bonus: 5 labs × 2.5 = 12.5 pts -Exam: 35/40 pts -Total: 191.5 pts = 96% (A) -``` - -**Scenario 2: Labs + Exam Alternative** -``` -Labs: 16 × 9 = 144 pts -Bonus: 8 labs × 2.5 = 20 pts -Lab 17: 18 pts -Lab 18: 17 pts -Total: 199 pts = 99.5% (A) -``` - -
- ---- - -## Lab Structure - -Each lab is worth **10 points** (main tasks) + **2.5 points** (bonus). - -- **Minimum passing score:** 6/10 per lab -- **Late submissions:** Max 6/10 (within 1 week) -- **Very late (>1 week):** Not accepted - -
-📋 Lab Categories - -**Foundation (Labs 1-2)** -- Web app development -- Docker containerization - -**CI/CD & Infrastructure (Labs 3-4)** -- GitHub Actions -- Terraform - -**Configuration Management (Labs 5-6)** -- Ansible playbooks and roles - -**Observability (Labs 7-8)** -- Loki logging stack -- Prometheus monitoring - -**Kubernetes Core (Labs 9-12)** -- K8s basics, Helm -- Secrets, ConfigMaps - -**Advanced Kubernetes (Labs 13-16)** -- ArgoCD, Argo Rollouts -- StatefulSets, Monitoring - -**Exam Alternative (Labs 17-18)** -- Fly.io, 4EVERLAND/IPFS - -
- ---- - -## How to Submit - -```bash -# 1. Create branch -git checkout -b lab1 - -# 2. Complete lab tasks - -# 3. Commit and push -git add . -git commit -m "Complete lab1" -git push -u origin lab1 - -# 4. Create TWO Pull Requests: -# PR #1: your-fork:lab1 → course-repo:master -# PR #2: your-fork:lab1 → your-fork:master -``` - -
-📝 Submission Checklist - -- [ ] All main tasks completed -- [ ] Documentation files created -- [ ] Screenshots where required -- [ ] Code tested and working -- [ ] Markdown validated ([linter](https://dlaa.me/markdownlint/)) -- [ ] Both PRs created - -
- ---- - -## Resources - -
-🛠️ Required Tools - -| Tool | Purpose | -|------|---------| -| Git | Version control | -| Docker | Containerization | -| kubectl | Kubernetes CLI | -| Helm | K8s package manager | -| Minikube | Local K8s cluster | -| Terraform | Infrastructure as Code | -| Ansible | Configuration management | - -
- -
-📚 Documentation Links - -**Core:** -- [Docker](https://docs.docker.com/) -- [Kubernetes](https://kubernetes.io/docs/) -- [Helm](https://helm.sh/docs/) - -**CI/CD:** -- [GitHub Actions](https://docs.github.com/en/actions) -- [Terraform](https://www.terraform.io/docs) -- [Ansible](https://docs.ansible.com/) - -**Observability:** -- [Prometheus](https://prometheus.io/docs/) -- [Grafana](https://grafana.com/docs/) - -**Advanced:** -- [ArgoCD](https://argo-cd.readthedocs.io/) -- [Argo Rollouts](https://argoproj.github.io/argo-rollouts/) -- [HashiCorp Vault](https://developer.hashicorp.com/vault/docs) - -
- -
-💡 Tips for Success - -1. **Start early** - Don't wait until deadline -2. **Read instructions fully** before starting -3. **Test everything** before submitting -4. **Document as you go** - Don't leave it for the end -5. **Ask questions early** - Don't wait until last minute -6. **Use proper Git workflow** - Branches, commits, PRs - -
- -
-🔧 Common Issues - -**Docker:** -- Daemon not running → Start Docker Desktop -- Permission denied → Add user to docker group - -**Minikube:** -- Won't start → Try `--driver=docker` -- Resource issues → Allocate more memory/CPU - -**Kubernetes:** -- ImagePullBackOff → Check image name/registry -- CrashLoopBackOff → Check logs: `kubectl logs ` - -
- ---- - -## Course Completion - -After completing all 16 core labs (+ optional Labs 17-18), you'll have: - -✅ Full-stack DevOps expertise -✅ Production-ready portfolio with 16-18 projects -✅ Container and Kubernetes mastery -✅ CI/CD pipeline experience -✅ Infrastructure as Code skills -✅ Monitoring and observability knowledge -✅ GitOps workflow experience - ---- - -**Ready to begin? Start with [Lab 1](labs/lab01.md)!** - -Questions? Check the course Moodle page or ask during office hours. +# DevOps Engineering: Core Practices + +[![Labs](https://img.shields.io/badge/Labs-18-blue)](#labs) +[![Exam](https://img.shields.io/badge/Exam-Optional-green)](#exam-alternative) +[![Duration](https://img.shields.io/badge/Duration-18%20Weeks-lightgrey)](#course-roadmap) + +Master **production-grade DevOps practices** through hands-on labs. Build, containerize, deploy, monitor, and scale applications using industry-standard tools. + +--- + +## Quick Start + +1. **Fork** this repository +2. **Clone** your fork locally +3. **Start with Lab 1** and progress sequentially +4. 
**Submit PRs** for each lab (details below) + +--- + +## Course Roadmap + +| Week | Lab | Topic | Key Technologies | +|------|-----|-------|------------------| +| 1 | 1 | Web Application Development | Python/Go, Best Practices | +| 2 | 2 | Containerization | Docker, Multi-stage Builds | +| 3 | 3 | Continuous Integration | GitHub Actions, Snyk | +| 4 | 4 | Infrastructure as Code | Terraform, Cloud Providers | +| 5 | 5 | Configuration Management | Ansible Basics | +| 6 | 6 | Continuous Deployment | Ansible Advanced | +| 7 | 7 | Logging | Promtail, Loki, Grafana | +| 8 | 8 | Monitoring | Prometheus, Grafana | +| 9 | 9 | Kubernetes Basics | Minikube, Deployments, Services | +| 10 | 10 | Helm Charts | Templating, Hooks | +| 11 | 11 | Secrets Management | K8s Secrets, HashiCorp Vault | +| 12 | 12 | Configuration & Storage | ConfigMaps, PVCs | +| 13 | 13 | GitOps | ArgoCD | +| 14 | 14 | Progressive Delivery | Argo Rollouts | +| 15 | 15 | StatefulSets | Persistent Storage, Headless Services | +| 16 | 16 | Cluster Monitoring | Kube-Prometheus, Init Containers | +| — | **Exam Alternative Labs** | | | +| 17 | 17 | Edge Deployment | Fly.io, Global Distribution | +| 18 | 18 | Decentralized Storage | 4EVERLAND, IPFS, Web3 | + +--- + +## Grading + +### Grade Composition + +| Component | Weight | Points | +|-----------|--------|--------| +| **Labs (16 required)** | 80% | 160 pts | +| **Final Exam** | 20% | 40 pts | +| **Bonus Tasks** | Extra | +40 pts max | +| **Total** | 100% | 200 pts | + +### Exam Alternative + +Don't want to take the exam? Complete **both** bonus labs: + +| Lab | Topic | Points | +|-----|-------|--------| +| **Lab 17** | Fly.io Edge Deployment | 20 pts | +| **Lab 18** | 4EVERLAND & IPFS | 20 pts | + +**Requirements:** +- Complete both labs (17 + 18 = 40 pts, replaces exam) +- Minimum 16/20 on each lab +- Deadline: **1 week before exam date** +- Can still take exam if you need more points for desired grade + +
+📊 Grade Scale + +| Grade | Points | Percentage | +|-------|--------|------------| +| **A** | 180-200+ | 90-100% | +| **B** | 150-179 | 75-89% | +| **C** | 120-149 | 60-74% | +| **D** | 0-119 | 0-59% | + +**Minimum to Pass:** 120 points (60%) + +
+ +
+📈 Grade Examples + +**Scenario 1: Labs + Exam** +``` +Labs: 16 × 9 = 144 pts +Bonus: 5 labs × 2.5 = 12.5 pts +Exam: 35/40 pts +Total: 191.5 pts = 96% (A) +``` + +**Scenario 2: Labs + Exam Alternative** +``` +Labs: 16 × 9 = 144 pts +Bonus: 8 labs × 2.5 = 20 pts +Lab 17: 18 pts +Lab 18: 17 pts +Total: 199 pts = 99.5% (A) +``` + +
+ +--- + +## Lab Structure + +Each lab is worth **10 points** (main tasks) + **2.5 points** (bonus). + +- **Minimum passing score:** 6/10 per lab +- **Late submissions:** Max 6/10 (within 1 week) +- **Very late (>1 week):** Not accepted + +
+📋 Lab Categories + +**Foundation (Labs 1-2)** +- Web app development +- Docker containerization + +**CI/CD & Infrastructure (Labs 3-4)** +- GitHub Actions +- Terraform + +**Configuration Management (Labs 5-6)** +- Ansible playbooks and roles + +**Observability (Labs 7-8)** +- Loki logging stack +- Prometheus monitoring + +**Kubernetes Core (Labs 9-12)** +- K8s basics, Helm +- Secrets, ConfigMaps + +**Advanced Kubernetes (Labs 13-16)** +- ArgoCD, Argo Rollouts +- StatefulSets, Monitoring + +**Exam Alternative (Labs 17-18)** +- Fly.io, 4EVERLAND/IPFS + +
+ +--- + +## How to Submit + +```bash +# 1. Create branch +git checkout -b lab1 + +# 2. Complete lab tasks + +# 3. Commit and push +git add . +git commit -m "Complete lab1" +git push -u origin lab1 + +# 4. Create TWO Pull Requests: +# PR #1: your-fork:lab1 → course-repo:master +# PR #2: your-fork:lab1 → your-fork:master +``` + +
+📝 Submission Checklist + +- [ ] All main tasks completed +- [ ] Documentation files created +- [ ] Screenshots where required +- [ ] Code tested and working +- [ ] Markdown validated ([linter](https://dlaa.me/markdownlint/)) +- [ ] Both PRs created + +
+ +--- + +## Resources + +
+🛠️ Required Tools + +| Tool | Purpose | +|------|---------| +| Git | Version control | +| Docker | Containerization | +| kubectl | Kubernetes CLI | +| Helm | K8s package manager | +| Minikube | Local K8s cluster | +| Terraform | Infrastructure as Code | +| Ansible | Configuration management | + +
+ +
+📚 Documentation Links + +**Core:** +- [Docker](https://docs.docker.com/) +- [Kubernetes](https://kubernetes.io/docs/) +- [Helm](https://helm.sh/docs/) + +**CI/CD:** +- [GitHub Actions](https://docs.github.com/en/actions) +- [Terraform](https://www.terraform.io/docs) +- [Ansible](https://docs.ansible.com/) + +**Observability:** +- [Prometheus](https://prometheus.io/docs/) +- [Grafana](https://grafana.com/docs/) + +**Advanced:** +- [ArgoCD](https://argo-cd.readthedocs.io/) +- [Argo Rollouts](https://argoproj.github.io/argo-rollouts/) +- [HashiCorp Vault](https://developer.hashicorp.com/vault/docs) + +
+ +
+💡 Tips for Success + +1. **Start early** - Don't wait until deadline +2. **Read instructions fully** before starting +3. **Test everything** before submitting +4. **Document as you go** - Don't leave it for the end +5. **Ask questions early** - Don't wait until last minute +6. **Use proper Git workflow** - Branches, commits, PRs + +
+ +
+🔧 Common Issues + +**Docker:** +- Daemon not running → Start Docker Desktop +- Permission denied → Add user to docker group + +**Minikube:** +- Won't start → Try `--driver=docker` +- Resource issues → Allocate more memory/CPU + +**Kubernetes:** +- ImagePullBackOff → Check image name/registry +- CrashLoopBackOff → Check logs: `kubectl logs ` + +
+ +--- + +## Course Completion + +After completing all 16 core labs (+ optional Labs 17-18), you'll have: + +✅ Full-stack DevOps expertise +✅ Production-ready portfolio with 16-18 projects +✅ Container and Kubernetes mastery +✅ CI/CD pipeline experience +✅ Infrastructure as Code skills +✅ Monitoring and observability knowledge +✅ GitOps workflow experience + +--- + +**Ready to begin? Start with [Lab 1](labs/lab01.md)!** + +Questions? Check the course Moodle page or ask during office hours. diff --git a/ansible/roles/web_app/meta/main.yml b/ansible/roles/web_app/meta/main.yml index e81c1dfe31..c37c0be4b9 100644 --- a/ansible/roles/web_app/meta/main.yml +++ b/ansible/roles/web_app/meta/main.yml @@ -1,6 +1,7 @@ --- galaxy_info: role_name: web_app + author: cdeth567 description: Deploy a containerised web application using Docker Compose license: MIT min_ansible_version: "2.16" diff --git a/ansible/roles/web_app/tasks/wipe.yml b/ansible/roles/web_app/tasks/wipe.yml index e61df93468..6fbb99dcea 100644 --- a/ansible/roles/web_app/tasks/wipe.yml +++ b/ansible/roles/web_app/tasks/wipe.yml @@ -6,7 +6,7 @@ project_src: "{{ compose_project_dir }}" state: absent remove_volumes: true - ignore_errors: true + failed_when: false - name: Remove application directory ansible.builtin.file: diff --git a/app_python/.dockerignore b/app_python/.dockerignore index d57576a080..bbc07852cb 100644 --- a/app_python/.dockerignore +++ b/app_python/.dockerignore @@ -1,28 +1,28 @@ -# Python cache -__pycache__/ -*.py[cod] - -# Virtual environments -venv/ -.venv/ - -# Git -.git/ -.gitignore - -# IDE -.vscode/ -.idea/ - -# OS -.DS_Store - -# Docs/screenshots not needed at runtime -docs/ -tests/ - -# Env files -.env - -# Logs -*.log +# Python cache +__pycache__/ +*.py[cod] + +# Virtual environments +venv/ +.venv/ + +# Git +.git/ +.gitignore + +# IDE +.vscode/ +.idea/ + +# OS +.DS_Store + +# Docs/screenshots not needed at runtime +docs/ +tests/ + +# Env files +.env + +# Logs +*.log diff --git 
a/app_python/.gitignore b/app_python/.gitignore index a8692c9faf..95e8a48683 100644 --- a/app_python/.gitignore +++ b/app_python/.gitignore @@ -1,13 +1,13 @@ -# Python -__pycache__/ -*.py[cod] -venv/ -*.log -.env - -# IDE -.vscode/ -.idea/ - -# OS +# Python +__pycache__/ +*.py[cod] +venv/ +*.log +.env + +# IDE +.vscode/ +.idea/ + +# OS .DS_Store \ No newline at end of file diff --git a/app_python/Dockerfile b/app_python/Dockerfile index 70118d9d99..ab5526ede7 100644 --- a/app_python/Dockerfile +++ b/app_python/Dockerfile @@ -1,29 +1,29 @@ -# syntax=docker/dockerfile:1 - -FROM python:3.13-slim - -# 1) Basic env for predictable Python behavior -ENV PYTHONDONTWRITEBYTECODE=1 \ - PYTHONUNBUFFERED=1 - -# 2) Create non-root user -RUN addgroup --system app && adduser --system --ingroup app app - -# 3) Workdir -WORKDIR /app - -# 4) Install dependencies (layer caching) -COPY requirements.txt . -RUN pip install --no-cache-dir -r requirements.txt - -# 5) Copy only necessary source files -COPY app.py . - -# 6) Security: drop privileges -USER app - -# 7) Document port (your app uses PORT env, default 5000) -EXPOSE 5000 - -# 8) Start the app -CMD ["python", "app.py"] +# syntax=docker/dockerfile:1 + +FROM python:3.13-slim + +# 1) Basic env for predictable Python behavior +ENV PYTHONDONTWRITEBYTECODE=1 \ + PYTHONUNBUFFERED=1 + +# 2) Create non-root user +RUN addgroup --system app && adduser --system --ingroup app app + +# 3) Workdir +WORKDIR /app + +# 4) Install dependencies (layer caching) +COPY requirements.txt . +RUN pip install --no-cache-dir -r requirements.txt + +# 5) Copy only necessary source files +COPY app.py . 
+ +# 6) Security: drop privileges +USER app + +# 7) Document port (your app uses PORT env, default 5000) +EXPOSE 5000 + +# 8) Start the app +CMD ["python", "app.py"] diff --git a/app_python/README.md b/app_python/README.md index 0d4c87ae27..201c54e7ca 100644 --- a/app_python/README.md +++ b/app_python/README.md @@ -1,142 +1,142 @@ -[![Python CI (tests + docker)](https://github.com/Cdeth567/DevOps-Core-Course/actions/workflows/python-ci.yml/badge.svg?branch=lab03)](https://github.com/Cdeth567/DevOps-Core-Course/actions/workflows/python-ci.yml) - -# DevOps Info Service - -## Overview -DevOps Info Service is a small Flask web application that exposes: -- `GET /` — service metadata, system/runtime info, and request details -- `GET /health` — simple health check endpoint - -This project is the foundation for future DevOps labs (Docker, CI/CD, monitoring, Kubernetes). - -## Prerequisites -- Python 3.11+ -- pip -- (Windows) Python Launcher `py` is recommended - -## Installation - -### 1) Clone repository -```bash -git clone -cd app_python -``` - -### 2) Create and activate virtual environment - -**Windows (PowerShell):** -```powershell -py -m venv venv -.\venv\Scripts\Activate.ps1 -``` - -**Windows (CMD):** -```bat -py -m venv venv -venv\Scripts\activate.bat -``` - -**Linux/Mac:** -```bash -python -m venv venv -source venv/bin/activate -``` - -### 3) Install dependencies -```bash -python -m pip install --upgrade pip -pip install -r requirements.txt -``` - -## Running the Application - -Default: -```bash -python app.py -``` - -Custom config: - -**Linux/Mac:** -```bash -HOST=127.0.0.1 PORT=3000 DEBUG=True python app.py -``` - -**Windows (PowerShell):** -```powershell -$env:HOST="127.0.0.1" -$env:PORT="3000" -$env:DEBUG="True" -python app.py -``` - -**Windows (CMD):** -```bat -set HOST=127.0.0.1 -set PORT=3000 -set DEBUG=True -python app.py -``` - -## API Endpoints -- `GET /` — service and system information -- `GET /health` — health check - -Examples: -```bash -curl 
http://127.0.0.1:5000/ -curl http://127.0.0.1:5000/health -``` - -Pretty output: -```bash -curl http://127.0.0.1:5000/ | python -m json.tool -``` - -## Configuration - -| Variable | Default | Description | -|----------|---------|-------------| -| HOST | 0.0.0.0 | Bind address | -| PORT | 5000 | HTTP port | -| DEBUG | False | Flask debug mode | - -## Docker - -This application can also be built and run as a Docker container. - -### Build (local) -Pattern: -```bash -docker build -t : . -``` - -### Run -Pattern: -```bash -docker run --rm -p :5000 --name : -``` - -Then test: -```bash -curl http://127.0.0.1:/ -curl http://127.0.0.1:/health -``` - -### Pull from Docker Hub -Pattern: -```bash -docker pull /: -docker run --rm -p :5000 /: -``` - -> Note (Windows PowerShell): `curl` is an alias for `Invoke-WebRequest`. -> For classic curl behavior, use `curl.exe`. - -## Testing -Install dev dependencies: -- python -m pip install -r requirements-dev.txt - -Run tests: -- pytest - +[![Python CI (tests + docker)](https://github.com/Cdeth567/DevOps-Core-Course/actions/workflows/python-ci.yml/badge.svg?branch=lab03)](https://github.com/Cdeth567/DevOps-Core-Course/actions/workflows/python-ci.yml) + +# DevOps Info Service + +## Overview +DevOps Info Service is a small Flask web application that exposes: +- `GET /` — service metadata, system/runtime info, and request details +- `GET /health` — simple health check endpoint + +This project is the foundation for future DevOps labs (Docker, CI/CD, monitoring, Kubernetes). 
+ +## Prerequisites +- Python 3.11+ +- pip +- (Windows) Python Launcher `py` is recommended + +## Installation + +### 1) Clone repository +```bash +git clone +cd app_python +``` + +### 2) Create and activate virtual environment + +**Windows (PowerShell):** +```powershell +py -m venv venv +.\venv\Scripts\Activate.ps1 +``` + +**Windows (CMD):** +```bat +py -m venv venv +venv\Scripts\activate.bat +``` + +**Linux/Mac:** +```bash +python -m venv venv +source venv/bin/activate +``` + +### 3) Install dependencies +```bash +python -m pip install --upgrade pip +pip install -r requirements.txt +``` + +## Running the Application + +Default: +```bash +python app.py +``` + +Custom config: + +**Linux/Mac:** +```bash +HOST=127.0.0.1 PORT=3000 DEBUG=True python app.py +``` + +**Windows (PowerShell):** +```powershell +$env:HOST="127.0.0.1" +$env:PORT="3000" +$env:DEBUG="True" +python app.py +``` + +**Windows (CMD):** +```bat +set HOST=127.0.0.1 +set PORT=3000 +set DEBUG=True +python app.py +``` + +## API Endpoints +- `GET /` — service and system information +- `GET /health` — health check + +Examples: +```bash +curl http://127.0.0.1:5000/ +curl http://127.0.0.1:5000/health +``` + +Pretty output: +```bash +curl http://127.0.0.1:5000/ | python -m json.tool +``` + +## Configuration + +| Variable | Default | Description | +|----------|---------|-------------| +| HOST | 0.0.0.0 | Bind address | +| PORT | 5000 | HTTP port | +| DEBUG | False | Flask debug mode | + +## Docker + +This application can also be built and run as a Docker container. + +### Build (local) +Pattern: +```bash +docker build -t : . +``` + +### Run +Pattern: +```bash +docker run --rm -p :5000 --name : +``` + +Then test: +```bash +curl http://127.0.0.1:/ +curl http://127.0.0.1:/health +``` + +### Pull from Docker Hub +Pattern: +```bash +docker pull /: +docker run --rm -p :5000 /: +``` + +> Note (Windows PowerShell): `curl` is an alias for `Invoke-WebRequest`. +> For classic curl behavior, use `curl.exe`. 
+ +## Testing +Install dev dependencies: +- python -m pip install -r requirements-dev.txt + +Run tests: +- pytest + diff --git a/app_python/app.py b/app_python/app.py index e42a686025..e05047b8c4 100644 --- a/app_python/app.py +++ b/app_python/app.py @@ -1,118 +1,118 @@ -import os -import socket -import platform -import logging -from datetime import datetime, timezone -from flask import Flask, jsonify, request - -logging.basicConfig( - level=logging.INFO, - format='%(asctime)s - %(name)s - %(levelname)s - %(message)s' -) -logger = logging.getLogger(__name__) - -app = Flask(__name__) - -# Configuration -HOST = os.getenv('HOST', '0.0.0.0') -PORT = int(os.getenv('PORT', 5000)) -DEBUG = os.getenv('DEBUG', 'False').lower() == 'true' - -# Application start time -START_TIME = datetime.now(timezone.utc) - -def get_uptime(): - """Calculation of the application's operating time.""" - delta = datetime.now(timezone.utc) - START_TIME - seconds = int(delta.total_seconds()) - hours = seconds // 3600 - minutes = (seconds % 3600) // 60 - return { - 'seconds': seconds, - 'human': f"{hours} hours, {minutes} minutes" - } - -def get_system_info(): - """Collect system information.""" - return { - 'hostname': socket.gethostname(), - 'platform': platform.system(), - 'platform_version': get_platform_version(), - 'architecture': platform.machine(), - 'cpu_count': os.cpu_count(), - 'python_version': platform.python_version() - } - -@app.route('/') -def index(): - """Main endpoint - service and system information.""" - uptime = get_uptime() - - response = { - 'service': { - 'name': 'devops-info-service', - 'version': '1.0.0', - 'description': 'DevOps course info service', - 'framework': 'Flask' - }, - 'system': get_system_info(), - 'runtime': { - 'uptime_seconds': uptime['seconds'], - 'uptime_human': uptime['human'], - 'current_time': datetime.now(timezone.utc).isoformat(timespec="milliseconds").replace("+00:00", "Z"), - 'timezone': 'UTC' - }, - 'request': { - 'client_ip': 
request.remote_addr, - 'user_agent': request.headers.get('User-Agent'), - 'method': request.method, - 'path': request.path - }, - 'endpoints': [ - {'path': '/', 'method': 'GET', 'description': 'Service information'}, - {'path': '/health', 'method': 'GET', 'description': 'Health check'} - ] - } - - logger.info("Request %s %s from %s", request.method, request.path, request.remote_addr) - return jsonify(response) - -@app.route('/health') -def health(): - """Health check endpoint for monitoring.""" - logger.info("Request %s %s from %s", request.method, request.path, request.remote_addr) - return jsonify({ - 'status': 'healthy', - 'timestamp': datetime.now(timezone.utc).isoformat(timespec="milliseconds").replace("+00:00", "Z"), - 'uptime_seconds': get_uptime()['seconds'] - }) - -@app.errorhandler(404) -def not_found(error): - return jsonify({ - 'error': 'Not Found', - 'message': 'Endpoint does not exist' - }), 404 - -@app.errorhandler(500) -def internal_error(error): - return jsonify({ - 'error': 'Internal Server Error', - 'message': 'An unexpected error occurred' - }), 500 - -def get_platform_version(): - """Return a platform version.""" - try: - if hasattr(platform, "freedesktop_os_release"): - info = platform.freedesktop_os_release() - if info.get("PRETTY_NAME"): - return info["PRETTY_NAME"] - except Exception: - pass - return platform.platform() - - -if __name__ == '__main__': - logger.info(f'Starting DevOps Info Service on {HOST}:{PORT}') +import os +import socket +import platform +import logging +from datetime import datetime, timezone +from flask import Flask, jsonify, request + +logging.basicConfig( + level=logging.INFO, + format='%(asctime)s - %(name)s - %(levelname)s - %(message)s' +) +logger = logging.getLogger(__name__) + +app = Flask(__name__) + +# Configuration +HOST = os.getenv('HOST', '0.0.0.0') +PORT = int(os.getenv('PORT', 5000)) +DEBUG = os.getenv('DEBUG', 'False').lower() == 'true' + +# Application start time +START_TIME = datetime.now(timezone.utc) 
+ +def get_uptime(): + """Calculation of the application's operating time.""" + delta = datetime.now(timezone.utc) - START_TIME + seconds = int(delta.total_seconds()) + hours = seconds // 3600 + minutes = (seconds % 3600) // 60 + return { + 'seconds': seconds, + 'human': f"{hours} hours, {minutes} minutes" + } + +def get_system_info(): + """Collect system information.""" + return { + 'hostname': socket.gethostname(), + 'platform': platform.system(), + 'platform_version': get_platform_version(), + 'architecture': platform.machine(), + 'cpu_count': os.cpu_count(), + 'python_version': platform.python_version() + } + +@app.route('/') +def index(): + """Main endpoint - service and system information.""" + uptime = get_uptime() + + response = { + 'service': { + 'name': 'devops-info-service', + 'version': '1.0.0', + 'description': 'DevOps course info service', + 'framework': 'Flask' + }, + 'system': get_system_info(), + 'runtime': { + 'uptime_seconds': uptime['seconds'], + 'uptime_human': uptime['human'], + 'current_time': datetime.now(timezone.utc).isoformat(timespec="milliseconds").replace("+00:00", "Z"), + 'timezone': 'UTC' + }, + 'request': { + 'client_ip': request.remote_addr, + 'user_agent': request.headers.get('User-Agent'), + 'method': request.method, + 'path': request.path + }, + 'endpoints': [ + {'path': '/', 'method': 'GET', 'description': 'Service information'}, + {'path': '/health', 'method': 'GET', 'description': 'Health check'} + ] + } + + logger.info("Request %s %s from %s", request.method, request.path, request.remote_addr) + return jsonify(response) + +@app.route('/health') +def health(): + """Health check endpoint for monitoring.""" + logger.info("Request %s %s from %s", request.method, request.path, request.remote_addr) + return jsonify({ + 'status': 'healthy', + 'timestamp': datetime.now(timezone.utc).isoformat(timespec="milliseconds").replace("+00:00", "Z"), + 'uptime_seconds': get_uptime()['seconds'] + }) + +@app.errorhandler(404) +def 
not_found(error): + return jsonify({ + 'error': 'Not Found', + 'message': 'Endpoint does not exist' + }), 404 + +@app.errorhandler(500) +def internal_error(error): + return jsonify({ + 'error': 'Internal Server Error', + 'message': 'An unexpected error occurred' + }), 500 + +def get_platform_version(): + """Return a platform version.""" + try: + if hasattr(platform, "freedesktop_os_release"): + info = platform.freedesktop_os_release() + if info.get("PRETTY_NAME"): + return info["PRETTY_NAME"] + except Exception: + pass + return platform.platform() + + +if __name__ == '__main__': + logger.info(f'Starting DevOps Info Service on {HOST}:{PORT}') app.run(host=HOST, port=PORT, debug=DEBUG) \ No newline at end of file diff --git a/app_python/docs/LAB01.md b/app_python/docs/LAB01.md index 909fcf5ec5..ff0d6e655f 100644 --- a/app_python/docs/LAB01.md +++ b/app_python/docs/LAB01.md @@ -1,168 +1,168 @@ -# LAB01 — DevOps Info Service (Python) - -## 1. Framework Selection - -**Chosen framework:** Flask - -### Why Flask -- **Lightweight and simple**: perfect for a small service with 2 endpoints. -- **Fast to start**: minimal boilerplate, easy routing. -- **Good for DevOps labs**: focus stays on environment/configuration, containerization and CI/CD. - -### Comparison - -| Framework | Pros | Cons | Decision | -|----------|------|------|----------| -| Flask | Simple, lightweight, flexible | Fewer built-in features than Django/FastAPI | **Chosen** | -| FastAPI | Async support, automatic OpenAPI docs, modern typing | More concepts (Pydantic, async) for beginners | Not chosen | -| Django | Full-featured framework (ORM, admin, auth) | Heavy/overkill for 2 simple endpoints | Not chosen | - -## 2. Best Practices Applied - -### 2.1 Clean Code Organization -**What:** Logic is separated into small functions: `get_uptime()` and `get_system_info()`. - -**Why it matters:** Improves readability, reuse, and makes testing easier (Lab 3). 
- -**Code example:** -```python -START_TIME = datetime.now(timezone.utc) - -def get_uptime(): - delta = datetime.now(timezone.utc) - START_TIME - seconds = int(delta.total_seconds()) - hours = seconds // 3600 - minutes = (seconds % 3600) // 60 - return {"seconds": seconds, "human": f"{hours} hours, {minutes} minutes"} -``` - -### 2.2 Configuration via Environment Variables -**What:** App settings are controlled by env vars with defaults. - -**Why it matters:** Makes the application portable across environments (local, Docker, Kubernetes). - -**Code example:** -```python -HOST = os.getenv("HOST", "0.0.0.0") -PORT = int(os.getenv("PORT", 5000)) -DEBUG = os.getenv("DEBUG", "False").lower() == "true" -``` - -### 2.3 Error Handling (JSON Responses) -**What:** Custom JSON handlers for common errors (404, 500). - -**Why it matters:** API stays consistent (always JSON), easier monitoring and debugging. - -**Code example:** -```python -@app.errorhandler(404) -def not_found(error): - return jsonify({"error": "Not Found", "message": "Endpoint does not exist"}), 404 -``` - -### 2.4 Logging -**What:** Logging is configured with timestamps and log levels. - -**Why it matters:** Logs are essential for troubleshooting, monitoring, and production readiness. - -**Code example:** -```python -logging.basicConfig( - level=logging.INFO, - format="%(asctime)s - %(name)s - %(levelname)s - %(message)s" -) -logger = logging.getLogger(__name__) - -logger.info("Request %s %s from %s", request.method, request.path, request.remote_addr) -``` - -## 3. API Documentation - -> Note: In my local environment I ran the service on port **8080** (via `PORT=8080`). -> Default port in code is **5000** when `PORT` is not set. - -### 3.1 GET / -**Purpose:** Returns service metadata, system information, runtime details, request info, and available endpoints. 
- -**Request example:** -```bash -curl http://127.0.0.1:8080/ -``` - -**Response example (shortened):** -```json -{ - "service": { - "name": "devops-info-service", - "version": "1.0.0", - "description": "DevOps course info service", - "framework": "Flask" - }, - "system": { - "hostname": "my-host", - "platform": "Windows", - "architecture": "AMD64", - "cpu_count": 20, - "python_version": "3.14.0" - }, - "runtime": { - "uptime_seconds": 1302, - "timezone": "UTC" - }, - "request": { - "client_ip": "127.0.0.1", - "method": "GET", - "path": "/" - } -} -``` - -### 3.2 GET /health -**Purpose:** Health check endpoint for monitoring (used later for Kubernetes probes). - -**Request example:** -```bash -curl -i http://127.0.0.1:8080/health -``` - -**Response example:** -```json -{ - "status": "healthy", - "timestamp": "2026-01-28T13:41:14.751Z", - "uptime_seconds": 918 -} -``` - -### 3.3 Testing Commands - -**Pretty-printed JSON output:** -```bash -curl -s http://127.0.0.1:8080/ | python -m json.tool -``` - -## 4. Testing Evidence - -Screenshots are included in `app_python/docs/screenshots/`: - -- `01-main-endpoint.png` — Main endpoint (`GET /`) showing complete JSON output -- `02-health-check.png` — Health endpoint (`GET /health`) including HTTP 200 status -- `03-formatted-output.png` — Pretty-printed JSON output from terminal (`curl -s ... | python -m json.tool`) - -## 5. Challenges & Solutions - -**Problem:** On Windows, `python app.py` did not work, while `py app.py` worked. - -**Solution:** -- Created and activated a virtual environment using: - ```bash - py -m venv venv - ``` -- After activation, `python` points to the venv interpreter. -- Disabled Windows Store Python execution aliases (App Execution Aliases) so `python` runs the correct interpreter. - -## 6. GitHub Community - -**Why starring repositories matters:** Stars increase visibility of useful projects and are a convenient way to bookmark tools and libraries; they also encourage maintainers. 
- -**Why following developers helps:** Following the professor, TAs, and classmates supports collaboration, helps discover solutions and best practices through activity feeds, and builds a professional network. +# LAB01 — DevOps Info Service (Python) + +## 1. Framework Selection + +**Chosen framework:** Flask + +### Why Flask +- **Lightweight and simple**: perfect for a small service with 2 endpoints. +- **Fast to start**: minimal boilerplate, easy routing. +- **Good for DevOps labs**: focus stays on environment/configuration, containerization and CI/CD. + +### Comparison + +| Framework | Pros | Cons | Decision | +|----------|------|------|----------| +| Flask | Simple, lightweight, flexible | Fewer built-in features than Django/FastAPI | **Chosen** | +| FastAPI | Async support, automatic OpenAPI docs, modern typing | More concepts (Pydantic, async) for beginners | Not chosen | +| Django | Full-featured framework (ORM, admin, auth) | Heavy/overkill for 2 simple endpoints | Not chosen | + +## 2. Best Practices Applied + +### 2.1 Clean Code Organization +**What:** Logic is separated into small functions: `get_uptime()` and `get_system_info()`. + +**Why it matters:** Improves readability, reuse, and makes testing easier (Lab 3). + +**Code example:** +```python +START_TIME = datetime.now(timezone.utc) + +def get_uptime(): + delta = datetime.now(timezone.utc) - START_TIME + seconds = int(delta.total_seconds()) + hours = seconds // 3600 + minutes = (seconds % 3600) // 60 + return {"seconds": seconds, "human": f"{hours} hours, {minutes} minutes"} +``` + +### 2.2 Configuration via Environment Variables +**What:** App settings are controlled by env vars with defaults. + +**Why it matters:** Makes the application portable across environments (local, Docker, Kubernetes). 
+ +**Code example:** +```python +HOST = os.getenv("HOST", "0.0.0.0") +PORT = int(os.getenv("PORT", 5000)) +DEBUG = os.getenv("DEBUG", "False").lower() == "true" +``` + +### 2.3 Error Handling (JSON Responses) +**What:** Custom JSON handlers for common errors (404, 500). + +**Why it matters:** API stays consistent (always JSON), easier monitoring and debugging. + +**Code example:** +```python +@app.errorhandler(404) +def not_found(error): + return jsonify({"error": "Not Found", "message": "Endpoint does not exist"}), 404 +``` + +### 2.4 Logging +**What:** Logging is configured with timestamps and log levels. + +**Why it matters:** Logs are essential for troubleshooting, monitoring, and production readiness. + +**Code example:** +```python +logging.basicConfig( + level=logging.INFO, + format="%(asctime)s - %(name)s - %(levelname)s - %(message)s" +) +logger = logging.getLogger(__name__) + +logger.info("Request %s %s from %s", request.method, request.path, request.remote_addr) +``` + +## 3. API Documentation + +> Note: In my local environment I ran the service on port **8080** (via `PORT=8080`). +> Default port in code is **5000** when `PORT` is not set. + +### 3.1 GET / +**Purpose:** Returns service metadata, system information, runtime details, request info, and available endpoints. + +**Request example:** +```bash +curl http://127.0.0.1:8080/ +``` + +**Response example (shortened):** +```json +{ + "service": { + "name": "devops-info-service", + "version": "1.0.0", + "description": "DevOps course info service", + "framework": "Flask" + }, + "system": { + "hostname": "my-host", + "platform": "Windows", + "architecture": "AMD64", + "cpu_count": 20, + "python_version": "3.14.0" + }, + "runtime": { + "uptime_seconds": 1302, + "timezone": "UTC" + }, + "request": { + "client_ip": "127.0.0.1", + "method": "GET", + "path": "/" + } +} +``` + +### 3.2 GET /health +**Purpose:** Health check endpoint for monitoring (used later for Kubernetes probes). 
+ +**Request example:** +```bash +curl -i http://127.0.0.1:8080/health +``` + +**Response example:** +```json +{ + "status": "healthy", + "timestamp": "2026-01-28T13:41:14.751Z", + "uptime_seconds": 918 +} +``` + +### 3.3 Testing Commands + +**Pretty-printed JSON output:** +```bash +curl -s http://127.0.0.1:8080/ | python -m json.tool +``` + +## 4. Testing Evidence + +Screenshots are included in `app_python/docs/screenshots/`: + +- `01-main-endpoint.png` — Main endpoint (`GET /`) showing complete JSON output +- `02-health-check.png` — Health endpoint (`GET /health`) including HTTP 200 status +- `03-formatted-output.png` — Pretty-printed JSON output from terminal (`curl -s ... | python -m json.tool`) + +## 5. Challenges & Solutions + +**Problem:** On Windows, `python app.py` did not work, while `py app.py` worked. + +**Solution:** +- Created and activated a virtual environment using: + ```bash + py -m venv venv + ``` +- After activation, `python` points to the venv interpreter. +- Disabled Windows Store Python execution aliases (App Execution Aliases) so `python` runs the correct interpreter. + +## 6. GitHub Community + +**Why starring repositories matters:** Stars increase visibility of useful projects and are a convenient way to bookmark tools and libraries; they also encourage maintainers. + +**Why following developers helps:** Following the professor, TAs, and classmates supports collaboration, helps discover solutions and best practices through activity feeds, and builds a professional network. diff --git a/app_python/docs/LAB02.md b/app_python/docs/LAB02.md index 9ed13b479c..b631f739f9 100644 --- a/app_python/docs/LAB02.md +++ b/app_python/docs/LAB02.md @@ -1,235 +1,235 @@ -# LAB02 — Docker Containerization (Python) - -## 1. Docker Best Practices Applied - -### 1.1 Fixed base image version (pinned tag) -**What I did:** Used `python:3.13-slim` in `Dockerfile`. -**Why it matters:** A fixed base image version makes builds reproducible and predictable. 
The `slim` variant reduces image size compared to full images, speeds up pulls/builds, and reduces the attack surface. - -**Snippet:** -```dockerfile -FROM python:3.13-slim -``` - -### 1.2 Non-root user (mandatory) -**What I did:** Created a system user/group `app` and switched to it via `USER app`. -**Why it matters:** Running as non-root limits privileges inside the container. If the app is compromised, the attacker has fewer permissions, which is a baseline production security practice. - -**Snippet:** -```dockerfile -RUN addgroup --system app && adduser --system --ingroup app app -USER app -``` - -### 1.3 Layer caching (dependencies before application code) -**What I did:** Copied `requirements.txt` and installed dependencies **before** copying `app.py`. -**Why it matters:** Docker caches layers. If only source code changes, the dependency layer stays cached and rebuilds are much faster. - -**Snippet:** -```dockerfile -COPY requirements.txt . -RUN pip install --no-cache-dir -r requirements.txt -COPY app.py . -``` - -### 1.4 Minimal copy + `.dockerignore` -**What I did:** Copied only runtime-needed files into the image (`requirements.txt`, `app.py`) and used `.dockerignore` to exclude unnecessary files (venv, docs, git, caches). -**Why it matters:** Smaller build context → faster build. Smaller final image → faster push/pull and reduced risk of leaking development artifacts into production images. - ---- - -## 2. 
Image Information & Decisions - -### 2.1 Base image decision -**Chosen:** `python:3.13-slim` -**Justification:** -- Modern Python runtime version for container execution -- `slim` gives good balance of small size + compatibility (Debian-based) -- Avoids common issues seen with `alpine` images (musl / Python wheels) - -### 2.2 Final image size and assessment -Output: -```text -IMAGE ID DISK USAGE CONTENT SIZE EXTRA -devops-info-service:lab02 dc2fdac78d0d 182MB 44.4MB -``` - -**Assessment:** Content size (~44.4MB) is reasonable for a small Flask app running on Debian-slim. Disk usage is higher due to local storage/overhead, but still acceptable for this lab. Further reductions are possible (e.g., using a production WSGI server, minimizing base layers, or alternative minimal images), but this already follows recommended best practices for beginner containerization. - -### 2.3 Layer structure explanation -High-level layers: -1. Base image `python:3.13-slim` -2. Environment variables for predictable Python behavior -3. Create non-root user/group -4. Set working directory -5. Copy and install dependencies (`requirements.txt` → `pip install`) -6. Copy application code (`app.py`) -7. Switch to non-root user -8. Expose port (documentation) -9. Start application with `CMD` - -**Evidence (`docker history`):** -```text -IMAGE CREATED CREATED BY SIZE COMMENT -dc2fdac78d0d 47 minutes ago CMD ["python" "app.py"] 0B buildkit.dockerfile.v0 - 47 minutes ago EXPOSE [5000/tcp] 0B buildkit.dockerfile.v0 - 47 minutes ago USER app 0B buildkit.dockerfile.v0 - 47 minutes ago COPY app.py . # buildkit 12.3kB buildkit.dockerfile.v0 - 47 minutes ago RUN /bin/sh -c pip install --no-cache-dir -r… 5.53MB buildkit.dockerfile.v0 - 47 minutes ago COPY requirements.txt . 
# buildkit 12.3kB buildkit.dockerfile.v0 - 47 minutes ago WORKDIR /app 8.19kB buildkit.dockerfile.v0 - 47 minutes ago RUN /bin/sh -c addgroup --system app && addu… 45.1kB buildkit.dockerfile.v0 - 47 minutes ago ENV PYTHONDONTWRITEBYTECODE=1 PYTHONUNBUFFER… 0B buildkit.dockerfile.v0 -... -``` - -### 2.4 Optimization choices -- `python:3.13-slim` for smaller base -- `pip install --no-cache-dir` to avoid storing pip cache inside the image -- Copy only necessary runtime files (no repo-wide `COPY . .`) -- `.dockerignore` reduces build context size and avoids shipping `venv/`, `.git/`, `docs/`, caches - ---- - -## 3. Build & Run Process - -### 3.1 Build output -Command: -```bash -docker build -t devops-info-service:lab02 . -``` - -Terminal output (excerpt): -```text -[+] Building 75.9s (15/15) FINISHED - => [internal] load build definition from Dockerfile - => [internal] load metadata for docker.io/library/python:3.13-slim - => [internal] load .dockerignore - => [1/6] FROM docker.io/library/python:3.13-slim@sha256:2b9c9803... - => [2/6] RUN addgroup --system app && adduser --system --ingroup app app - => [3/6] WORKDIR /app - => [4/6] COPY requirements.txt . - => [5/6] RUN pip install --no-cache-dir -r requirements.txt - => [6/6] COPY app.py . 
- => exporting to image - => naming to docker.io/library/devops-info-service:lab02 -``` - -### 3.2 Container run output (local image) -Command: -```bash -docker run --rm -p 8080:5000 --name devops-info devops-info-service:lab02 -``` - -Terminal output: -```text -2026-02-04 17:36:37,431 - __main__ - INFO - Starting DevOps Info Service on 0.0.0.0:5000 - * Serving Flask app 'app' - * Debug mode: off - * Running on all addresses (0.0.0.0) - * Running on http://127.0.0.1:5000 - * Running on http://172.17.0.2:5000 -Press CTRL+C to quit -``` - -**Proof container is running (`docker ps`):** -```text -CONTAINER ID IMAGE COMMAND CREATED STATUS PORTS NAMES -0012d755fc1b devops-info-service:lab02 "python app.py" 7 seconds ago Up 6 seconds 0.0.0.0:8080->5000/tcp, [::]:8080->5000/tcp devops-info -``` - -### 3.3 Endpoint testing output -Commands: -```bash -curl http://127.0.0.1:8080/ -curl http://127.0.0.1:8080/health -``` - -Expected results: -- HTTP 200 on both endpoints -- JSON payload returned -- Server header shows Werkzeug + Python 3.13.11 inside container - -Example evidence (health): -```text -StatusCode : 200 -StatusDescription : OK -Content : {"status":"healthy","timestamp":"2026-02-04T17:22:41.912Z","uptime_seconds":68} -Server : Werkzeug/3.1.5 Python/3.13.11 -``` - -### 3.4 Docker Hub push + pull verification -Login: -```text -docker login -Login Succeeded -``` - -Tagging strategy: -- `cdeth567/devops-info-service:lab02` — fixed tag for lab submission -- `cdeth567/devops-info-service:latest` — convenience tag for most recent build - -Push output: -```text -docker push cdeth567/devops-info-service:lab02 -... -lab02: digest: sha256:dc2fdac78d0d5b5e75c3da6a21682aacfdef926ff648356baf54d0437a3d81ec size: 856 - -docker push cdeth567/devops-info-service:latest -... 
-latest: digest: sha256:dc2fdac78d0d5b5e75c3da6a21682aacfdef926ff648356baf54d0437a3d81ec size: 856 -``` - -Pull verification: -```text -docker pull cdeth567/devops-info-service:lab02 -Status: Image is up to date for cdeth567/devops-info-service:lab02 -``` - -**Docker Hub repository URL:** -https://hub.docker.com/r/cdeth567/devops-info-service - ---- - -## 4. Technical Analysis - -### 4.1 Why does this Dockerfile work the way it does? -- `CMD ["python", "app.py"]` starts the app the same way as local development. -- The app binds to `0.0.0.0` by default (`HOST=0.0.0.0`), so it is reachable from outside the container. -- Port mapping `-p 8080:5000` exposes container port 5000 on host port 8080. -- Dependencies are installed from `requirements.txt` inside the image, making runtime self-contained and portable. - -### 4.2 What would happen if I changed the layer order? -If application code was copied before installing dependencies (e.g., `COPY . .` first), then every code change would invalidate the dependency layer cache and force `pip install` to run again. This would slow down rebuilds significantly. - -### 4.3 Security considerations implemented -- Non-root execution (`USER app`) -- Slim base image reduces installed packages → smaller attack surface -- `.dockerignore` prevents shipping local artifacts (venv, git metadata, docs) into the container image - -### 4.4 How does `.dockerignore` improve the build? -- Reduces build context size → faster builds -- Prevents accidental inclusion of `venv/`, `.git/`, `docs/`, caches -- Lowers risk of leaking local files into the container image - ---- - -## 5. Challenges & Solutions - -### 5.1 Port already allocated (8080) -**Issue:** While testing the Docker Hub image, Docker returned: -`Bind for 0.0.0.0:8080 failed: port is already allocated` - -**Cause:** Another running container was already mapped to host port 8080. - -**Solution:** Stopped the running container (Ctrl+C) or used a different host port mapping (e.g. 
`-p 8081:5000`). - -### 5.2 PowerShell `curl` warning -**Issue:** PowerShell shows a security warning because `curl` is an alias for `Invoke-WebRequest`. -**Solution:** Confirmed prompt once (“A” = Yes to All) and verified endpoints still return HTTP 200 with JSON. - -### 5.3 What I learned -- Dockerfile layer order strongly impacts rebuild speed due to caching. -- Running as non-root is a simple but important security requirement. -- Host port mapping requires a free port; multiple containers cannot bind the same host port simultaneously. -- `.dockerignore` is important both for performance (smaller context) and security (no accidental file leaks). +# LAB02 — Docker Containerization (Python) + +## 1. Docker Best Practices Applied + +### 1.1 Fixed base image version (pinned tag) +**What I did:** Used `python:3.13-slim` in `Dockerfile`. +**Why it matters:** A fixed base image version makes builds reproducible and predictable. The `slim` variant reduces image size compared to full images, speeds up pulls/builds, and reduces the attack surface. + +**Snippet:** +```dockerfile +FROM python:3.13-slim +``` + +### 1.2 Non-root user (mandatory) +**What I did:** Created a system user/group `app` and switched to it via `USER app`. +**Why it matters:** Running as non-root limits privileges inside the container. If the app is compromised, the attacker has fewer permissions, which is a baseline production security practice. + +**Snippet:** +```dockerfile +RUN addgroup --system app && adduser --system --ingroup app app +USER app +``` + +### 1.3 Layer caching (dependencies before application code) +**What I did:** Copied `requirements.txt` and installed dependencies **before** copying `app.py`. +**Why it matters:** Docker caches layers. If only source code changes, the dependency layer stays cached and rebuilds are much faster. + +**Snippet:** +```dockerfile +COPY requirements.txt . +RUN pip install --no-cache-dir -r requirements.txt +COPY app.py . 
+``` + +### 1.4 Minimal copy + `.dockerignore` +**What I did:** Copied only runtime-needed files into the image (`requirements.txt`, `app.py`) and used `.dockerignore` to exclude unnecessary files (venv, docs, git, caches). +**Why it matters:** Smaller build context → faster build. Smaller final image → faster push/pull and reduced risk of leaking development artifacts into production images. + +--- + +## 2. Image Information & Decisions + +### 2.1 Base image decision +**Chosen:** `python:3.13-slim` +**Justification:** +- Modern Python runtime version for container execution +- `slim` gives good balance of small size + compatibility (Debian-based) +- Avoids common issues seen with `alpine` images (musl / Python wheels) + +### 2.2 Final image size and assessment +Output: +```text +IMAGE ID DISK USAGE CONTENT SIZE EXTRA +devops-info-service:lab02 dc2fdac78d0d 182MB 44.4MB +``` + +**Assessment:** Content size (~44.4MB) is reasonable for a small Flask app running on Debian-slim. Disk usage is higher due to local storage/overhead, but still acceptable for this lab. Further reductions are possible (e.g., using a production WSGI server, minimizing base layers, or alternative minimal images), but this already follows recommended best practices for beginner containerization. + +### 2.3 Layer structure explanation +High-level layers: +1. Base image `python:3.13-slim` +2. Environment variables for predictable Python behavior +3. Create non-root user/group +4. Set working directory +5. Copy and install dependencies (`requirements.txt` → `pip install`) +6. Copy application code (`app.py`) +7. Switch to non-root user +8. Expose port (documentation) +9. 
Start application with `CMD` + +**Evidence (`docker history`):** +```text +IMAGE CREATED CREATED BY SIZE COMMENT +dc2fdac78d0d 47 minutes ago CMD ["python" "app.py"] 0B buildkit.dockerfile.v0 + 47 minutes ago EXPOSE [5000/tcp] 0B buildkit.dockerfile.v0 + 47 minutes ago USER app 0B buildkit.dockerfile.v0 + 47 minutes ago COPY app.py . # buildkit 12.3kB buildkit.dockerfile.v0 + 47 minutes ago RUN /bin/sh -c pip install --no-cache-dir -r… 5.53MB buildkit.dockerfile.v0 + 47 minutes ago COPY requirements.txt . # buildkit 12.3kB buildkit.dockerfile.v0 + 47 minutes ago WORKDIR /app 8.19kB buildkit.dockerfile.v0 + 47 minutes ago RUN /bin/sh -c addgroup --system app && addu… 45.1kB buildkit.dockerfile.v0 + 47 minutes ago ENV PYTHONDONTWRITEBYTECODE=1 PYTHONUNBUFFER… 0B buildkit.dockerfile.v0 +... +``` + +### 2.4 Optimization choices +- `python:3.13-slim` for smaller base +- `pip install --no-cache-dir` to avoid storing pip cache inside the image +- Copy only necessary runtime files (no repo-wide `COPY . .`) +- `.dockerignore` reduces build context size and avoids shipping `venv/`, `.git/`, `docs/`, caches + +--- + +## 3. Build & Run Process + +### 3.1 Build output +Command: +```bash +docker build -t devops-info-service:lab02 . +``` + +Terminal output (excerpt): +```text +[+] Building 75.9s (15/15) FINISHED + => [internal] load build definition from Dockerfile + => [internal] load metadata for docker.io/library/python:3.13-slim + => [internal] load .dockerignore + => [1/6] FROM docker.io/library/python:3.13-slim@sha256:2b9c9803... + => [2/6] RUN addgroup --system app && adduser --system --ingroup app app + => [3/6] WORKDIR /app + => [4/6] COPY requirements.txt . + => [5/6] RUN pip install --no-cache-dir -r requirements.txt + => [6/6] COPY app.py . 
+ => exporting to image + => naming to docker.io/library/devops-info-service:lab02 +``` + +### 3.2 Container run output (local image) +Command: +```bash +docker run --rm -p 8080:5000 --name devops-info devops-info-service:lab02 +``` + +Terminal output: +```text +2026-02-04 17:36:37,431 - __main__ - INFO - Starting DevOps Info Service on 0.0.0.0:5000 + * Serving Flask app 'app' + * Debug mode: off + * Running on all addresses (0.0.0.0) + * Running on http://127.0.0.1:5000 + * Running on http://172.17.0.2:5000 +Press CTRL+C to quit +``` + +**Proof container is running (`docker ps`):** +```text +CONTAINER ID IMAGE COMMAND CREATED STATUS PORTS NAMES +0012d755fc1b devops-info-service:lab02 "python app.py" 7 seconds ago Up 6 seconds 0.0.0.0:8080->5000/tcp, [::]:8080->5000/tcp devops-info +``` + +### 3.3 Endpoint testing output +Commands: +```bash +curl http://127.0.0.1:8080/ +curl http://127.0.0.1:8080/health +``` + +Expected results: +- HTTP 200 on both endpoints +- JSON payload returned +- Server header shows Werkzeug + Python 3.13.11 inside container + +Example evidence (health): +```text +StatusCode : 200 +StatusDescription : OK +Content : {"status":"healthy","timestamp":"2026-02-04T17:22:41.912Z","uptime_seconds":68} +Server : Werkzeug/3.1.5 Python/3.13.11 +``` + +### 3.4 Docker Hub push + pull verification +Login: +```text +docker login +Login Succeeded +``` + +Tagging strategy: +- `cdeth567/devops-info-service:lab02` — fixed tag for lab submission +- `cdeth567/devops-info-service:latest` — convenience tag for most recent build + +Push output: +```text +docker push cdeth567/devops-info-service:lab02 +... +lab02: digest: sha256:dc2fdac78d0d5b5e75c3da6a21682aacfdef926ff648356baf54d0437a3d81ec size: 856 + +docker push cdeth567/devops-info-service:latest +... 
+latest: digest: sha256:dc2fdac78d0d5b5e75c3da6a21682aacfdef926ff648356baf54d0437a3d81ec size: 856 +``` + +Pull verification: +```text +docker pull cdeth567/devops-info-service:lab02 +Status: Image is up to date for cdeth567/devops-info-service:lab02 +``` + +**Docker Hub repository URL:** +https://hub.docker.com/r/cdeth567/devops-info-service + +--- + +## 4. Technical Analysis + +### 4.1 Why does this Dockerfile work the way it does? +- `CMD ["python", "app.py"]` starts the app the same way as local development. +- The app binds to `0.0.0.0` by default (`HOST=0.0.0.0`), so it is reachable from outside the container. +- Port mapping `-p 8080:5000` exposes container port 5000 on host port 8080. +- Dependencies are installed from `requirements.txt` inside the image, making runtime self-contained and portable. + +### 4.2 What would happen if I changed the layer order? +If application code was copied before installing dependencies (e.g., `COPY . .` first), then every code change would invalidate the dependency layer cache and force `pip install` to run again. This would slow down rebuilds significantly. + +### 4.3 Security considerations implemented +- Non-root execution (`USER app`) +- Slim base image reduces installed packages → smaller attack surface +- `.dockerignore` prevents shipping local artifacts (venv, git metadata, docs) into the container image + +### 4.4 How does `.dockerignore` improve the build? +- Reduces build context size → faster builds +- Prevents accidental inclusion of `venv/`, `.git/`, `docs/`, caches +- Lowers risk of leaking local files into the container image + +--- + +## 5. Challenges & Solutions + +### 5.1 Port already allocated (8080) +**Issue:** While testing the Docker Hub image, Docker returned: +`Bind for 0.0.0.0:8080 failed: port is already allocated` + +**Cause:** Another running container was already mapped to host port 8080. + +**Solution:** Stopped the running container (Ctrl+C) or used a different host port mapping (e.g. 
`-p 8081:5000`). + +### 5.2 PowerShell `curl` warning +**Issue:** PowerShell shows a security warning because `curl` is an alias for `Invoke-WebRequest`. +**Solution:** Confirmed prompt once (“A” = Yes to All) and verified endpoints still return HTTP 200 with JSON. + +### 5.3 What I learned +- Dockerfile layer order strongly impacts rebuild speed due to caching. +- Running as non-root is a simple but important security requirement. +- Host port mapping requires a free port; multiple containers cannot bind the same host port simultaneously. +- `.dockerignore` is important both for performance (smaller context) and security (no accidental file leaks). diff --git a/app_python/docs/LAB03.md b/app_python/docs/LAB03.md index eeab592380..2256bca136 100644 --- a/app_python/docs/LAB03.md +++ b/app_python/docs/LAB03.md @@ -1,299 +1,299 @@ -# LAB03 — Continuous Integration (CI/CD) - -Repository: `Cdeth567/DevOps-Core-Course` -Branch: `lab03` -App: `app_python` (DevOps Info Service) - ---- - -## 1. Overview - -### 1.1 Testing framework choice -**Framework:** `pytest 8.x` - -**Why pytest:** -- Minimal and readable test syntax (simple `assert` statements) -- Great ecosystem and easy CI integration -- Widely used industry standard for Python services - -**Dev dependencies file:** `app_python/requirements-dev.txt` (contains `pytest==8.3.4` and `ruff==0.9.6`). 
- ---- - -### 1.2 What tests cover -Tests are located in: `app_python/tests/test_app.py` - -Covered behavior: -- **`GET /`** - - Returns HTTP 200 - - Returns JSON with expected structure/fields -- **`GET /health`** - - Returns HTTP 200 - - Returns JSON with `"status": "healthy"` and expected keys -- Includes multiple assertions → not just "smoke tests" - ---- - -### 1.3 CI workflow trigger configuration -Workflow file: `.github/workflows/python-ci.yml` -Workflow name: **Python CI (tests + docker)** - -Triggers: -- **Push** to branches: `master`, `lab03` -- **PRs** targeting `master` -- **Path filters**: runs only if something changed in: - - `app_python/**` - - `.github/workflows/python-ci.yml` - -Why this matters: -- In monorepos, path filters prevent wasting CI minutes when unrelated files change. -- PR checks still run for code changes that matter. - ---- - -### 1.4 Versioning strategy (Docker images) -**Chosen strategy:** **CalVer** (Calendar Versioning) - -Implementation: -- CI generates version on build: `YYYY.MM.DD` (UTC time) - -Docker tags produced by CI: -- `cdeth567/devops-info-service:` -- `cdeth567/devops-info-service:latest` - -Why CalVer is a good fit here: -- This is a service with frequent small changes. -- It’s easy to understand which build is “today’s”. -- No need to manually manage SemVer releases for a lab service. - ---- - -## 2. Workflow Evidence - -### 2.1 Local installation & test evidence (terminal output) - -Install dev deps: -```text -py -m pip install -r requirements-dev.txt -Successfully installed ... pytest-8.3.4 -``` - -Install runtime deps: -```text -py -m pip install -r requirements.txt -Successfully installed Flask-3.1.0 ... Werkzeug-3.1.5 ... -``` - -Run tests (note about Windows PATH): -```text -pytest : The term 'pytest' is not recognized ... -py -m pytest -q -.... [100%] -4 passed in 0.37s -``` - -**Explanation:** `pytest.exe` was installed into Python Scripts directory not included in PATH. 
Running `py -m pytest` executes pytest as a module and works reliably on Windows. - ---- - -### 2.2 Linting evidence (ruff) - -After installing `ruff` to dev requirements: -```text -py -m pip install -r requirements-dev.txt -Successfully installed ruff-0.9.6 -``` - -Lint run (correct working directory): -```text -py -m ruff check . -All checks passed! -``` - -Note: The earlier error: -```text -py -m ruff check app_python -app_python:1:1: E902 ... file not found -``` -happened because the command was run inside the `app_python/` directory; there is no nested `app_python/app_python` path. Fix was to lint `.`. - ---- - -### 2.3 CI workflow success evidence -GitHub Actions page shows successful runs on `lab03` (green check). -Badge is green for `lab03` branch. - -Workflow URL (Actions): -- `https://github.com/Cdeth567/DevOps-Core-Course/actions/workflows/python-ci.yml` - -Status badge in `app_python/README.md`: -```markdown -[![Python CI (tests + docker)](https://github.com/Cdeth567/DevOps-Core-Course/actions/workflows/python-ci.yml/badge.svg?branch=lab03)](https://github.com/Cdeth567/DevOps-Core-Course/actions/workflows/python-ci.yml) -``` - ---- - -### 2.4 Docker Hub evidence -Docker Hub repository: -- `https://hub.docker.com/r/cdeth567/devops-info-service` - -CI pushes images with two tags: -- daily CalVer tag (e.g., `2026.02.11` format) -- `latest` - ---- - -## 3. 
Best Practices Implemented (CI + Security) - -### 3.1 Dependency caching (pip) -Implemented using `actions/setup-python@v5` built-in caching: -```yaml -with: - cache: "pip" - cache-dependency-path: | - app_python/requirements.txt - app_python/requirements-dev.txt -``` - -Why it matters: -- Cache hits skip downloading packages again -- Faster workflows on repeated runs (especially after first successful run) - -How to measure: -- Compare “Install dependencies” step time on first run vs next run -- GitHub Actions logs will show whether cache was restored - ---- - -### 3.2 Matrix builds (multiple Python versions) -Tests run on **Python 3.12 and 3.13** via matrix: -```yaml -matrix: - python-version: ["3.12", "3.13"] -``` - -Why it matters: -- Detects version-specific problems early (compatibility across supported versions) -- Good practice for production Python services - ---- - -### 3.3 Fail-fast in matrix -Enabled: -```yaml -fail-fast: true -``` - -Why it matters: -- Stops wasting CI minutes once a matrix job fails -- Speeds feedback loop (you see failure sooner) - ---- - -### 3.4 Concurrency control -Implemented: -```yaml -concurrency: - group: python-ci-${{ github.ref }} - cancel-in-progress: true -``` - -Why it matters: -- If you push many commits quickly, old runs are canceled -- Avoids queue buildup and wasted CI time - ---- - -### 3.5 Conditional Docker push (protect secrets + reduce risk) -Docker build/push runs only on **push** to `master` or `lab03`: -```yaml -if: github.event_name == 'push' && (github.ref == 'refs/heads/master' || github.ref == 'refs/heads/lab03') -``` - -Why it matters: -- Prevents Docker pushes from PRs (especially forks) -- Helps avoid leaking secrets in untrusted contexts -- Standard CI/CD safety practice - ---- - -### 3.6 Snyk security scanning -Implemented using **Snyk CLI** in the runner environment: -```yaml -- name: Install Snyk CLI - run: npm install -g snyk - -- name: Snyk scan (dependencies) - continue-on-error: true - env: - 
SNYK_TOKEN: ${{ secrets.SNYK_TOKEN }} - run: | - cd app_python - snyk test --severity-threshold=high --file=requirements.txt -``` - -Why it matters: -- Detects known vulnerable dependencies early in pipeline -- Gives visibility into supply-chain security risks - -Decision: -- `continue-on-error: true` used so CI doesn’t fully block while still reporting vulnerabilities (appropriate for a lab; in production you might fail builds on high/critical). - ---- - -## 4. Key Decisions - -### 4.1 Versioning strategy -**CalVer** used for Docker images (daily tags). -Rationale: simple automation, no manual release tagging required. - -### 4.2 Docker tags produced -- `/devops-info-service:` -- `/devops-info-service:latest` - -### 4.3 Workflow triggers -- Push/PR triggers with **path filters** ensure workflow runs only for Python app + workflow changes. - -### 4.4 Test coverage -- Endpoints `/` and `/health` are tested via Flask test client (no need to start a real server in CI). -- Coverage tool (pytest-cov) was **not added** in this submission (bonus task), but tests provide functional coverage for both endpoints. - ---- - -## 5. Challenges & Fixes - -### 5.1 `pytest` not recognized on Windows -**Problem:** `pytest` command not found because Python Scripts directory isn’t in PATH. -**Fix:** Use `py -m pytest` which runs pytest as a module. - -### 5.2 `ruff` not recognized / wrong path -**Problem 1:** `ruff` not found → it wasn’t installed yet. -**Fix:** Added `ruff==0.9.6` to `requirements-dev.txt`. - -**Problem 2:** `ruff check app_python` from inside `app_python/` caused file-not-found. -**Fix:** Run `py -m ruff check .` from the `app_python/` directory. - -### 5.3 `.github/workflows` location mistake -Initially workflow file was placed under `app_python/.github/workflows/`, which GitHub Actions does **not** detect. -Fix: moved workflow to repo root: `.github/workflows/python-ci.yml`. - -### 5.4 Snyk scanning issues -There were failures while adjusting working directories. 
-Final solution: run Snyk CLI and `cd app_python` before scanning requirements. - ---- - -## 6. Files Changed / Added (Summary) - -- `.github/workflows/python-ci.yml` — CI workflow (tests + lint + docker push + Snyk) -- `app_python/tests/test_app.py` — pytest unit tests -- `app_python/requirements-dev.txt` — dev dependencies (`pytest`, `ruff`) -- `app_python/README.md` — added CI status badge + testing instructions -- `app_python/docs/LAB03.md` — this documentation - ---- - -## Appendix — Workflow (reference) -Key jobs: -- `test-and-lint` (matrix: 3.12 + 3.13): install deps, ruff lint, pytest, Snyk scan -- `docker-build-and-push`: build + push to Docker Hub with CalVer + latest +# LAB03 — Continuous Integration (CI/CD) + +Repository: `Cdeth567/DevOps-Core-Course` +Branch: `lab03` +App: `app_python` (DevOps Info Service) + +--- + +## 1. Overview + +### 1.1 Testing framework choice +**Framework:** `pytest 8.x` + +**Why pytest:** +- Minimal and readable test syntax (simple `assert` statements) +- Great ecosystem and easy CI integration +- Widely used industry standard for Python services + +**Dev dependencies file:** `app_python/requirements-dev.txt` (contains `pytest==8.3.4` and `ruff==0.9.6`). 
+ +--- + +### 1.2 What tests cover +Tests are located in: `app_python/tests/test_app.py` + +Covered behavior: +- **`GET /`** + - Returns HTTP 200 + - Returns JSON with expected structure/fields +- **`GET /health`** + - Returns HTTP 200 + - Returns JSON with `"status": "healthy"` and expected keys +- Includes multiple assertions → not just "smoke tests" + +--- + +### 1.3 CI workflow trigger configuration +Workflow file: `.github/workflows/python-ci.yml` +Workflow name: **Python CI (tests + docker)** + +Triggers: +- **Push** to branches: `master`, `lab03` +- **PRs** targeting `master` +- **Path filters**: runs only if something changed in: + - `app_python/**` + - `.github/workflows/python-ci.yml` + +Why this matters: +- In monorepos, path filters prevent wasting CI minutes when unrelated files change. +- PR checks still run for code changes that matter. + +--- + +### 1.4 Versioning strategy (Docker images) +**Chosen strategy:** **CalVer** (Calendar Versioning) + +Implementation: +- CI generates version on build: `YYYY.MM.DD` (UTC time) + +Docker tags produced by CI: +- `cdeth567/devops-info-service:` +- `cdeth567/devops-info-service:latest` + +Why CalVer is a good fit here: +- This is a service with frequent small changes. +- It’s easy to understand which build is “today’s”. +- No need to manually manage SemVer releases for a lab service. + +--- + +## 2. Workflow Evidence + +### 2.1 Local installation & test evidence (terminal output) + +Install dev deps: +```text +py -m pip install -r requirements-dev.txt +Successfully installed ... pytest-8.3.4 +``` + +Install runtime deps: +```text +py -m pip install -r requirements.txt +Successfully installed Flask-3.1.0 ... Werkzeug-3.1.5 ... +``` + +Run tests (note about Windows PATH): +```text +pytest : The term 'pytest' is not recognized ... +py -m pytest -q +.... [100%] +4 passed in 0.37s +``` + +**Explanation:** `pytest.exe` was installed into Python Scripts directory not included in PATH. 
Running `py -m pytest` executes pytest as a module and works reliably on Windows. + +--- + +### 2.2 Linting evidence (ruff) + +After installing `ruff` to dev requirements: +```text +py -m pip install -r requirements-dev.txt +Successfully installed ruff-0.9.6 +``` + +Lint run (correct working directory): +```text +py -m ruff check . +All checks passed! +``` + +Note: The earlier error: +```text +py -m ruff check app_python +app_python:1:1: E902 ... file not found +``` +happened because the command was run inside the `app_python/` directory; there is no nested `app_python/app_python` path. Fix was to lint `.`. + +--- + +### 2.3 CI workflow success evidence +GitHub Actions page shows successful runs on `lab03` (green check). +Badge is green for `lab03` branch. + +Workflow URL (Actions): +- `https://github.com/Cdeth567/DevOps-Core-Course/actions/workflows/python-ci.yml` + +Status badge in `app_python/README.md`: +```markdown +[![Python CI (tests + docker)](https://github.com/Cdeth567/DevOps-Core-Course/actions/workflows/python-ci.yml/badge.svg?branch=lab03)](https://github.com/Cdeth567/DevOps-Core-Course/actions/workflows/python-ci.yml) +``` + +--- + +### 2.4 Docker Hub evidence +Docker Hub repository: +- `https://hub.docker.com/r/cdeth567/devops-info-service` + +CI pushes images with two tags: +- daily CalVer tag (e.g., `2026.02.11` format) +- `latest` + +--- + +## 3. 
Best Practices Implemented (CI + Security) + +### 3.1 Dependency caching (pip) +Implemented using `actions/setup-python@v5` built-in caching: +```yaml +with: + cache: "pip" + cache-dependency-path: | + app_python/requirements.txt + app_python/requirements-dev.txt +``` + +Why it matters: +- Cache hits skip downloading packages again +- Faster workflows on repeated runs (especially after first successful run) + +How to measure: +- Compare “Install dependencies” step time on first run vs next run +- GitHub Actions logs will show whether cache was restored + +--- + +### 3.2 Matrix builds (multiple Python versions) +Tests run on **Python 3.12 and 3.13** via matrix: +```yaml +matrix: + python-version: ["3.12", "3.13"] +``` + +Why it matters: +- Detects version-specific problems early (compatibility across supported versions) +- Good practice for production Python services + +--- + +### 3.3 Fail-fast in matrix +Enabled: +```yaml +fail-fast: true +``` + +Why it matters: +- Stops wasting CI minutes once a matrix job fails +- Speeds feedback loop (you see failure sooner) + +--- + +### 3.4 Concurrency control +Implemented: +```yaml +concurrency: + group: python-ci-${{ github.ref }} + cancel-in-progress: true +``` + +Why it matters: +- If you push many commits quickly, old runs are canceled +- Avoids queue buildup and wasted CI time + +--- + +### 3.5 Conditional Docker push (protect secrets + reduce risk) +Docker build/push runs only on **push** to `master` or `lab03`: +```yaml +if: github.event_name == 'push' && (github.ref == 'refs/heads/master' || github.ref == 'refs/heads/lab03') +``` + +Why it matters: +- Prevents Docker pushes from PRs (especially forks) +- Helps avoid leaking secrets in untrusted contexts +- Standard CI/CD safety practice + +--- + +### 3.6 Snyk security scanning +Implemented using **Snyk CLI** in the runner environment: +```yaml +- name: Install Snyk CLI + run: npm install -g snyk + +- name: Snyk scan (dependencies) + continue-on-error: true + env: + 
SNYK_TOKEN: ${{ secrets.SNYK_TOKEN }} + run: | + cd app_python + snyk test --severity-threshold=high --file=requirements.txt +``` + +Why it matters: +- Detects known vulnerable dependencies early in pipeline +- Gives visibility into supply-chain security risks + +Decision: +- `continue-on-error: true` used so CI doesn’t fully block while still reporting vulnerabilities (appropriate for a lab; in production you might fail builds on high/critical). + +--- + +## 4. Key Decisions + +### 4.1 Versioning strategy +**CalVer** used for Docker images (daily tags). +Rationale: simple automation, no manual release tagging required. + +### 4.2 Docker tags produced +- `/devops-info-service:` +- `/devops-info-service:latest` + +### 4.3 Workflow triggers +- Push/PR triggers with **path filters** ensure workflow runs only for Python app + workflow changes. + +### 4.4 Test coverage +- Endpoints `/` and `/health` are tested via Flask test client (no need to start a real server in CI). +- Coverage tool (pytest-cov) was **not added** in this submission (bonus task), but tests provide functional coverage for both endpoints. + +--- + +## 5. Challenges & Fixes + +### 5.1 `pytest` not recognized on Windows +**Problem:** `pytest` command not found because Python Scripts directory isn’t in PATH. +**Fix:** Use `py -m pytest` which runs pytest as a module. + +### 5.2 `ruff` not recognized / wrong path +**Problem 1:** `ruff` not found → it wasn’t installed yet. +**Fix:** Added `ruff==0.9.6` to `requirements-dev.txt`. + +**Problem 2:** `ruff check app_python` from inside `app_python/` caused file-not-found. +**Fix:** Run `py -m ruff check .` from the `app_python/` directory. + +### 5.3 `.github/workflows` location mistake +Initially workflow file was placed under `app_python/.github/workflows/`, which GitHub Actions does **not** detect. +Fix: moved workflow to repo root: `.github/workflows/python-ci.yml`. + +### 5.4 Snyk scanning issues +There were failures while adjusting working directories. 
+Final solution: run Snyk CLI and `cd app_python` before scanning requirements. + +--- + +## 6. Files Changed / Added (Summary) + +- `.github/workflows/python-ci.yml` — CI workflow (tests + lint + docker push + Snyk) +- `app_python/tests/test_app.py` — pytest unit tests +- `app_python/requirements-dev.txt` — dev dependencies (`pytest`, `ruff`) +- `app_python/README.md` — added CI status badge + testing instructions +- `app_python/docs/LAB03.md` — this documentation + +--- + +## Appendix — Workflow (reference) +Key jobs: +- `test-and-lint` (matrix: 3.12 + 3.13): install deps, ruff lint, pytest, Snyk scan +- `docker-build-and-push`: build + push to Docker Hub with CalVer + latest diff --git a/app_python/docs/LAB04.md b/app_python/docs/LAB04.md index 31c1430dc7..f26309837e 100644 --- a/app_python/docs/LAB04.md +++ b/app_python/docs/LAB04.md @@ -1,213 +1,213 @@ -# LAB04 — Infrastructure as Code (Terraform & Pulumi) - -> Course: DevOps Core Course — Lab 4 -> Topic: Infrastructure as Code (Terraform + Pulumi) -> Cloud provider: **Yandex Cloud** -> Date: 2026-02-19 - ---- - -## 1. Cloud Provider & Infrastructure - -### Cloud provider chosen and rationale -I used **Yandex Cloud** because it is accessible from Russia and provides a free-tier friendly VM configuration that matches the lab requirements (small VM + simple networking and firewall rules). - -### Region / Zone -- Zone: `ru-central1-a` - -### Instance size (free-tier friendly) -- Platform: `standard-v2` -- vCPU: `2` with `core_fraction = 20` -- RAM: `1 GB` -- Boot disk: `10 GB` (`network-hdd`) - -### Estimated cost -- Expected cost: **$0** (free-tier / minimal resources) - -### Resources created -Using IaC, the following resources are provisioned: -- VPC network -- Subnet -- Security group with rules: - - SSH 22 — only from my IP (`95.111.204.70/32`) - - HTTP 80 — open to `0.0.0.0/0` - - App port 5000 — open to `0.0.0.0/0` -- Compute instance (VM) with NAT public IP - ---- - -## 2. 
Terraform Implementation - -### Terraform version -```text - -``` - -### Project structure -``` -terraform/ -├── main.tf -├── variables.tf -├── outputs.tf -├── versions.tf -├── terraform.tfvars (gitignored) -└── .gitignore -``` - -### Authentication (Yandex Cloud) -Authentication is done via **Service Account authorized key (JSON)**. - -- Service account key file (local path, not committed): - - `C:/Users/11kvv/.yc/lab04-sa-key.json` - -> Important: credential files (`*.json`) and state are excluded from Git. - -### Key configuration decisions -- **SSH access restricted** to my public IP only: `95.111.204.70/32` -- Public ports required by lab (80 and 5000) are open to the internet. -- Outputs exported: - - VM public IP - - SSH command string - -### Challenges encountered & fixes -1) **Provider authentication missing** -- Error: `one of 'token' or 'service_account_key_file' should be specified` -- Fix: generated service account key and configured `service_account_key_file`. - -2) **PermissionDenied when creating security group ingress** -- Error: `Permission denied to add ingress rule to security group` -- Fix: updated IAM roles for the service account (VPC permissions) and re-ran `terraform apply`. - -### Terminal output (sanitized) - -#### `terraform init` -```text -Initializing the backend... -Initializing provider plugins... -- Using previously-installed yandex-cloud/yandex v0.187.0 - -Terraform has been successfully initialized! -``` - -#### `terraform plan` (excerpt) -```text -Plan: 2 to add, 0 to change, 0 to destroy. - -Changes to Outputs: - + public_ip = (known after apply) - + ssh_command = (known after apply) -``` - -> Note: I also saw a warning: “Cannot connect to YC tool initialization service...”. This warning did not block plan generation. 
- -#### `terraform apply` (result) -```text - -``` - -### Outputs -```text -Public IP: -SSH command (from output): - -``` - -### SSH proof -```text - -``` - -Example command (Windows): -```powershell -ssh -i C:\Users\11kvv\.ssh\lab04_ed25519 ubuntu@ -``` - ---- - -## 3. Pulumi Implementation - -### Pulumi version and language -- Language: **Python** -```text - -``` - -### Cleanup of Terraform resources -Before provisioning the same infrastructure with Pulumi, Terraform resources were destroyed: - -```text - -``` - -### Pulumi project structure -``` -pulumi/ -├── __main__.py -├── requirements.txt -├── Pulumi.yaml -└── Pulumi..yaml (gitignored if contains secrets) -``` - -### Planned changes (`pulumi preview`) -```text - -``` - -### Apply (`pulumi up`) -```text - -``` - -### Outputs and SSH proof -```text -Pulumi public IP: -SSH proof: - -``` - ---- - -## 4. Terraform vs Pulumi Comparison - -### Ease of Learning -Terraform was easier to start with because HCL is concise and the workflow is very straightforward (`init → plan → apply`). Pulumi required a bit more setup (runtime, deps) and code structure, but felt natural once configured. - -### Code Readability -Terraform is very readable for simple infra because it is declarative and compact. Pulumi is more verbose but benefits from real language features (variables, functions, reuse) which can help as the project grows. - -### Debugging -Terraform errors are often direct and tied to a specific resource block. In Pulumi, errors can appear deeper in the program flow, but the ability to print/debug in code can help. - -### Documentation -Terraform has a large ecosystem and many examples. Pulumi documentation is also strong, especially when you already know the language SDK, but examples for some providers may be fewer. - -### Use Case -- Terraform: best for standard, repeatable infra with a simple declarative model, especially in teams. 
-- Pulumi: best when infrastructure needs non-trivial logic/reuse and you want to leverage full programming languages and testing. - ---- - -## 5. Lab 5 Preparation & Cleanup - -### VM for Lab 5 -- Keeping a VM for Lab 5 (Ansible): **** -- If YES: Which one: **Terraform / Pulumi** -- Reason: - - - -### Cleanup status -- Terraform resources destroyed: **** -- Pulumi resources destroyed: **** -- Proof (outputs/log excerpts): -```text - -``` - ---- - -## Appendix — Security & Git hygiene - -- `terraform.tfstate` and `terraform.tfvars` are not committed. -- Service account key `*.json` is not committed. -- SSH private key is not committed. -- `.gitignore` contains patterns for state and secrets. +# LAB04 — Infrastructure as Code (Terraform & Pulumi) + +> Course: DevOps Core Course — Lab 4 +> Topic: Infrastructure as Code (Terraform + Pulumi) +> Cloud provider: **Yandex Cloud** +> Date: 2026-02-19 + +--- + +## 1. Cloud Provider & Infrastructure + +### Cloud provider chosen and rationale +I used **Yandex Cloud** because it is accessible from Russia and provides a free-tier friendly VM configuration that matches the lab requirements (small VM + simple networking and firewall rules). + +### Region / Zone +- Zone: `ru-central1-a` + +### Instance size (free-tier friendly) +- Platform: `standard-v2` +- vCPU: `2` with `core_fraction = 20` +- RAM: `1 GB` +- Boot disk: `10 GB` (`network-hdd`) + +### Estimated cost +- Expected cost: **$0** (free-tier / minimal resources) + +### Resources created +Using IaC, the following resources are provisioned: +- VPC network +- Subnet +- Security group with rules: + - SSH 22 — only from my IP (`95.111.204.70/32`) + - HTTP 80 — open to `0.0.0.0/0` + - App port 5000 — open to `0.0.0.0/0` +- Compute instance (VM) with NAT public IP + +--- + +## 2. 
Terraform Implementation + +### Terraform version +```text + +``` + +### Project structure +``` +terraform/ +├── main.tf +├── variables.tf +├── outputs.tf +├── versions.tf +├── terraform.tfvars (gitignored) +└── .gitignore +``` + +### Authentication (Yandex Cloud) +Authentication is done via **Service Account authorized key (JSON)**. + +- Service account key file (local path, not committed): + - `C:/Users/11kvv/.yc/lab04-sa-key.json` + +> Important: credential files (`*.json`) and state are excluded from Git. + +### Key configuration decisions +- **SSH access restricted** to my public IP only: `95.111.204.70/32` +- Public ports required by lab (80 and 5000) are open to the internet. +- Outputs exported: + - VM public IP + - SSH command string + +### Challenges encountered & fixes +1) **Provider authentication missing** +- Error: `one of 'token' or 'service_account_key_file' should be specified` +- Fix: generated service account key and configured `service_account_key_file`. + +2) **PermissionDenied when creating security group ingress** +- Error: `Permission denied to add ingress rule to security group` +- Fix: updated IAM roles for the service account (VPC permissions) and re-ran `terraform apply`. + +### Terminal output (sanitized) + +#### `terraform init` +```text +Initializing the backend... +Initializing provider plugins... +- Using previously-installed yandex-cloud/yandex v0.187.0 + +Terraform has been successfully initialized! +``` + +#### `terraform plan` (excerpt) +```text +Plan: 2 to add, 0 to change, 0 to destroy. + +Changes to Outputs: + + public_ip = (known after apply) + + ssh_command = (known after apply) +``` + +> Note: I also saw a warning: “Cannot connect to YC tool initialization service...”. This warning did not block plan generation. 
+ +#### `terraform apply` (result) +```text + +``` + +### Outputs +```text +Public IP: +SSH command (from output): + +``` + +### SSH proof +```text + +``` + +Example command (Windows): +```powershell +ssh -i C:\Users\11kvv\.ssh\lab04_ed25519 ubuntu@ +``` + +--- + +## 3. Pulumi Implementation + +### Pulumi version and language +- Language: **Python** +```text + +``` + +### Cleanup of Terraform resources +Before provisioning the same infrastructure with Pulumi, Terraform resources were destroyed: + +```text + +``` + +### Pulumi project structure +``` +pulumi/ +├── __main__.py +├── requirements.txt +├── Pulumi.yaml +└── Pulumi..yaml (gitignored if contains secrets) +``` + +### Planned changes (`pulumi preview`) +```text + +``` + +### Apply (`pulumi up`) +```text + +``` + +### Outputs and SSH proof +```text +Pulumi public IP: +SSH proof: + +``` + +--- + +## 4. Terraform vs Pulumi Comparison + +### Ease of Learning +Terraform was easier to start with because HCL is concise and the workflow is very straightforward (`init → plan → apply`). Pulumi required a bit more setup (runtime, deps) and code structure, but felt natural once configured. + +### Code Readability +Terraform is very readable for simple infra because it is declarative and compact. Pulumi is more verbose but benefits from real language features (variables, functions, reuse) which can help as the project grows. + +### Debugging +Terraform errors are often direct and tied to a specific resource block. In Pulumi, errors can appear deeper in the program flow, but the ability to print/debug in code can help. + +### Documentation +Terraform has a large ecosystem and many examples. Pulumi documentation is also strong, especially when you already know the language SDK, but examples for some providers may be fewer. + +### Use Case +- Terraform: best for standard, repeatable infra with a simple declarative model, especially in teams. 
+- Pulumi: best when infrastructure needs non-trivial logic/reuse and you want to leverage full programming languages and testing. + +--- + +## 5. Lab 5 Preparation & Cleanup + +### VM for Lab 5 +- Keeping a VM for Lab 5 (Ansible): **** +- If YES: Which one: **Terraform / Pulumi** +- Reason: + - + +### Cleanup status +- Terraform resources destroyed: **** +- Pulumi resources destroyed: **** +- Proof (outputs/log excerpts): +```text + +``` + +--- + +## Appendix — Security & Git hygiene + +- `terraform.tfstate` and `terraform.tfvars` are not committed. +- Service account key `*.json` is not committed. +- SSH private key is not committed. +- `.gitignore` contains patterns for state and secrets. diff --git a/app_python/requirements-dev.txt b/app_python/requirements-dev.txt index 148a627bdb..ae15f82f5f 100644 --- a/app_python/requirements-dev.txt +++ b/app_python/requirements-dev.txt @@ -1,2 +1,2 @@ -pytest==8.3.4 +pytest==8.3.4 ruff==0.9.6 \ No newline at end of file diff --git a/app_python/tests/test_app.py b/app_python/tests/test_app.py index 1cfc6be361..b032c06e50 100644 --- a/app_python/tests/test_app.py +++ b/app_python/tests/test_app.py @@ -1,62 +1,62 @@ -import pytest -from app import app as flask_app - - -@pytest.fixture() -def client(): - flask_app.config["TESTING"] = True - with flask_app.test_client() as client: - yield client - - -def test_root_endpoint_returns_200_and_json(client): - resp = client.get("/", headers={"User-Agent": "pytest"}) - assert resp.status_code == 200 - data = resp.get_json() - assert isinstance(data, dict) - - # top-level keys - for key in ["service", "system", "runtime", "request", "endpoints"]: - assert key in data - - # service structure - assert data["service"]["name"] == "devops-info-service" - assert data["service"]["framework"] == "Flask" - - # system structure - for key in ["hostname", "platform", "architecture", "cpu_count", "python_version"]: - assert key in data["system"] - - # runtime - assert "uptime_seconds" in 
data["runtime"] - assert isinstance(data["runtime"]["uptime_seconds"], int) - - # endpoints list - assert isinstance(data["endpoints"], list) - assert any(e["path"] == "/" for e in data["endpoints"]) - assert any(e["path"] == "/health" for e in data["endpoints"]) - - -def test_health_endpoint_returns_200_and_expected_fields(client): - resp = client.get("/health") - assert resp.status_code == 200 - data = resp.get_json() - - assert data["status"] == "healthy" - assert "timestamp" in data - assert "uptime_seconds" in data - assert isinstance(data["uptime_seconds"], int) - - -def test_unknown_endpoint_returns_404_json(client): - resp = client.get("/no-such-endpoint") - assert resp.status_code == 404 - data = resp.get_json() - - assert data["error"] == "Not Found" - assert "message" in data - - -def test_method_not_allowed_returns_405(client): - resp = client.post("/health") - assert resp.status_code == 405 +import pytest +from app import app as flask_app + + +@pytest.fixture() +def client(): + flask_app.config["TESTING"] = True + with flask_app.test_client() as client: + yield client + + +def test_root_endpoint_returns_200_and_json(client): + resp = client.get("/", headers={"User-Agent": "pytest"}) + assert resp.status_code == 200 + data = resp.get_json() + assert isinstance(data, dict) + + # top-level keys + for key in ["service", "system", "runtime", "request", "endpoints"]: + assert key in data + + # service structure + assert data["service"]["name"] == "devops-info-service" + assert data["service"]["framework"] == "Flask" + + # system structure + for key in ["hostname", "platform", "architecture", "cpu_count", "python_version"]: + assert key in data["system"] + + # runtime + assert "uptime_seconds" in data["runtime"] + assert isinstance(data["runtime"]["uptime_seconds"], int) + + # endpoints list + assert isinstance(data["endpoints"], list) + assert any(e["path"] == "/" for e in data["endpoints"]) + assert any(e["path"] == "/health" for e in data["endpoints"]) + + 
+def test_health_endpoint_returns_200_and_expected_fields(client): + resp = client.get("/health") + assert resp.status_code == 200 + data = resp.get_json() + + assert data["status"] == "healthy" + assert "timestamp" in data + assert "uptime_seconds" in data + assert isinstance(data["uptime_seconds"], int) + + +def test_unknown_endpoint_returns_404_json(client): + resp = client.get("/no-such-endpoint") + assert resp.status_code == 404 + data = resp.get_json() + + assert data["error"] == "Not Found" + assert "message" in data + + +def test_method_not_allowed_returns_405(client): + resp = client.post("/health") + assert resp.status_code == 405 diff --git a/labs/lab01.md b/labs/lab01.md index 18c9ff6c43..12d81fcb76 100644 --- a/labs/lab01.md +++ b/labs/lab01.md @@ -1,693 +1,693 @@ -# Lab 1 — DevOps Info Service: Web Application Development - -![difficulty](https://img.shields.io/badge/difficulty-beginner-success) -![topic](https://img.shields.io/badge/topic-Web%20Development-blue) -![points](https://img.shields.io/badge/points-10%2B2.5-orange) -![languages](https://img.shields.io/badge/languages-Python%20|%20Go-informational) - -> Build a DevOps info service that reports system information and health status. This service will evolve throughout the course into a comprehensive monitoring tool. - -## Overview - -Create a **DevOps Info Service** - a web application providing detailed information about itself and its runtime environment. This foundation will grow throughout the course as you add containerization, CI/CD, monitoring, and persistence. - -**What You'll Learn:** -- Web framework selection and implementation -- System introspection and API design -- Python best practices and documentation -- Foundation for future DevOps tooling - -**Tech Stack:** Python 3.11+ | Flask 3.1 or FastAPI 0.115 - ---- - -## Tasks - -### Task 1 — Python Web Application (6 pts) - -Build a production-ready Python web service with comprehensive system information. 
- -#### 1.1 Project Structure - -Create this structure: - -``` -app_python/ -├── app.py # Main application -├── requirements.txt # Dependencies -├── .gitignore # Git ignore -├── README.md # App documentation -├── tests/ # Unit tests (Lab 3) -│ └── __init__.py -└── docs/ # Lab documentation - ├── LAB01.md # Your lab submission - └── screenshots/ # Proof of work - ├── 01-main-endpoint.png - ├── 02-health-check.png - └── 03-formatted-output.png -``` - -#### 1.2 Choose Web Framework - -Select and justify your choice: -- **Flask** - Lightweight, easy to learn -- **FastAPI** - Modern, async, auto-documentation -- **Django** - Full-featured, includes ORM - -Document your decision in `app_python/docs/LAB01.md`. - -#### 1.3 Implement Main Endpoint: `GET /` - -Return comprehensive service and system information: - -```json -{ - "service": { - "name": "devops-info-service", - "version": "1.0.0", - "description": "DevOps course info service", - "framework": "Flask" - }, - "system": { - "hostname": "my-laptop", - "platform": "Linux", - "platform_version": "Ubuntu 24.04", - "architecture": "x86_64", - "cpu_count": 8, - "python_version": "3.13.1" - }, - "runtime": { - "uptime_seconds": 3600, - "uptime_human": "1 hour, 0 minutes", - "current_time": "2026-01-07T14:30:00.000Z", - "timezone": "UTC" - }, - "request": { - "client_ip": "127.0.0.1", - "user_agent": "curl/7.81.0", - "method": "GET", - "path": "/" - }, - "endpoints": [ - {"path": "/", "method": "GET", "description": "Service information"}, - {"path": "/health", "method": "GET", "description": "Health check"} - ] -} -``` - -
-💡 Implementation Hints - -**Get System Information:** -```python -import platform -import socket -from datetime import datetime - -hostname = socket.gethostname() -platform_name = platform.system() -architecture = platform.machine() -python_version = platform.python_version() -``` - -**Calculate Uptime:** -```python -start_time = datetime.now() - -def get_uptime(): - delta = datetime.now() - start_time - seconds = int(delta.total_seconds()) - hours = seconds // 3600 - minutes = (seconds % 3600) // 60 - return { - 'seconds': seconds, - 'human': f"{hours} hours, {minutes} minutes" - } -``` - -**Request Information:** -```python -# Flask -request.remote_addr # Client IP -request.headers.get('User-Agent') # User agent -request.method # HTTP method -request.path # Request path - -# FastAPI -request.client.host -request.headers.get('user-agent') -request.method -request.url.path -``` - -
- -#### 1.4 Implement Health Check: `GET /health` - -Simple health endpoint for monitoring: - -```json -{ - "status": "healthy", - "timestamp": "2024-01-15T14:30:00.000Z", - "uptime_seconds": 3600 -} -``` - -Return HTTP 200 for healthy status. This will be used for Kubernetes probes in Lab 9. - -
-💡 Implementation Hints - -```python -# Flask -@app.route('/health') -def health(): - return jsonify({ - 'status': 'healthy', - 'timestamp': datetime.now(timezone.utc).isoformat(), - 'uptime_seconds': get_uptime()['seconds'] - }) - -# FastAPI -@app.get("/health") -def health(): - return { - 'status': 'healthy', - 'timestamp': datetime.now(timezone.utc).isoformat(), - 'uptime_seconds': get_uptime()['seconds'] - } -``` - -
- -#### 1.5 Configuration - -Make your app configurable via environment variables: - -```python -import os - -HOST = os.getenv('HOST', '0.0.0.0') -PORT = int(os.getenv('PORT', 5000)) -DEBUG = os.getenv('DEBUG', 'False').lower() == 'true' -``` - -**Test:** -```bash -python app.py # Default: 0.0.0.0:5000 -PORT=8080 python app.py # Custom port -HOST=127.0.0.1 PORT=3000 python app.py -``` - ---- - -### Task 2 — Documentation & Best Practices (4 pts) - -#### 2.1 Application README (`app_python/README.md`) - -Create user-facing documentation: - -**Required Sections:** -1. **Overview** - What the service does -2. **Prerequisites** - Python version, dependencies -3. **Installation** - ```bash - python -m venv venv - source venv/bin/activate - pip install -r requirements.txt - ``` -4. **Running the Application** - ```bash - python app.py - # Or with custom config - PORT=8080 python app.py - ``` -5. **API Endpoints** - - `GET /` - Service and system information - - `GET /health` - Health check -6. **Configuration** - Environment variables table - -#### 2.2 Best Practices - -Implement these in your code: - -**1. Clean Code Organization** -- Clear function names -- Proper imports grouping -- Comments only where needed -- Follow PEP 8 - -
-💡 Example Structure - -```python -""" -DevOps Info Service -Main application module -""" -import os -import socket -import platform -from datetime import datetime, timezone -from flask import Flask, jsonify, request - -app = Flask(__name__) - -# Configuration -HOST = os.getenv('HOST', '0.0.0.0') -PORT = int(os.getenv('PORT', 5000)) - -# Application start time -START_TIME = datetime.now(timezone.utc) - -def get_system_info(): - """Collect system information.""" - return { - 'hostname': socket.gethostname(), - 'platform': platform.system(), - 'architecture': platform.machine(), - 'python_version': platform.python_version() - } - -@app.route('/') -def index(): - """Main endpoint - service and system information.""" - # Implementation -``` - -
- -**2. Error Handling** - -
-💡 Implementation - -```python -@app.errorhandler(404) -def not_found(error): - return jsonify({ - 'error': 'Not Found', - 'message': 'Endpoint does not exist' - }), 404 - -@app.errorhandler(500) -def internal_error(error): - return jsonify({ - 'error': 'Internal Server Error', - 'message': 'An unexpected error occurred' - }), 500 -``` - -
- -**3. Logging** - -
-💡 Implementation - -```python -import logging - -logging.basicConfig( - level=logging.INFO, - format='%(asctime)s - %(name)s - %(levelname)s - %(message)s' -) -logger = logging.getLogger(__name__) - -logger.info('Application starting...') -logger.debug(f'Request: {request.method} {request.path}') -``` - -
- -**4. Dependencies (`requirements.txt`)** - -```txt -# Web Framework -Flask==3.1.0 -# or -fastapi==0.115.0 -uvicorn[standard]==0.32.0 # Includes performance extras -``` - -Pin exact versions for reproducibility. - -**5. Git Ignore (`.gitignore`)** - -```gitignore -# Python -__pycache__/ -*.py[cod] -venv/ -*.log - -# IDE -.vscode/ -.idea/ - -# OS -.DS_Store -``` - -#### 2.3 Lab Submission (`app_python/docs/LAB01.md`) - -Document your implementation: - -**Required Sections:** -1. **Framework Selection** - - Your choice and why - - Comparison table with alternatives -2. **Best Practices Applied** - - List practices with code examples - - Explain importance of each -3. **API Documentation** - - Request/response examples - - Testing commands -4. **Testing Evidence** - - Screenshots showing endpoints work - - Terminal output -5. **Challenges & Solutions** - - Problems encountered - - How you solved them - -**Required Screenshots:** -- Main endpoint showing complete JSON -- Health check response -- Formatted/pretty-printed output - -#### 2.4 GitHub Community Engagement - -**Objective:** Explore GitHub's social features that support collaboration and discovery. - -**Actions Required:** -1. **Star** the course repository -2. **Star** the [simple-container-com/api](https://github.com/simple-container-com/api) project — a promising open-source tool for container management -3. **Follow** your professor and TAs on GitHub: - - Professor: [@Cre-eD](https://github.com/Cre-eD) - - TA: [@marat-biriushev](https://github.com/marat-biriushev) - - TA: [@pierrepicaud](https://github.com/pierrepicaud) -4. **Follow** at least 3 classmates from the course - -**Document in LAB01.md:** - -Add a "GitHub Community" section (after Challenges & Solutions) with 1-2 sentences explaining: -- Why starring repositories matters in open source -- How following developers helps in team projects and professional growth - -
-💡 GitHub Social Features - -**Why Stars Matter:** - -**Discovery & Bookmarking:** -- Stars help you bookmark interesting projects for later reference -- Star count indicates project popularity and community trust -- Starred repos appear in your GitHub profile, showing your interests - -**Open Source Signal:** -- Stars encourage maintainers (shows appreciation) -- High star count attracts more contributors -- Helps projects gain visibility in GitHub search and recommendations - -**Professional Context:** -- Shows you follow best practices and quality projects -- Indicates awareness of industry tools and trends - -**Why Following Matters:** - -**Networking:** -- See what other developers are working on -- Discover new projects through their activity -- Build professional connections beyond the classroom - -**Learning:** -- Learn from others' code and commits -- See how experienced developers solve problems -- Get inspiration for your own projects - -**Collaboration:** -- Stay updated on classmates' work -- Easier to find team members for future projects -- Build a supportive learning community - -**Career Growth:** -- Follow thought leaders in your technology stack -- See trending projects in real-time -- Build visibility in the developer community - -**GitHub Best Practices:** -- Star repos you find useful (not spam) -- Follow developers whose work interests you -- Engage meaningfully with the community -- Your GitHub activity shows employers your interests and involvement - -
- ---- - -## Bonus Task — Compiled Language (2.5 pts) - -Implement the same service in a compiled language to prepare for multi-stage Docker builds (Lab 2). - -**Choose One:** -- **Go** (Recommended) - Small binaries, fast compilation -- **Rust** - Memory safety, modern features -- **Java/Spring Boot** - Enterprise standard -- **C#/ASP.NET Core** - Cross-platform .NET - -**Structure:** - -``` -app_go/ (or app_rust, app_java, etc.) -├── main.go -├── go.mod -├── README.md -└── docs/ - ├── LAB01.md # Implementation details - ├── GO.md # Language justification - └── screenshots/ -``` - -**Requirements:** -- Same two endpoints: `/` and `/health` -- Same JSON structure -- Document build process -- Compare binary size to Python - -
-💡 Go Example Skeleton - -```go -package main - -import ( - "encoding/json" - "net/http" - "os" - "runtime" - "time" -) - -type ServiceInfo struct { - Service Service `json:"service"` - System System `json:"system"` - Runtime Runtime `json:"runtime"` - Request Request `json:"request"` -} - -var startTime = time.Now() - -func mainHandler(w http.ResponseWriter, r *http.Request) { - info := ServiceInfo{ - Service: Service{ - Name: "devops-info-service", - Version: "1.0.0", - }, - System: System{ - Platform: runtime.GOOS, - Architecture: runtime.GOARCH, - CPUCount: runtime.NumCPU(), - }, - // ... implement rest - } - - w.Header().Set("Content-Type", "application/json") - json.NewEncoder(w).Encode(info) -} - -func main() { - http.HandleFunc("/", mainHandler) - http.HandleFunc("/health", healthHandler) - - port := os.Getenv("PORT") - if port == "" { - port = "8080" - } - - http.ListenAndServe(":"+port, nil) -} -``` - -
- ---- - -## How to Submit - -1. **Create Branch:** - ```bash - git checkout -b lab01 - ``` - -2. **Commit Work:** - ```bash - git add app_python/ - git commit -m "feat: implement lab01 devops info service" - git push -u origin lab01 - ``` - -3. **Create Pull Requests:** - - **PR #1:** `your-fork:lab01` → `course-repo:master` - - **PR #2:** `your-fork:lab01` → `your-fork:master` - -4. **Verify:** - - All files present - - Screenshots included - - Documentation complete - ---- - -## Acceptance Criteria - -### Main Tasks (10 points) - -**Application Functionality (3 pts):** -- [ ] Service runs without errors -- [ ] `GET /` returns all required fields: - - [ ] Service metadata (name, version, description, framework) - - [ ] System info (hostname, platform, architecture, CPU, Python version) - - [ ] Runtime info (uptime, current time, timezone) - - [ ] Request info (client IP, user agent, method, path) - - [ ] Endpoints list -- [ ] `GET /health` returns status and uptime -- [ ] Configurable via environment variables (PORT, HOST) - -**Code Quality (2 pts):** -- [ ] Clean code structure -- [ ] PEP 8 compliant -- [ ] Error handling implemented -- [ ] Logging configured - -**Documentation (3 pts):** -- [ ] `app_python/README.md` complete with all sections -- [ ] `app_python/docs/LAB01.md` includes: - - [ ] Framework justification - - [ ] Best practices documentation - - [ ] API examples - - [ ] Testing evidence - - [ ] Challenges solved - - [ ] GitHub Community section (why stars/follows matter) -- [ ] All 3 required screenshots present -- [ ] Course repository starred -- [ ] simple-container-com/api repository starred -- [ ] Professor and TAs followed on GitHub -- [ ] At least 3 classmates followed on GitHub - -**Configuration (2 pts):** -- [ ] `requirements.txt` with pinned versions -- [ ] `.gitignore` properly configured -- [ ] Environment variables working - -### Bonus Task (2.5 points) - -- [ ] Compiled language app implements both endpoints -- [ ] Same JSON structure 
as Python version -- [ ] `app_/README.md` with build/run instructions -- [ ] `app_/docs/GO.md` with language justification -- [ ] `app_/docs/LAB01.md` with implementation details -- [ ] Screenshots showing compilation and execution - ---- - -## Rubric - -| Criteria | Points | Description | -|----------|--------|-------------| -| **Functionality** | 3 pts | Both endpoints work with complete, correct data | -| **Code Quality** | 2 pts | Clean, organized, follows Python standards | -| **Documentation** | 3 pts | Complete README and lab submission docs | -| **Configuration** | 2 pts | Dependencies, environment vars, .gitignore | -| **Bonus** | 2.5 pts | Compiled language implementation | -| **Total** | 12.5 pts | 10 pts required + 2.5 pts bonus | - -**Grading Scale:** -- **10/10:** Perfect implementation, excellent documentation -- **8-9/10:** All works, good docs, minor improvements possible -- **6-7/10:** Core functionality present, basic documentation -- **<6/10:** Missing features or documentation, needs revision - ---- - -## Resources - -
-📚 Python Web Frameworks - -- [Flask 3.1 Documentation](https://flask.palletsprojects.com/en/latest/) -- [Flask Quickstart](https://flask.palletsprojects.com/en/latest/quickstart/) -- [FastAPI Documentation](https://fastapi.tiangolo.com/) -- [FastAPI Tutorial](https://fastapi.tiangolo.com/tutorial/first-steps/) -- [Django 5.1 Documentation](https://docs.djangoproject.com/en/5.1/) - -
- -
-🐍 Python Best Practices - -- [PEP 8 Style Guide](https://pep8.org/) -- [Python Logging Tutorial](https://docs.python.org/3/howto/logging.html) -- [Python platform module](https://docs.python.org/3/library/platform.html) -- [Python socket module](https://docs.python.org/3/library/socket.html) - -
- -
-🔧 Compiled Languages (Bonus) - -- [Go Web Development](https://golang.org/doc/articles/wiki/) -- [Go net/http Package](https://pkg.go.dev/net/http) -- [Rust Web Frameworks](https://www.arewewebyet.org/) -- [Spring Boot Quickstart](https://spring.io/quickstart) -- [ASP.NET Core Tutorial](https://docs.microsoft.com/aspnet/core/) - -
- -
-🛠️ Development Tools - -- [Postman](https://www.postman.com/) - API testing -- [HTTPie](https://httpie.io/) - Command-line HTTP client -- [curl](https://curl.se/) - Data transfer tool -- [jq](https://stedolan.github.io/jq/) - JSON processor - -
- ---- - -## Looking Ahead - -This service evolves throughout the course: - -- **Lab 2:** Containerize with Docker, multi-stage builds -- **Lab 3:** Add unit tests and CI/CD pipeline -- **Lab 8:** Add `/metrics` endpoint for Prometheus -- **Lab 9:** Deploy to Kubernetes using `/health` probes -- **Lab 12:** Add `/visits` endpoint with file persistence -- **Lab 13:** Multi-environment deployment with GitOps - ---- - -**Good luck!** 🚀 - -> **Remember:** Keep it simple, write clean code, and document thoroughly. This foundation will carry through all 16 labs! +# Lab 1 — DevOps Info Service: Web Application Development + +![difficulty](https://img.shields.io/badge/difficulty-beginner-success) +![topic](https://img.shields.io/badge/topic-Web%20Development-blue) +![points](https://img.shields.io/badge/points-10%2B2.5-orange) +![languages](https://img.shields.io/badge/languages-Python%20|%20Go-informational) + +> Build a DevOps info service that reports system information and health status. This service will evolve throughout the course into a comprehensive monitoring tool. + +## Overview + +Create a **DevOps Info Service** - a web application providing detailed information about itself and its runtime environment. This foundation will grow throughout the course as you add containerization, CI/CD, monitoring, and persistence. + +**What You'll Learn:** +- Web framework selection and implementation +- System introspection and API design +- Python best practices and documentation +- Foundation for future DevOps tooling + +**Tech Stack:** Python 3.11+ | Flask 3.1 or FastAPI 0.115 + +--- + +## Tasks + +### Task 1 — Python Web Application (6 pts) + +Build a production-ready Python web service with comprehensive system information. 
+ +#### 1.1 Project Structure + +Create this structure: + +``` +app_python/ +├── app.py # Main application +├── requirements.txt # Dependencies +├── .gitignore # Git ignore +├── README.md # App documentation +├── tests/ # Unit tests (Lab 3) +│ └── __init__.py +└── docs/ # Lab documentation + ├── LAB01.md # Your lab submission + └── screenshots/ # Proof of work + ├── 01-main-endpoint.png + ├── 02-health-check.png + └── 03-formatted-output.png +``` + +#### 1.2 Choose Web Framework + +Select and justify your choice: +- **Flask** - Lightweight, easy to learn +- **FastAPI** - Modern, async, auto-documentation +- **Django** - Full-featured, includes ORM + +Document your decision in `app_python/docs/LAB01.md`. + +#### 1.3 Implement Main Endpoint: `GET /` + +Return comprehensive service and system information: + +```json +{ + "service": { + "name": "devops-info-service", + "version": "1.0.0", + "description": "DevOps course info service", + "framework": "Flask" + }, + "system": { + "hostname": "my-laptop", + "platform": "Linux", + "platform_version": "Ubuntu 24.04", + "architecture": "x86_64", + "cpu_count": 8, + "python_version": "3.13.1" + }, + "runtime": { + "uptime_seconds": 3600, + "uptime_human": "1 hour, 0 minutes", + "current_time": "2026-01-07T14:30:00.000Z", + "timezone": "UTC" + }, + "request": { + "client_ip": "127.0.0.1", + "user_agent": "curl/7.81.0", + "method": "GET", + "path": "/" + }, + "endpoints": [ + {"path": "/", "method": "GET", "description": "Service information"}, + {"path": "/health", "method": "GET", "description": "Health check"} + ] +} +``` + +
+💡 Implementation Hints + +**Get System Information:** +```python +import platform +import socket +from datetime import datetime + +hostname = socket.gethostname() +platform_name = platform.system() +architecture = platform.machine() +python_version = platform.python_version() +``` + +**Calculate Uptime:** +```python +start_time = datetime.now() + +def get_uptime(): + delta = datetime.now() - start_time + seconds = int(delta.total_seconds()) + hours = seconds // 3600 + minutes = (seconds % 3600) // 60 + return { + 'seconds': seconds, + 'human': f"{hours} hours, {minutes} minutes" + } +``` + +**Request Information:** +```python +# Flask +request.remote_addr # Client IP +request.headers.get('User-Agent') # User agent +request.method # HTTP method +request.path # Request path + +# FastAPI +request.client.host +request.headers.get('user-agent') +request.method +request.url.path +``` + +
+ +#### 1.4 Implement Health Check: `GET /health` + +Simple health endpoint for monitoring: + +```json +{ + "status": "healthy", + "timestamp": "2024-01-15T14:30:00.000Z", + "uptime_seconds": 3600 +} +``` + +Return HTTP 200 for healthy status. This will be used for Kubernetes probes in Lab 9. + +
+💡 Implementation Hints + +```python +# Flask +@app.route('/health') +def health(): + return jsonify({ + 'status': 'healthy', + 'timestamp': datetime.now(timezone.utc).isoformat(), + 'uptime_seconds': get_uptime()['seconds'] + }) + +# FastAPI +@app.get("/health") +def health(): + return { + 'status': 'healthy', + 'timestamp': datetime.now(timezone.utc).isoformat(), + 'uptime_seconds': get_uptime()['seconds'] + } +``` + +
+ +#### 1.5 Configuration + +Make your app configurable via environment variables: + +```python +import os + +HOST = os.getenv('HOST', '0.0.0.0') +PORT = int(os.getenv('PORT', 5000)) +DEBUG = os.getenv('DEBUG', 'False').lower() == 'true' +``` + +**Test:** +```bash +python app.py # Default: 0.0.0.0:5000 +PORT=8080 python app.py # Custom port +HOST=127.0.0.1 PORT=3000 python app.py +``` + +--- + +### Task 2 — Documentation & Best Practices (4 pts) + +#### 2.1 Application README (`app_python/README.md`) + +Create user-facing documentation: + +**Required Sections:** +1. **Overview** - What the service does +2. **Prerequisites** - Python version, dependencies +3. **Installation** + ```bash + python -m venv venv + source venv/bin/activate + pip install -r requirements.txt + ``` +4. **Running the Application** + ```bash + python app.py + # Or with custom config + PORT=8080 python app.py + ``` +5. **API Endpoints** + - `GET /` - Service and system information + - `GET /health` - Health check +6. **Configuration** - Environment variables table + +#### 2.2 Best Practices + +Implement these in your code: + +**1. Clean Code Organization** +- Clear function names +- Proper imports grouping +- Comments only where needed +- Follow PEP 8 + +
+💡 Example Structure + +```python +""" +DevOps Info Service +Main application module +""" +import os +import socket +import platform +from datetime import datetime, timezone +from flask import Flask, jsonify, request + +app = Flask(__name__) + +# Configuration +HOST = os.getenv('HOST', '0.0.0.0') +PORT = int(os.getenv('PORT', 5000)) + +# Application start time +START_TIME = datetime.now(timezone.utc) + +def get_system_info(): + """Collect system information.""" + return { + 'hostname': socket.gethostname(), + 'platform': platform.system(), + 'architecture': platform.machine(), + 'python_version': platform.python_version() + } + +@app.route('/') +def index(): + """Main endpoint - service and system information.""" + # Implementation +``` + +
+ +**2. Error Handling** + +
+💡 Implementation + +```python +@app.errorhandler(404) +def not_found(error): + return jsonify({ + 'error': 'Not Found', + 'message': 'Endpoint does not exist' + }), 404 + +@app.errorhandler(500) +def internal_error(error): + return jsonify({ + 'error': 'Internal Server Error', + 'message': 'An unexpected error occurred' + }), 500 +``` + +
+ +**3. Logging** + +
+💡 Implementation + +```python +import logging + +logging.basicConfig( + level=logging.INFO, + format='%(asctime)s - %(name)s - %(levelname)s - %(message)s' +) +logger = logging.getLogger(__name__) + +logger.info('Application starting...') +logger.debug(f'Request: {request.method} {request.path}') +``` + +
+ +**4. Dependencies (`requirements.txt`)** + +```txt +# Web Framework +Flask==3.1.0 +# or +fastapi==0.115.0 +uvicorn[standard]==0.32.0 # Includes performance extras +``` + +Pin exact versions for reproducibility. + +**5. Git Ignore (`.gitignore`)** + +```gitignore +# Python +__pycache__/ +*.py[cod] +venv/ +*.log + +# IDE +.vscode/ +.idea/ + +# OS +.DS_Store +``` + +#### 2.3 Lab Submission (`app_python/docs/LAB01.md`) + +Document your implementation: + +**Required Sections:** +1. **Framework Selection** + - Your choice and why + - Comparison table with alternatives +2. **Best Practices Applied** + - List practices with code examples + - Explain importance of each +3. **API Documentation** + - Request/response examples + - Testing commands +4. **Testing Evidence** + - Screenshots showing endpoints work + - Terminal output +5. **Challenges & Solutions** + - Problems encountered + - How you solved them + +**Required Screenshots:** +- Main endpoint showing complete JSON +- Health check response +- Formatted/pretty-printed output + +#### 2.4 GitHub Community Engagement + +**Objective:** Explore GitHub's social features that support collaboration and discovery. + +**Actions Required:** +1. **Star** the course repository +2. **Star** the [simple-container-com/api](https://github.com/simple-container-com/api) project — a promising open-source tool for container management +3. **Follow** your professor and TAs on GitHub: + - Professor: [@Cre-eD](https://github.com/Cre-eD) + - TA: [@marat-biriushev](https://github.com/marat-biriushev) + - TA: [@pierrepicaud](https://github.com/pierrepicaud) +4. **Follow** at least 3 classmates from the course + +**Document in LAB01.md:** + +Add a "GitHub Community" section (after Challenges & Solutions) with 1-2 sentences explaining: +- Why starring repositories matters in open source +- How following developers helps in team projects and professional growth + +
+💡 GitHub Social Features + +**Why Stars Matter:** + +**Discovery & Bookmarking:** +- Stars help you bookmark interesting projects for later reference +- Star count indicates project popularity and community trust +- Starred repos appear in your GitHub profile, showing your interests + +**Open Source Signal:** +- Stars encourage maintainers (shows appreciation) +- High star count attracts more contributors +- Helps projects gain visibility in GitHub search and recommendations + +**Professional Context:** +- Shows you follow best practices and quality projects +- Indicates awareness of industry tools and trends + +**Why Following Matters:** + +**Networking:** +- See what other developers are working on +- Discover new projects through their activity +- Build professional connections beyond the classroom + +**Learning:** +- Learn from others' code and commits +- See how experienced developers solve problems +- Get inspiration for your own projects + +**Collaboration:** +- Stay updated on classmates' work +- Easier to find team members for future projects +- Build a supportive learning community + +**Career Growth:** +- Follow thought leaders in your technology stack +- See trending projects in real-time +- Build visibility in the developer community + +**GitHub Best Practices:** +- Star repos you find useful (not spam) +- Follow developers whose work interests you +- Engage meaningfully with the community +- Your GitHub activity shows employers your interests and involvement + +
+ +--- + +## Bonus Task — Compiled Language (2.5 pts) + +Implement the same service in a compiled language to prepare for multi-stage Docker builds (Lab 2). + +**Choose One:** +- **Go** (Recommended) - Small binaries, fast compilation +- **Rust** - Memory safety, modern features +- **Java/Spring Boot** - Enterprise standard +- **C#/ASP.NET Core** - Cross-platform .NET + +**Structure:** + +``` +app_go/ (or app_rust, app_java, etc.) +├── main.go +├── go.mod +├── README.md +└── docs/ + ├── LAB01.md # Implementation details + ├── GO.md # Language justification + └── screenshots/ +``` + +**Requirements:** +- Same two endpoints: `/` and `/health` +- Same JSON structure +- Document build process +- Compare binary size to Python + +
+💡 Go Example Skeleton + +```go +package main + +import ( + "encoding/json" + "net/http" + "os" + "runtime" + "time" +) + +type ServiceInfo struct { + Service Service `json:"service"` + System System `json:"system"` + Runtime Runtime `json:"runtime"` + Request Request `json:"request"` +} + +var startTime = time.Now() + +func mainHandler(w http.ResponseWriter, r *http.Request) { + info := ServiceInfo{ + Service: Service{ + Name: "devops-info-service", + Version: "1.0.0", + }, + System: System{ + Platform: runtime.GOOS, + Architecture: runtime.GOARCH, + CPUCount: runtime.NumCPU(), + }, + // ... implement rest + } + + w.Header().Set("Content-Type", "application/json") + json.NewEncoder(w).Encode(info) +} + +func main() { + http.HandleFunc("/", mainHandler) + http.HandleFunc("/health", healthHandler) + + port := os.Getenv("PORT") + if port == "" { + port = "8080" + } + + http.ListenAndServe(":"+port, nil) +} +``` + +
+ +--- + +## How to Submit + +1. **Create Branch:** + ```bash + git checkout -b lab01 + ``` + +2. **Commit Work:** + ```bash + git add app_python/ + git commit -m "feat: implement lab01 devops info service" + git push -u origin lab01 + ``` + +3. **Create Pull Requests:** + - **PR #1:** `your-fork:lab01` → `course-repo:master` + - **PR #2:** `your-fork:lab01` → `your-fork:master` + +4. **Verify:** + - All files present + - Screenshots included + - Documentation complete + +--- + +## Acceptance Criteria + +### Main Tasks (10 points) + +**Application Functionality (3 pts):** +- [ ] Service runs without errors +- [ ] `GET /` returns all required fields: + - [ ] Service metadata (name, version, description, framework) + - [ ] System info (hostname, platform, architecture, CPU, Python version) + - [ ] Runtime info (uptime, current time, timezone) + - [ ] Request info (client IP, user agent, method, path) + - [ ] Endpoints list +- [ ] `GET /health` returns status and uptime +- [ ] Configurable via environment variables (PORT, HOST) + +**Code Quality (2 pts):** +- [ ] Clean code structure +- [ ] PEP 8 compliant +- [ ] Error handling implemented +- [ ] Logging configured + +**Documentation (3 pts):** +- [ ] `app_python/README.md` complete with all sections +- [ ] `app_python/docs/LAB01.md` includes: + - [ ] Framework justification + - [ ] Best practices documentation + - [ ] API examples + - [ ] Testing evidence + - [ ] Challenges solved + - [ ] GitHub Community section (why stars/follows matter) +- [ ] All 3 required screenshots present +- [ ] Course repository starred +- [ ] simple-container-com/api repository starred +- [ ] Professor and TAs followed on GitHub +- [ ] At least 3 classmates followed on GitHub + +**Configuration (2 pts):** +- [ ] `requirements.txt` with pinned versions +- [ ] `.gitignore` properly configured +- [ ] Environment variables working + +### Bonus Task (2.5 points) + +- [ ] Compiled language app implements both endpoints +- [ ] Same JSON structure 
as Python version +- [ ] `app_/README.md` with build/run instructions +- [ ] `app_/docs/GO.md` with language justification +- [ ] `app_/docs/LAB01.md` with implementation details +- [ ] Screenshots showing compilation and execution + +--- + +## Rubric + +| Criteria | Points | Description | +|----------|--------|-------------| +| **Functionality** | 3 pts | Both endpoints work with complete, correct data | +| **Code Quality** | 2 pts | Clean, organized, follows Python standards | +| **Documentation** | 3 pts | Complete README and lab submission docs | +| **Configuration** | 2 pts | Dependencies, environment vars, .gitignore | +| **Bonus** | 2.5 pts | Compiled language implementation | +| **Total** | 12.5 pts | 10 pts required + 2.5 pts bonus | + +**Grading Scale:** +- **10/10:** Perfect implementation, excellent documentation +- **8-9/10:** All works, good docs, minor improvements possible +- **6-7/10:** Core functionality present, basic documentation +- **<6/10:** Missing features or documentation, needs revision + +--- + +## Resources + +
+📚 Python Web Frameworks + +- [Flask 3.1 Documentation](https://flask.palletsprojects.com/en/latest/) +- [Flask Quickstart](https://flask.palletsprojects.com/en/latest/quickstart/) +- [FastAPI Documentation](https://fastapi.tiangolo.com/) +- [FastAPI Tutorial](https://fastapi.tiangolo.com/tutorial/first-steps/) +- [Django 5.1 Documentation](https://docs.djangoproject.com/en/5.1/) + +
+ +
+🐍 Python Best Practices + +- [PEP 8 Style Guide](https://pep8.org/) +- [Python Logging Tutorial](https://docs.python.org/3/howto/logging.html) +- [Python platform module](https://docs.python.org/3/library/platform.html) +- [Python socket module](https://docs.python.org/3/library/socket.html) + +
+ +
+🔧 Compiled Languages (Bonus) + +- [Go Web Development](https://golang.org/doc/articles/wiki/) +- [Go net/http Package](https://pkg.go.dev/net/http) +- [Rust Web Frameworks](https://www.arewewebyet.org/) +- [Spring Boot Quickstart](https://spring.io/quickstart) +- [ASP.NET Core Tutorial](https://docs.microsoft.com/aspnet/core/) + +
+ +
+🛠️ Development Tools + +- [Postman](https://www.postman.com/) - API testing +- [HTTPie](https://httpie.io/) - Command-line HTTP client +- [curl](https://curl.se/) - Data transfer tool +- [jq](https://stedolan.github.io/jq/) - JSON processor + +
+ +--- + +## Looking Ahead + +This service evolves throughout the course: + +- **Lab 2:** Containerize with Docker, multi-stage builds +- **Lab 3:** Add unit tests and CI/CD pipeline +- **Lab 8:** Add `/metrics` endpoint for Prometheus +- **Lab 9:** Deploy to Kubernetes using `/health` probes +- **Lab 12:** Add `/visits` endpoint with file persistence +- **Lab 13:** Multi-environment deployment with GitOps + +--- + +**Good luck!** 🚀 + +> **Remember:** Keep it simple, write clean code, and document thoroughly. This foundation will carry through all 16 labs! diff --git a/labs/lab02.md b/labs/lab02.md index 1c3e032f89..448a84a2ca 100644 --- a/labs/lab02.md +++ b/labs/lab02.md @@ -1,366 +1,366 @@ -# Lab 2 — Docker Containerization - -![difficulty](https://img.shields.io/badge/difficulty-beginner-success) -![topic](https://img.shields.io/badge/topic-Containerization-blue) -![points](https://img.shields.io/badge/points-10%2B2.5-orange) -![tech](https://img.shields.io/badge/tech-Docker-informational) - -> Containerize your Python app from Lab 1 using Docker best practices and publish it to Docker Hub. - -## Overview - -Take your Lab 1 application and package it into a Docker container. Learn image optimization, security basics, and the Docker workflow used in production. - -**What You'll Learn:** -- Writing production-ready Dockerfiles -- Docker best practices and security -- Image optimization techniques -- Docker Hub workflow - -**Tech Stack:** Docker 25+ | Python 3.13-slim | Multi-stage builds - ---- - -## Tasks - -### Task 1 — Create Dockerfile (4 pts) - -**Objective:** Write a Dockerfile that containerizes your Python app following best practices. 
- -Create `app_python/Dockerfile` with these requirements: - -**Must Have:** -- Non-root user (mandatory) -- Specific base image version (e.g., `python:3.13-slim` or `python:3.12-slim`) -- Only copy necessary files -- Proper layer ordering -- `.dockerignore` file - -**Your app should work the same way in the container as it did locally.** - -
-💡 Dockerfile Concepts & Resources - -**Key Dockerfile Instructions to Research:** -- `FROM` - Choose your base image (look at python:3.13-slim, python:3.12-slim, python:3.13-alpine) -- `RUN` - Execute commands (creating users, installing packages) -- `WORKDIR` - Set working directory -- `COPY` - Copy files into the image -- `USER` - Switch to non-root user -- `EXPOSE` - Document which port your app uses -- `CMD` - Define how to start your application - -**Critical Concepts:** -- **Layer Caching**: Why does the order of COPY commands matter? -- **Non-root User**: How do you create and switch to a non-root user? -- **Base Image Selection**: What's the difference between slim, alpine, and full images? -- **Dependency Installation**: Why copy requirements.txt separately from application code? - -**Resources:** -- [Dockerfile Reference](https://docs.docker.com/reference/dockerfile/) -- [Best Practices Guide](https://docs.docker.com/build/building/best-practices/) -- [Python Image Variants](https://hub.docker.com/_/python) - Use 3.13-slim or 3.12-slim - -**Think About:** -- What happens if you copy all files before installing dependencies? -- Why shouldn't you run as root? -- How does layer caching speed up rebuilds? - -
- -
-💡 .dockerignore Concepts - -**Purpose:** Prevent unnecessary files from being sent to Docker daemon during build (faster builds, smaller context). - -**What Should You Exclude?** -Think about what doesn't need to be in your container: -- Development artifacts (like Python's `__pycache__`, `*.pyc`) -- Version control files (`.git` directory) -- IDE configuration files -- Virtual environments (`venv/`, `.venv/`) -- Documentation that's not needed at runtime -- Test files (if not running tests in container) - -**Key Question:** Why does excluding files from the build context matter for build speed? - -**Resources:** -- [.dockerignore Documentation](https://docs.docker.com/engine/reference/builder/#dockerignore-file) -- Look at your `.gitignore` for inspiration - many patterns overlap - -**Exercise:** Start minimal and add exclusions as needed, rather than copying a huge list you don't understand. - -
- -**Test Your Container:** - -You should be able to: -1. Build your image using the `docker build` command -2. Run a container from your image with proper port mapping -3. Access your application endpoints from the host machine - -Verify that your application works the same way in the container as it did locally. - ---- - -### Task 2 — Docker Hub (2 pts) - -**Objective:** Publish your image to Docker Hub. - -**Requirements:** -1. Create a Docker Hub account (if you don't have one) -2. Tag your image with your Docker Hub username -3. Authenticate with Docker Hub -4. Push your image to the registry -5. Verify the image is publicly accessible - -**Documentation Required:** -- Terminal output showing successful push -- Docker Hub repository URL -- Explanation of your tagging strategy - -
-💡 Docker Hub Resources - -**Useful Commands:** -- `docker tag` - Tag images for registry push -- `docker login` - Authenticate with Docker Hub -- `docker push` - Upload image to registry -- `docker pull` - Download image from registry - -**Resources:** -- [Docker Hub Quickstart](https://docs.docker.com/docker-hub/quickstart/) -- [Docker Tag Reference](https://docs.docker.com/reference/cli/docker/image/tag/) -- [Best Practices for Tagging](https://docs.docker.com/build/building/best-practices/#tagging) - -
- ---- - -### Task 3 — Documentation (4 pts) - -**Objective:** Document your Docker implementation with focus on understanding and decisions. - -#### 3.1 Update `app_python/README.md` - -Add a **Docker** section explaining how to use your containerized application. Include command patterns (not exact commands) for: -- Building the image locally -- Running a container -- Pulling from Docker Hub - -#### 3.2 Create `app_python/docs/LAB02.md` - -Document your implementation with these sections: - -**Required Sections:** - -1. **Docker Best Practices Applied** - - List each practice you implemented (non-root user, layer caching, .dockerignore, etc.) - - Explain WHY each matters (not just what it does) - - Include relevant Dockerfile snippets with explanations - -2. **Image Information & Decisions** - - Base image chosen and justification (why this specific version?) - - Final image size and your assessment - - Layer structure explanation - - Optimization choices you made - -3. **Build & Run Process** - - Complete terminal output from your build process - - Terminal output showing container running - - Terminal output from testing endpoints (curl/httpie) - - Docker Hub repository URL - -4. **Technical Analysis** - - Why does your Dockerfile work the way it does? - - What would happen if you changed the layer order? - - What security considerations did you implement? - - How does .dockerignore improve your build? - -5. **Challenges & Solutions** - - Issues encountered during implementation - - How you debugged and resolved them - - What you learned from the process - ---- - -## Bonus Task — Multi-Stage Build (2.5 pts) - -**Objective:** Containerize your compiled language app (from Lab 1 bonus) using multi-stage builds. - -**Why Multi-Stage?** Separate build environment from runtime → smaller final image. - -**Example Flow:** -1. **Stage 1 (Builder):** Compile the app (large image with compilers) -2. 
**Stage 2 (Runtime):** Copy only the binary (small image, no build tools) - -
-💡 Multi-Stage Build Concepts - -**The Problem:** Compiled language images include the entire compiler/SDK in the final image (huge!). - -**The Solution:** Use multiple `FROM` statements: -- **Stage 1 (Builder)**: Use full SDK image, compile your application -- **Stage 2 (Runtime)**: Use minimal base image, copy only the compiled binary - -**Key Concepts to Research:** -- How to name build stages (`AS builder`) -- How to copy files from previous stages (`COPY --from=builder`) -- Choosing runtime base images (alpine, distroless, scratch) -- Static vs dynamic compilation (affects what base image you can use) - -**Questions to Explore:** -- What's the size difference between your builder and final image? -- Why can't you just use the builder image as your final image? -- What security benefits come from smaller images? -- Can you use `FROM scratch`? Why or why not? - -**Resources:** -- [Multi-Stage Builds Documentation](https://docs.docker.com/build/building/multi-stage/) -- [Distroless Base Images](https://github.com/GoogleContainerTools/distroless) -- Language-specific: Search "Go static binary Docker" or "Rust alpine Docker" - -**Challenge:** Try to get your final image under 20MB. - -
- -**Requirements:** -- Multi-stage Dockerfile in `app_go/` (or your chosen language) -- Working containerized application -- Documentation in `app_go/docs/LAB02.md` explaining: - - Your multi-stage build strategy - - Size comparison with analysis (builder vs final image) - - Why multi-stage builds matter for compiled languages - - Terminal output showing build process and image sizes - - Technical explanation of each stage's purpose - -**Bonus Points Given For:** -- Significant size reduction achieved with clear metrics -- Deep understanding of multi-stage build benefits -- Analysis of security implications (smaller attack surface) -- Explanation of trade-offs and decisions made - ---- - -## How to Submit - -1. **Create Branch:** Create a new branch called `lab02` - -2. **Commit Work:** - - Add your changes (app_python/ directory with Dockerfile, .dockerignore, updated docs) - - Commit with a descriptive message following conventional commits format - - Push to your fork - -3. **Create Pull Requests:** - - **PR #1:** `your-fork:lab02` → `course-repo:master` - - **PR #2:** `your-fork:lab02` → `your-fork:master` - ---- - -## Acceptance Criteria - -### Main Tasks (10 points) - -**Dockerfile (4 pts):** -- [ ] Dockerfile exists in `app_python/` -- [ ] Uses specific base image version -- [ ] Runs as non-root user (USER directive) -- [ ] Proper layer ordering (dependencies before code) -- [ ] Only copies necessary files -- [ ] `.dockerignore` file present -- [ ] Image builds successfully -- [ ] Container runs and app works - -**Docker Hub (2 pts):** -- [ ] Image pushed to Docker Hub -- [ ] Image is publicly accessible -- [ ] Correct tagging used -- [ ] Can pull and run from Docker Hub - -**Documentation (4 pts):** -- [ ] `app_python/README.md` has Docker section with command patterns -- [ ] `app_python/docs/LAB02.md` complete with: - - [ ] Best practices explained with WHY (not just what) - - [ ] Image information and justifications for choices - - [ ] Terminal output 
from build, run, and testing - - [ ] Technical analysis demonstrating understanding - - [ ] Challenges and solutions documented - - [ ] Docker Hub repository URL provided - -### Bonus Task (2.5 points) - -- [ ] Multi-stage Dockerfile for compiled language app -- [ ] Working containerized application -- [ ] Documentation in `app_/docs/LAB02.md` with: - - [ ] Multi-stage strategy explained - - [ ] Terminal output showing image sizes (builder vs final) - - [ ] Analysis of size reduction and why it matters - - [ ] Technical explanation of each stage - - [ ] Security benefits discussed - ---- - -## Rubric - -| Criteria | Points | Description | -|----------|--------|-------------| -| **Dockerfile** | 4 pts | Correct, secure, optimized | -| **Docker Hub** | 2 pts | Successfully published | -| **Documentation** | 4 pts | Complete and clear | -| **Bonus** | 2.5 pts | Multi-stage implementation | -| **Total** | 12.5 pts | 10 pts required + 2.5 pts bonus | - -**Grading:** -- **10/10:** Perfect Dockerfile, deep understanding demonstrated, excellent analysis -- **8-9/10:** Working container, good practices, solid understanding shown -- **6-7/10:** Container works, basic security, surface-level explanations -- **<6/10:** Missing requirements, runs as root, copy-paste without understanding - ---- - -## Resources - -
-📚 Docker Documentation - -- [Dockerfile Best Practices](https://docs.docker.com/build/building/best-practices/) -- [Dockerfile Reference](https://docs.docker.com/reference/dockerfile/) -- [Multi-Stage Builds](https://docs.docker.com/build/building/multi-stage/) -- [.dockerignore](https://docs.docker.com/reference/dockerfile/#dockerignore-file) -- [Docker Build Guide](https://docs.docker.com/build/guide/) - -
- -
-🔒 Security Resources - -- [Docker Security Best Practices](https://docs.docker.com/build/building/best-practices/#security) -- [Snyk Docker Security](https://snyk.io/learn/docker-security-scanning/) -- [Why Non-Root Containers](https://docs.docker.com/build/building/best-practices/#user) -- [Distroless Images](https://github.com/GoogleContainerTools/distroless) - Minimal base images - -
- -
-🛠️ Tools - -- [Hadolint](https://github.com/hadolint/hadolint) - Dockerfile linter -- [Dive](https://github.com/wagoodman/dive) - Explore image layers -- [Docker Hub](https://hub.docker.com/) - Container registry - -
- ---- - -## Looking Ahead - -- **Lab 3:** CI/CD will automatically build these Docker images -- **Lab 7-8:** Deploy containers with docker-compose for logging/monitoring -- **Lab 9:** Run these containers in Kubernetes -- **Lab 13:** ArgoCD will deploy containerized apps automatically - ---- - -**Good luck!** 🚀 - -> **Remember:** Understanding beats copy-paste. Explain your decisions, not just your actions. Run as non-root or no points! +# Lab 2 — Docker Containerization + +![difficulty](https://img.shields.io/badge/difficulty-beginner-success) +![topic](https://img.shields.io/badge/topic-Containerization-blue) +![points](https://img.shields.io/badge/points-10%2B2.5-orange) +![tech](https://img.shields.io/badge/tech-Docker-informational) + +> Containerize your Python app from Lab 1 using Docker best practices and publish it to Docker Hub. + +## Overview + +Take your Lab 1 application and package it into a Docker container. Learn image optimization, security basics, and the Docker workflow used in production. + +**What You'll Learn:** +- Writing production-ready Dockerfiles +- Docker best practices and security +- Image optimization techniques +- Docker Hub workflow + +**Tech Stack:** Docker 25+ | Python 3.13-slim | Multi-stage builds + +--- + +## Tasks + +### Task 1 — Create Dockerfile (4 pts) + +**Objective:** Write a Dockerfile that containerizes your Python app following best practices. + +Create `app_python/Dockerfile` with these requirements: + +**Must Have:** +- Non-root user (mandatory) +- Specific base image version (e.g., `python:3.13-slim` or `python:3.12-slim`) +- Only copy necessary files +- Proper layer ordering +- `.dockerignore` file + +**Your app should work the same way in the container as it did locally.** + +
+💡 Dockerfile Concepts & Resources + +**Key Dockerfile Instructions to Research:** +- `FROM` - Choose your base image (look at python:3.13-slim, python:3.12-slim, python:3.13-alpine) +- `RUN` - Execute commands (creating users, installing packages) +- `WORKDIR` - Set working directory +- `COPY` - Copy files into the image +- `USER` - Switch to non-root user +- `EXPOSE` - Document which port your app uses +- `CMD` - Define how to start your application + +**Critical Concepts:** +- **Layer Caching**: Why does the order of COPY commands matter? +- **Non-root User**: How do you create and switch to a non-root user? +- **Base Image Selection**: What's the difference between slim, alpine, and full images? +- **Dependency Installation**: Why copy requirements.txt separately from application code? + +**Resources:** +- [Dockerfile Reference](https://docs.docker.com/reference/dockerfile/) +- [Best Practices Guide](https://docs.docker.com/build/building/best-practices/) +- [Python Image Variants](https://hub.docker.com/_/python) - Use 3.13-slim or 3.12-slim + +**Think About:** +- What happens if you copy all files before installing dependencies? +- Why shouldn't you run as root? +- How does layer caching speed up rebuilds? + +
+ +
+<summary>💡 .dockerignore Concepts</summary>
+
+**Purpose:** Prevent unnecessary files from being sent to Docker daemon during build (faster builds, smaller context).
+
+**What Should You Exclude?**
+Think about what doesn't need to be in your container:
+- Development artifacts (like Python's `__pycache__`, `*.pyc`)
+- Version control files (`.git` directory)
+- IDE configuration files
+- Virtual environments (`venv/`, `.venv/`)
+- Documentation that's not needed at runtime
+- Test files (if not running tests in container)
+
+**Key Question:** Why does excluding files from the build context matter for build speed?
+
+**Resources:**
+- [.dockerignore Documentation](https://docs.docker.com/reference/dockerfile/#dockerignore-file)
+- Look at your `.gitignore` for inspiration - many patterns overlap
+
+**Exercise:** Start minimal and add exclusions as needed, rather than copying a huge list you don't understand.
+
+</details>
+ +**Test Your Container:** + +You should be able to: +1. Build your image using the `docker build` command +2. Run a container from your image with proper port mapping +3. Access your application endpoints from the host machine + +Verify that your application works the same way in the container as it did locally. + +--- + +### Task 2 — Docker Hub (2 pts) + +**Objective:** Publish your image to Docker Hub. + +**Requirements:** +1. Create a Docker Hub account (if you don't have one) +2. Tag your image with your Docker Hub username +3. Authenticate with Docker Hub +4. Push your image to the registry +5. Verify the image is publicly accessible + +**Documentation Required:** +- Terminal output showing successful push +- Docker Hub repository URL +- Explanation of your tagging strategy + +
+💡 Docker Hub Resources + +**Useful Commands:** +- `docker tag` - Tag images for registry push +- `docker login` - Authenticate with Docker Hub +- `docker push` - Upload image to registry +- `docker pull` - Download image from registry + +**Resources:** +- [Docker Hub Quickstart](https://docs.docker.com/docker-hub/quickstart/) +- [Docker Tag Reference](https://docs.docker.com/reference/cli/docker/image/tag/) +- [Best Practices for Tagging](https://docs.docker.com/build/building/best-practices/#tagging) + +
+ +--- + +### Task 3 — Documentation (4 pts) + +**Objective:** Document your Docker implementation with focus on understanding and decisions. + +#### 3.1 Update `app_python/README.md` + +Add a **Docker** section explaining how to use your containerized application. Include command patterns (not exact commands) for: +- Building the image locally +- Running a container +- Pulling from Docker Hub + +#### 3.2 Create `app_python/docs/LAB02.md` + +Document your implementation with these sections: + +**Required Sections:** + +1. **Docker Best Practices Applied** + - List each practice you implemented (non-root user, layer caching, .dockerignore, etc.) + - Explain WHY each matters (not just what it does) + - Include relevant Dockerfile snippets with explanations + +2. **Image Information & Decisions** + - Base image chosen and justification (why this specific version?) + - Final image size and your assessment + - Layer structure explanation + - Optimization choices you made + +3. **Build & Run Process** + - Complete terminal output from your build process + - Terminal output showing container running + - Terminal output from testing endpoints (curl/httpie) + - Docker Hub repository URL + +4. **Technical Analysis** + - Why does your Dockerfile work the way it does? + - What would happen if you changed the layer order? + - What security considerations did you implement? + - How does .dockerignore improve your build? + +5. **Challenges & Solutions** + - Issues encountered during implementation + - How you debugged and resolved them + - What you learned from the process + +--- + +## Bonus Task — Multi-Stage Build (2.5 pts) + +**Objective:** Containerize your compiled language app (from Lab 1 bonus) using multi-stage builds. + +**Why Multi-Stage?** Separate build environment from runtime → smaller final image. + +**Example Flow:** +1. **Stage 1 (Builder):** Compile the app (large image with compilers) +2. 
**Stage 2 (Runtime):** Copy only the binary (small image, no build tools) + +
+💡 Multi-Stage Build Concepts + +**The Problem:** Compiled language images include the entire compiler/SDK in the final image (huge!). + +**The Solution:** Use multiple `FROM` statements: +- **Stage 1 (Builder)**: Use full SDK image, compile your application +- **Stage 2 (Runtime)**: Use minimal base image, copy only the compiled binary + +**Key Concepts to Research:** +- How to name build stages (`AS builder`) +- How to copy files from previous stages (`COPY --from=builder`) +- Choosing runtime base images (alpine, distroless, scratch) +- Static vs dynamic compilation (affects what base image you can use) + +**Questions to Explore:** +- What's the size difference between your builder and final image? +- Why can't you just use the builder image as your final image? +- What security benefits come from smaller images? +- Can you use `FROM scratch`? Why or why not? + +**Resources:** +- [Multi-Stage Builds Documentation](https://docs.docker.com/build/building/multi-stage/) +- [Distroless Base Images](https://github.com/GoogleContainerTools/distroless) +- Language-specific: Search "Go static binary Docker" or "Rust alpine Docker" + +**Challenge:** Try to get your final image under 20MB. + +
+ +**Requirements:** +- Multi-stage Dockerfile in `app_go/` (or your chosen language) +- Working containerized application +- Documentation in `app_go/docs/LAB02.md` explaining: + - Your multi-stage build strategy + - Size comparison with analysis (builder vs final image) + - Why multi-stage builds matter for compiled languages + - Terminal output showing build process and image sizes + - Technical explanation of each stage's purpose + +**Bonus Points Given For:** +- Significant size reduction achieved with clear metrics +- Deep understanding of multi-stage build benefits +- Analysis of security implications (smaller attack surface) +- Explanation of trade-offs and decisions made + +--- + +## How to Submit + +1. **Create Branch:** Create a new branch called `lab02` + +2. **Commit Work:** + - Add your changes (app_python/ directory with Dockerfile, .dockerignore, updated docs) + - Commit with a descriptive message following conventional commits format + - Push to your fork + +3. **Create Pull Requests:** + - **PR #1:** `your-fork:lab02` → `course-repo:master` + - **PR #2:** `your-fork:lab02` → `your-fork:master` + +--- + +## Acceptance Criteria + +### Main Tasks (10 points) + +**Dockerfile (4 pts):** +- [ ] Dockerfile exists in `app_python/` +- [ ] Uses specific base image version +- [ ] Runs as non-root user (USER directive) +- [ ] Proper layer ordering (dependencies before code) +- [ ] Only copies necessary files +- [ ] `.dockerignore` file present +- [ ] Image builds successfully +- [ ] Container runs and app works + +**Docker Hub (2 pts):** +- [ ] Image pushed to Docker Hub +- [ ] Image is publicly accessible +- [ ] Correct tagging used +- [ ] Can pull and run from Docker Hub + +**Documentation (4 pts):** +- [ ] `app_python/README.md` has Docker section with command patterns +- [ ] `app_python/docs/LAB02.md` complete with: + - [ ] Best practices explained with WHY (not just what) + - [ ] Image information and justifications for choices + - [ ] Terminal output 
from build, run, and testing
+  - [ ] Technical analysis demonstrating understanding
+  - [ ] Challenges and solutions documented
+  - [ ] Docker Hub repository URL provided
+
+### Bonus Task (2.5 points)
+
+- [ ] Multi-stage Dockerfile for compiled language app
+- [ ] Working containerized application
+- [ ] Documentation in `app_<language>/docs/LAB02.md` with:
+  - [ ] Multi-stage strategy explained
+  - [ ] Terminal output showing image sizes (builder vs final)
+  - [ ] Analysis of size reduction and why it matters
+  - [ ] Technical explanation of each stage
+  - [ ] Security benefits discussed
+
+---
+
+## Rubric
+
+| Criteria | Points | Description |
+|----------|--------|-------------|
+| **Dockerfile** | 4 pts | Correct, secure, optimized |
+| **Docker Hub** | 2 pts | Successfully published |
+| **Documentation** | 4 pts | Complete and clear |
+| **Bonus** | 2.5 pts | Multi-stage implementation |
+| **Total** | 12.5 pts | 10 pts required + 2.5 pts bonus |
+
+**Grading:**
+- **10/10:** Perfect Dockerfile, deep understanding demonstrated, excellent analysis
+- **8-9/10:** Working container, good practices, solid understanding shown
+- **6-7/10:** Container works, basic security, surface-level explanations
+- **<6/10:** Missing requirements, runs as root, copy-paste without understanding
+
+---
+
+## Resources
+
+<details>
+📚 Docker Documentation + +- [Dockerfile Best Practices](https://docs.docker.com/build/building/best-practices/) +- [Dockerfile Reference](https://docs.docker.com/reference/dockerfile/) +- [Multi-Stage Builds](https://docs.docker.com/build/building/multi-stage/) +- [.dockerignore](https://docs.docker.com/reference/dockerfile/#dockerignore-file) +- [Docker Build Guide](https://docs.docker.com/build/guide/) + +
+ +
+🔒 Security Resources + +- [Docker Security Best Practices](https://docs.docker.com/build/building/best-practices/#security) +- [Snyk Docker Security](https://snyk.io/learn/docker-security-scanning/) +- [Why Non-Root Containers](https://docs.docker.com/build/building/best-practices/#user) +- [Distroless Images](https://github.com/GoogleContainerTools/distroless) - Minimal base images + +
+ +
+🛠️ Tools + +- [Hadolint](https://github.com/hadolint/hadolint) - Dockerfile linter +- [Dive](https://github.com/wagoodman/dive) - Explore image layers +- [Docker Hub](https://hub.docker.com/) - Container registry + +
+ +--- + +## Looking Ahead + +- **Lab 3:** CI/CD will automatically build these Docker images +- **Lab 7-8:** Deploy containers with docker-compose for logging/monitoring +- **Lab 9:** Run these containers in Kubernetes +- **Lab 13:** ArgoCD will deploy containerized apps automatically + +--- + +**Good luck!** 🚀 + +> **Remember:** Understanding beats copy-paste. Explain your decisions, not just your actions. Run as non-root or no points! diff --git a/labs/lab03.md b/labs/lab03.md index 9824e934b3..d0acb4da96 100644 --- a/labs/lab03.md +++ b/labs/lab03.md @@ -1,931 +1,931 @@ -# Lab 3 — Continuous Integration (CI/CD) - -![difficulty](https://img.shields.io/badge/difficulty-beginner-success) -![topic](https://img.shields.io/badge/topic-CI/CD-blue) -![points](https://img.shields.io/badge/points-10%2B2.5-orange) -![tech](https://img.shields.io/badge/tech-GitHub%20Actions-informational) - -> Automate your Python app testing and Docker builds with GitHub Actions CI/CD pipeline. - -## Overview - -Take your containerized app from Labs 1-2 and add automated testing and deployment. Learn how CI/CD catches bugs early, ensures code quality, and automates the Docker build/push workflow. - -**What You'll Learn:** -- Writing effective unit tests -- GitHub Actions workflow syntax -- CI/CD best practices (caching, matrix builds, security scanning) -- Automated Docker image publishing -- Continuous integration for multiple applications - -**Tech Stack:** GitHub Actions | pytest 8+ | Python 3.11+ | Snyk | Docker - -**Connection to Previous Labs:** -- **Lab 1:** Test the endpoints you created -- **Lab 2:** Automate the Docker build/push workflow -- **Lab 4+:** This CI pipeline will run for all future labs - ---- - -## Tasks - -### Task 1 — Unit Testing (3 pts) - -**Objective:** Write comprehensive unit tests for your Python application to ensure reliability. - -**Requirements:** - -1. **Choose a Testing Framework** - - Research Python testing frameworks (pytest, unittest, etc.) 
- - Select one and justify your choice - - Install it in your `requirements.txt` or create `requirements-dev.txt` - -2. **Write Unit Tests** - - Create `app_python/tests/` directory - - Write tests for **all** your endpoints: - - `GET /` - Verify JSON structure and required fields - - `GET /health` - Verify health check response - - Test both successful responses and error cases - - Aim for meaningful test coverage (not just basic smoke tests) - -3. **Run Tests Locally** - - Verify all tests pass locally before CI setup - - Document how to run tests in your README - -
-💡 Testing Framework Guidance - -**Popular Python Testing Frameworks:** - -**pytest (Recommended):** -- Pros: Simple syntax, powerful fixtures, excellent plugin ecosystem -- Cons: Additional dependency -- Use case: Most modern Python projects - -**unittest:** -- Pros: Built into Python (no extra dependencies) -- Cons: More verbose, less modern features -- Use case: Minimal dependency projects - -**Key Testing Concepts to Research:** -- Test fixtures and setup/teardown -- Mocking external dependencies -- Testing HTTP endpoints (test client usage) -- Test coverage measurement -- Assertions and expected vs actual results - -**What Should You Test?** -- Correct HTTP status codes (200, 404, 500) -- Response data structure (JSON fields present) -- Response data types (strings, integers, etc.) -- Edge cases (invalid requests, missing data) -- Error handling (what happens when things fail?) - -**Questions to Consider:** -- How do you test a Flask/FastAPI app without starting the server? -- Should you test that `hostname` returns your actual hostname, or just that the field exists? -- How do you simulate different client IPs or user agents in tests? - -**Resources:** -- [Pytest Documentation](https://docs.pytest.org/) -- [Flask Testing](https://flask.palletsprojects.com/en/stable/testing/) -- [FastAPI Testing](https://fastapi.tiangolo.com/tutorial/testing/) -- [Python unittest](https://docs.python.org/3/library/unittest.html) - -**Anti-Patterns to Avoid:** -- Testing framework functionality instead of your code -- Tests that always pass regardless of implementation -- Tests with no assertions -- Tests that depend on external services - -
- -**What to Document:** -- Your testing framework choice and why -- Test structure explanation -- How to run tests locally -- Terminal output showing all tests passing - ---- - -### Task 2 — GitHub Actions CI Workflow (4 pts) - -**Objective:** Create a GitHub Actions workflow that automatically tests your code and builds Docker images with proper versioning. - -**Requirements:** - -1. **Create Workflow File** - - Create `.github/workflows/python-ci.yml` in your repository - - Name your workflow descriptively - -2. **Implement Essential CI Steps** - - Your workflow must include these logical stages: - - **a) Code Quality & Testing:** - - Install dependencies - - Run a linter (pylint, flake8, black, ruff, etc.) - - Run your unit tests - - **b) Docker Build & Push with Versioning:** - - Authenticate with Docker Hub - - Build your Docker image - - Tag with proper version strategy (see versioning section below) - - Push to Docker Hub with multiple tags - -3. **Versioning Strategy** - - Choose **one** versioning approach and implement it: - - **Option A: Semantic Versioning (SemVer)** - - Version format: `v1.2.3` (major.minor.patch) - - Use git tags for releases - - Tag images like: `username/app:1.2.3`, `username/app:1.2`, `username/app:latest` - - **When to use:** Traditional software releases with breaking changes - - **Option B: Calendar Versioning (CalVer)** - - Version format: `2024.01.15` or `2024.01` (year.month.day or year.month) - - Based on release date - - Tag images like: `username/app:2024.01`, `username/app:latest` - - **When to use:** Time-based releases, continuous deployment - - **Required:** - - Document which strategy you chose and why - - Implement it in your CI workflow - - Show at least 2 tags per image (e.g., version + latest) - -4. **Workflow Triggers** - - Configure when the workflow runs (push, pull request, etc.) - - Consider which branches should trigger builds - -5. 
**Testing the Workflow** - - Push your workflow file and verify it runs - - Fix any issues that arise - - Ensure all steps complete successfully - - Verify Docker Hub shows your version tags - -
-💡 GitHub Actions Concepts - -**Core Concepts to Research:** - -**Workflow Anatomy:** -- `name` - What is your workflow called? -- `on` - When does it run? (push, pull_request, schedule, etc.) -- `jobs` - What work needs to be done? -- `steps` - Individual commands within a job -- `runs-on` - What OS environment? (ubuntu-latest, etc.) - -**Key Questions:** -- Should you run CI on every push, or only on pull requests? -- What happens if tests fail? Should the workflow continue? -- How do you access secrets (like Docker Hub credentials) securely? -- Why might you want multiple jobs vs multiple steps in one job? - -**Python CI Steps Pattern:** -```yaml -# This is a pattern, not exact copy-paste code -# Research the actual syntax and actions needed - -- Set up Python environment -- Install dependencies -- Run linter -- Run tests -``` - -**Docker CI Steps Pattern:** -```yaml -# This is a pattern, not exact copy-paste code -# Research the actual actions and their parameters - -- Log in to Docker Hub -- Extract metadata for tags -- Build and push Docker image -``` - -**Important Concepts:** -- **Actions Marketplace:** Reusable actions (actions/checkout@v4, actions/setup-python@v5, docker/build-push-action@v6) -- **Secrets:** How to store Docker Hub credentials securely -- **Job Dependencies:** Can one job depend on another succeeding? 
-- **Matrix Builds:** Testing multiple Python versions (optional but good to know) -- **Caching:** Speed up workflows by caching dependencies (we'll add this in Task 3) - -**Resources:** -- [GitHub Actions Documentation](https://docs.github.com/en/actions) -- [Building and Testing Python](https://docs.github.com/en/actions/automating-builds-and-tests/building-and-testing-python) -- [Publishing Docker Images](https://docs.docker.com/ci-cd/github-actions/) -- [GitHub Actions Marketplace](https://github.com/marketplace?type=actions) -- [Workflow Syntax](https://docs.github.com/en/actions/using-workflows/workflow-syntax-for-github-actions) - -**Security Best Practices:** -- Never hardcode passwords or tokens in workflow files -- Use GitHub Secrets for sensitive data -- Understand when secrets are exposed to pull requests from forks -- Use `secrets.GITHUB_TOKEN` for GitHub API access (auto-provided) - -**Docker Hub Authentication:** -You'll need to create a Docker Hub access token and add it as a GitHub Secret. Research: -- How to create Docker Hub access tokens -- How to add secrets to your GitHub repository -- How to reference secrets in workflow files (hint: `${{ secrets.NAME }}`) - -
- -
-💡 Versioning Strategy Guidance - -**Semantic Versioning (SemVer):** - -**Format:** MAJOR.MINOR.PATCH (e.g., 1.2.3) -- **MAJOR:** Breaking changes (incompatible API changes) -- **MINOR:** New features (backward-compatible) -- **PATCH:** Bug fixes (backward-compatible) - -**Implementation Approaches:** -1. **Manual Git Tags:** Create git tags (v1.0.0) and reference in workflow -2. **Automated from Commits:** Parse conventional commits to bump version -3. **GitHub Releases:** Trigger on release creation - -**Docker Tagging Example:** -- `username/app:1.2.3` (full version) -- `username/app:1.2` (minor version, rolling) -- `username/app:1` (major version, rolling) -- `username/app:latest` (latest stable) - -**Pros:** Clear when breaking changes occur, industry standard for libraries -**Cons:** Requires discipline to follow rules correctly - ---- - -**Calendar Versioning (CalVer):** - -**Common Formats:** -- `YYYY.MM.DD` (e.g., 2024.01.15) - Daily releases -- `YYYY.MM.MICRO` (e.g., 2024.01.0) - Monthly with patch number -- `YYYY.0M` (e.g., 2024.01) - Monthly releases - -**Implementation Approaches:** -1. **Date-based:** Generate from current date in workflow -2. **Git SHA:** Combine with short commit SHA (2024.01-a1b2c3d) -3. 
**Build Number:** Use GitHub run number (2024.01.42) - -**Docker Tagging Example:** -- `username/app:2024.01` (month version) -- `username/app:2024.01.123` (with build number) -- `username/app:latest` (latest build) - -**Pros:** No ambiguity, good for continuous deployment, easier to remember -**Cons:** Doesn't indicate breaking changes - ---- - -**How to Implement in CI:** - -**Using docker/metadata-action:** -```yaml -# Pattern - research actual syntax -- name: Docker metadata - uses: docker/metadata-action - with: - # Define your tagging strategy here - # Can reference git tags, dates, commit SHAs -``` - -**Manual Tagging:** -```yaml -# Pattern - research actual syntax -- name: Generate version - run: echo "VERSION=$(date +%Y.%m.%d)" >> $GITHUB_ENV - -- name: Build and push - # Use ${{ env.VERSION }} in tags -``` - -**Questions to Consider:** -- How often will you release? (Daily? Per feature? Monthly?) -- Do users need to know about breaking changes explicitly? -- Are you building a library (use SemVer) or a service (CalVer works)? -- How will you track what's in each version? - -**Resources:** -- [Semantic Versioning](https://semver.org/) -- [Calendar Versioning](https://calver.org/) -- [Docker Metadata Action](https://github.com/docker/metadata-action) -- [Conventional Commits](https://www.conventionalcommits.org/) (for automated SemVer) - -
- -
-💡 Debugging GitHub Actions - -**Common Issues & How to Debug:** - -**Workflow Won't Trigger:** -- Check your `on:` configuration -- Verify you pushed to the correct branch -- Look at Actions tab for filtering options - -**Steps Failing:** -- Click into the failed step to see full logs -- Check for typos in action names or parameters -- Verify secrets are configured correctly -- Test commands locally first - -**Docker Build Fails:** -- Ensure Dockerfile is in the correct location -- Check context path in build step -- Verify base image exists and is accessible -- Test Docker build locally first - -**Authentication Issues:** -- Verify secret names match exactly (case-sensitive) -- Check that Docker Hub token has write permissions -- Ensure you're using `docker/login-action` correctly - -**Debugging Techniques:** -- Add `run: echo "Debug message"` steps to understand workflow state -- Use `run: env` to see available environment variables -- Check Actions tab for detailed logs -- Enable debug logging (add `ACTIONS_RUNNER_DEBUG` secret = true) - -
- -**What to Document:** -- Your workflow trigger strategy and reasoning -- Why you chose specific actions from the marketplace -- Your Docker tagging strategy (latest? version tags? commit SHA?) -- Link to successful workflow run in GitHub Actions tab -- Terminal output or screenshot of green checkmark - ---- - -### Task 3 — CI Best Practices & Security (3 pts) - -**Objective:** Optimize your CI workflow and add security scanning. - -**Requirements:** - -1. **Add Status Badge** - - Add a GitHub Actions status badge to your `app_python/README.md` - - The badge should show the current workflow status (passing/failing) - -2. **Implement Dependency Caching** - - Add caching for Python dependencies to speed up workflow - - Measure and document the speed improvement - -3. **Add Security Scanning with Snyk** - - Integrate Snyk vulnerability scanning into your workflow - - Configure it to check for vulnerabilities in your dependencies - - Document any vulnerabilities found and how you addressed them - -4. **Apply CI Best Practices** - - Research and implement at least 3 additional CI best practices - - Document which practices you applied and why they matter - -
-💡 CI Best Practices Guidance - -**Dependency Caching:** - -Caching speeds up workflows by reusing previously downloaded dependencies. - -**Key Concepts:** -- What should be cached? (pip packages, Docker layers, etc.) -- What's the cache key? (based on requirements.txt hash) -- When does cache become invalid? -- How much time does caching save? - -**Actions to Research:** -- `actions/cache` for general caching -- `actions/setup-python` has built-in cache support - -**Questions to Explore:** -- Where are Python packages stored that should be cached? -- How do you measure cache hit vs cache miss? -- What happens if requirements.txt changes? - -**Status Badges:** - -Show workflow status directly in your README. - -**Format Pattern:** -```markdown -![Workflow Name](https://github.com/username/repo/workflows/workflow-name/badge.svg) -``` - -Research how to: -- Get the correct badge URL for your workflow -- Make badges clickable (link to Actions tab) -- Display specific branch status - -**CI Best Practices to Consider:** - -Research and choose at least 3 to implement: - -1. **Fail Fast:** Stop workflow on first failure -2. **Matrix Builds:** Test multiple Python versions (3.12, 3.13) -3. **Job Dependencies:** Don't push Docker if tests fail -4. **Conditional Steps:** Only push on main branch -5. **Pull Request Checks:** Require passing CI before merge -6. **Workflow Concurrency:** Cancel outdated workflow runs -7. **Docker Layer Caching:** Cache Docker build layers -8. **Environment Variables:** Use env for repeated values -9. **Secrets Scanning:** Prevent committing secrets -10. 
**YAML Validation:** Lint your workflow files - -**Resources:** -- [GitHub Actions Best Practices](https://docs.github.com/en/actions/learn-github-actions/usage-limits-billing-and-administration#usage-limits) -- [Caching Dependencies](https://docs.github.com/en/actions/using-workflows/caching-dependencies-to-speed-up-workflows) -- [Security Hardening](https://docs.github.com/en/actions/security-guides/security-hardening-for-github-actions) - -
- -
-💡 Snyk Integration Guidance - -**What is Snyk?** - -Snyk is a security tool that scans your dependencies for known vulnerabilities. - -**Key Concepts:** -- Vulnerability databases (CVEs) -- Severity levels (low, medium, high, critical) -- Automated dependency updates -- Security advisories - -**Integration Options:** - -1. **Snyk GitHub Action:** - - Use `snyk/actions` from GitHub Marketplace - - Requires Snyk API token (free tier available) - - Can fail builds on vulnerabilities - -2. **Snyk CLI in Workflow:** - - Install Snyk CLI in workflow - - Run `snyk test` command - - More flexible but requires setup - -**Setup Steps:** -1. Create free Snyk account -2. Get API token from Snyk dashboard -3. Add token as GitHub Secret -4. Add Snyk step to workflow -5. Configure severity threshold (what level fails the build?) - -**Questions to Explore:** -- Should every vulnerability fail your build? -- What if vulnerabilities have no fix available? -- How do you handle false positives? -- When should you break the build vs just warn? - -**Resources:** -- [Snyk GitHub Actions](https://github.com/snyk/actions) -- [Snyk Python Example](https://github.com/snyk/actions/tree/master/python) -- [Snyk Documentation](https://docs.snyk.io/integrations/ci-cd-integrations/github-actions-integration) - -**Common Issues:** -- Dependencies not installed before Snyk runs -- API token not configured correctly -- Overly strict severity settings breaking builds -- Virtual environment confusion - -**What to Document:** -- Your severity threshold decision and reasoning -- Any vulnerabilities found and your response -- Whether you fail builds on vulnerabilities or just warn - -
- -**What to Document:** -- Status badge in README (visible proof it works) -- Caching implementation and speed improvement metrics -- CI best practices you applied with explanations -- Snyk integration results and vulnerability handling -- Terminal output showing improved workflow performance - ---- - -## Bonus Task — Multi-App CI with Path Filters + Test Coverage (2.5 pts) - -**Objective:** Set up CI for your compiled language app with intelligent path-based triggers AND add test coverage tracking. - -**Part 1: Multi-App CI (1.5 pts)** - -1. **Create Second CI Workflow** - - Create `.github/workflows/-ci.yml` for your Go/Rust/Java app - - Implement similar CI steps (lint, test, build Docker image) - - Use language-specific actions and best practices - - Apply versioning strategy (SemVer or CalVer) consistently - -2. **Implement Path-Based Triggers** - - Python workflow should only run when `app_python/` files change - - Compiled language workflow should only run when `app_/` files change - - Neither should run when only docs or other files change - -3. **Optimize for Multiple Apps** - - Ensure both workflows can run in parallel - - Consider using workflow templates (DRY principle) - - Document the benefits of path-based triggers - -**Part 2: Test Coverage Badge (1 pt)** - -4. **Add Coverage Tracking** - - Install coverage tool (`pytest-cov` for Python, coverage tool for your other language) - - Generate coverage reports in CI workflow - - Integrate with codecov.io or coveralls.io (free for public repos) - - Add coverage badge to README showing percentage - -5. **Coverage Goals** - - Document your current coverage percentage - - Identify what's not covered and why - - Set a coverage threshold in CI (e.g., fail if below 70%) - -
-💡 Path Filters & Multi-App CI - -**Why Path Filters?** - -In a monorepo with multiple apps, you don't want to run Python CI when only Go code changes. - -**Path Filter Syntax:** -```yaml -on: - push: - paths: - - 'app_python/**' - - '.github/workflows/python-ci.yml' -``` - -**Key Concepts:** -- Glob patterns for path matching -- When to include workflow file itself -- Exclude patterns (paths-ignore) -- How to test path filters - -**Questions to Explore:** -- Should changes to README.md trigger CI? -- Should changes to the root .gitignore trigger CI? -- What about changes to both apps in one commit? -- How do you test that path filters work correctly? - -**Multi-Language CI Patterns:** - -**For Go:** -- actions/setup-go -- golangci-lint for linting -- go test for testing -- Multi-stage Docker builds (from Lab 2 bonus) - -**For Rust:** -- actions-rs/toolchain -- cargo clippy for linting -- cargo test for testing -- cargo-audit for security - -**For Java:** -- actions/setup-java -- Maven or Gradle for build -- Checkstyle or SpotBugs for linting -- JUnit tests - -**Workflow Reusability:** - -Consider: -- Reusable workflows (call one workflow from another) -- Composite actions (bundle steps together) -- Workflow templates (DRY for similar workflows) - -**Resources:** -- [Path Filters](https://docs.github.com/en/actions/using-workflows/workflow-syntax-for-github-actions#onpushpull_requestpaths) -- [Reusable Workflows](https://docs.github.com/en/actions/using-workflows/reusing-workflows) -- [Starter Workflows](https://github.com/actions/starter-workflows/tree/main/ci) - -
- -
-💡 Test Coverage Tracking - -**What is Test Coverage?** - -Coverage measures what percentage of your code is executed by your tests. High coverage = more code is tested. - -**Why Coverage Matters:** -- Identifies untested code paths -- Prevents regressions (changes breaking untested code) -- Increases confidence in refactoring -- Industry standard quality metric - -**Coverage Tools by Language:** - -**Python (pytest-cov):** -```bash -# Install -pip install pytest-cov - -# Run with coverage -pytest --cov=app_python --cov-report=xml --cov-report=term - -# Generates coverage.xml for upload -``` - -**Go (built-in):** -```bash -go test -coverprofile=coverage.out ./... -go tool cover -html=coverage.out -``` - -**Rust (tarpaulin):** -```bash -cargo install cargo-tarpaulin -cargo tarpaulin --out Xml -``` - -**Java (JaCoCo with Maven/Gradle):** -```bash -mvn test jacoco:report -# or -gradle test jacocoTestReport -``` - -**Integration Services:** - -**Codecov (Recommended):** -- Free for public repos -- Beautiful visualizations -- PR comments with coverage diff -- Setup: Sign in with GitHub, add repo, upload coverage report - -**Coveralls:** -- Alternative to Codecov -- Similar features -- Different UI - -**Coverage in CI Workflow:** -```yaml -# Pattern for Python (research actual syntax) -- name: Run tests with coverage - run: pytest --cov=. --cov-report=xml - -- name: Upload to Codecov - uses: codecov/codecov-action@v4 - with: - file: ./coverage.xml - token: ${{ secrets.CODECOV_TOKEN }} -``` - -**Coverage Badge:** -```markdown -![Coverage](https://codecov.io/gh/username/repo/branch/main/graph/badge.svg) -``` - -**Setting Coverage Thresholds:** - -You can fail CI if coverage drops below a threshold: - -```yaml -# In pytest.ini or pyproject.toml -[tool:pytest] -addopts = --cov=. --cov-fail-under=70 -``` - -**Questions to Consider:** -- What's a reasonable coverage target? (70%? 80%? 90%?) -- Should you aim for 100% coverage? 
(Usually no - diminishing returns) -- What code is OK to leave untested? (Error handlers, config, main) -- How do you test hard-to-reach code paths? - -**Best Practices:** -- Don't chase 100% coverage blindly -- Focus on testing critical business logic -- Integration points should have high coverage -- Simple getters/setters can be skipped -- Measure coverage trends, not just absolute numbers - -**Resources:** -- [Codecov Documentation](https://docs.codecov.com/) -- [pytest-cov Documentation](https://pytest-cov.readthedocs.io/) -- [Go Coverage](https://go.dev/blog/cover) -- [Cargo Tarpaulin](https://github.com/xd009642/tarpaulin) -- [JaCoCo](https://www.jacoco.org/) - -
- -**What to Document:** -- Second workflow implementation with language-specific best practices -- Path filter configuration and testing proof -- Benefits analysis: Why path filters matter in monorepos -- Example showing workflows running independently -- Terminal output or Actions tab showing selective triggering -- **Coverage integration:** Screenshot/link to codecov/coveralls dashboard -- **Coverage analysis:** Current percentage, what's covered/not covered, your threshold - ---- - -## How to Submit - -1. **Create Branch:** - - Create a new branch called `lab03` - - Develop your CI workflows on this branch - -2. **Commit Work:** - - Add workflow files (`.github/workflows/`) - - Add test files (`app_python/tests/`) - - Add documentation (`app_python/docs/LAB03.md`) - - Commit with descriptive message following conventional commits - -3. **Verify CI Works:** - - Push to your fork and verify workflows run - - Check that all jobs pass - - Review workflow logs for any issues - -4. **Create Pull Requests:** - - **PR #1:** `your-fork:lab03` → `course-repo:master` - - **PR #2:** `your-fork:lab03` → `your-fork:master` - - CI should run automatically on your PRs - ---- - -## Acceptance Criteria - -### Main Tasks (10 points) - -**Unit Testing (3 pts):** -- [ ] Testing framework chosen with justification -- [ ] Tests exist in `app_python/tests/` directory -- [ ] All endpoints have test coverage -- [ ] Tests pass locally (terminal output provided) -- [ ] README updated with testing instructions - -**GitHub Actions CI (4 pts):** -- [ ] Workflow file exists at `.github/workflows/python-ci.yml` -- [ ] Workflow includes: dependency installation, linting, testing -- [ ] Workflow includes: Docker Hub login, build, and push -- [ ] Versioning strategy chosen (SemVer or CalVer) and implemented -- [ ] Docker images tagged with at least 2 tags (e.g., version + latest) -- [ ] Workflow triggers configured appropriately -- [ ] All workflow steps pass successfully -- [ ] Docker Hub shows 
versioned images -- [ ] Link to successful workflow run provided - -**CI Best Practices (3 pts):** -- [ ] Status badge added to README and working -- [ ] Dependency caching implemented with performance metrics -- [ ] Snyk security scanning integrated -- [ ] At least 3 CI best practices applied -- [ ] Documentation complete (see Documentation Requirements section) - -### Bonus Task (2.5 points) - -**Part 1: Multi-App CI (1.5 pts)** -- [ ] Second workflow created for compiled language app (`.github/workflows/-ci.yml`) -- [ ] Language-specific linting and testing implemented -- [ ] Versioning strategy applied to second app -- [ ] Path filters configured for both workflows -- [ ] Path filters tested and proven to work (workflows run selectively) -- [ ] Both workflows can run in parallel -- [ ] Documentation explains benefits and shows selective triggering - -**Part 2: Test Coverage (1 pt)** -- [ ] Coverage tool integrated (`pytest-cov` or equivalent) -- [ ] Coverage reports generated in CI workflow -- [ ] Codecov or Coveralls integration complete -- [ ] Coverage badge added to README -- [ ] Coverage threshold set in CI (optional but recommended) -- [ ] Documentation includes coverage analysis (percentage, what's covered/not) - ---- - -## Documentation Requirements - -Create `app_python/docs/LAB03.md` with these sections: - -### 1. Overview -- Testing framework used and why you chose it -- What endpoints/functionality your tests cover -- CI workflow trigger configuration (when does it run?) -- Versioning strategy chosen (SemVer or CalVer) and rationale - -### 2. Workflow Evidence -``` -Provide links/terminal output for: -- ✅ Successful workflow run (GitHub Actions link) -- ✅ Tests passing locally (terminal output) -- ✅ Docker image on Docker Hub (link to your image) -- ✅ Status badge working in README -``` - -### 3. 
Best Practices Implemented -Quick list with one-sentence explanations: -- **Practice 1:** Why it helps -- **Practice 2:** Why it helps -- **Practice 3:** Why it helps -- **Caching:** Time saved (before vs after) -- **Snyk:** Any vulnerabilities found? Your action taken - -### 4. Key Decisions -Answer these briefly (2-3 sentences each): -- **Versioning Strategy:** SemVer or CalVer? Why did you choose it for your app? -- **Docker Tags:** What tags does your CI create? (e.g., latest, version number, etc.) -- **Workflow Triggers:** Why did you choose those triggers? -- **Test Coverage:** What's tested vs not tested? - -### 5. Challenges (Optional) -- Any issues you encountered and how you fixed them -- Keep it brief - bullet points are fine - ---- - -## Rubric - -| Criteria | Points | Description | -|----------|--------|-------------| -| **Unit Testing** | 3 pts | Comprehensive tests, good coverage | -| **CI Workflow** | 4 pts | Complete, functional, automated | -| **Best Practices** | 3 pts | Optimized, secure, well-documented | -| **Bonus** | 2.5 pts | Multi-app CI with path filters | -| **Total** | 12.5 pts | 10 pts required + 2.5 pts bonus | - -**Grading:** -- **10/10:** All tasks complete, CI works flawlessly, clear documentation, meaningful tests -- **8-9/10:** CI works, good test coverage, best practices applied, solid documentation -- **6-7/10:** CI functional, basic tests, some best practices, minimal documentation -- **<6/10:** CI broken or missing steps, poor tests, incomplete work - -**Quick Checklist for Full Points:** -- ✅ Tests actually test your endpoints (not just imports) -- ✅ CI workflow runs and passes -- ✅ Docker image builds and pushes successfully -- ✅ At least 3 best practices applied (caching, Snyk, status badge, etc.) -- ✅ Documentation complete but concise (no essay needed!) -- ✅ Links/evidence provided (workflow runs, Docker Hub, etc.) - -**Documentation Should Take:** 15-30 minutes to write, 5 minutes to review - ---- - -## Resources - -
-📚 GitHub Actions Documentation - -- [GitHub Actions Quickstart](https://docs.github.com/en/actions/quickstart) -- [Workflow Syntax](https://docs.github.com/en/actions/using-workflows/workflow-syntax-for-github-actions) -- [Building and Testing Python](https://docs.github.com/en/actions/automating-builds-and-tests/building-and-testing-python) -- [Publishing Docker Images](https://docs.docker.com/ci-cd/github-actions/) -- [GitHub Actions Marketplace](https://github.com/marketplace?type=actions) - -
- -
-🧪 Testing Resources - -- [Pytest Documentation](https://docs.pytest.org/) -- [Flask Testing Guide](https://flask.palletsprojects.com/en/stable/testing/) -- [FastAPI Testing Guide](https://fastapi.tiangolo.com/tutorial/testing/) -- [Python Testing Best Practices](https://realpython.com/python-testing/) - -
- -
-🔒 Security & Quality - -- [Snyk GitHub Actions](https://github.com/snyk/actions) -- [Snyk Python Integration](https://docs.snyk.io/integrations/ci-cd-integrations/github-actions-integration) -- [GitHub Security Best Practices](https://docs.github.com/en/actions/security-guides/security-hardening-for-github-actions) -- [Dependency Scanning](https://docs.github.com/en/code-security/supply-chain-security) - -
- -
-⚡ Performance & Optimization - -- [Caching Dependencies](https://docs.github.com/en/actions/using-workflows/caching-dependencies-to-speed-up-workflows) -- [Docker Build Cache](https://docs.docker.com/build/cache/) -- [Workflow Optimization](https://docs.github.com/en/actions/learn-github-actions/usage-limits-billing-and-administration) - -
- -
-🛠️ CI/CD Tools - -- [act](https://github.com/nektos/act) - Run GitHub Actions locally -- [actionlint](https://github.com/rhysd/actionlint) - Lint workflow files -- [GitHub CLI](https://cli.github.com/) - Manage workflows from terminal - -
- ---- - -## Looking Ahead - -- **Lab 4-6:** CI will validate your Terraform and Ansible code -- **Lab 7-8:** CI will run integration tests with logging/metrics -- **Lab 9-10:** CI will validate Kubernetes manifests and Helm charts -- **Lab 13:** ArgoCD will deploy what CI builds (GitOps!) -- **All Future Labs:** This pipeline is your safety net for changes - ---- - -**Good luck!** 🚀 - -> **Remember:** CI isn't about having green checkmarks—it's about catching problems before they reach production. Focus on meaningful tests and understanding why each practice matters. Think like a DevOps engineer: automate everything, fail fast, and learn from failures. +# Lab 3 — Continuous Integration (CI/CD) + +![difficulty](https://img.shields.io/badge/difficulty-beginner-success) +![topic](https://img.shields.io/badge/topic-CI/CD-blue) +![points](https://img.shields.io/badge/points-10%2B2.5-orange) +![tech](https://img.shields.io/badge/tech-GitHub%20Actions-informational) + +> Automate your Python app testing and Docker builds with GitHub Actions CI/CD pipeline. + +## Overview + +Take your containerized app from Labs 1-2 and add automated testing and deployment. Learn how CI/CD catches bugs early, ensures code quality, and automates the Docker build/push workflow. + +**What You'll Learn:** +- Writing effective unit tests +- GitHub Actions workflow syntax +- CI/CD best practices (caching, matrix builds, security scanning) +- Automated Docker image publishing +- Continuous integration for multiple applications + +**Tech Stack:** GitHub Actions | pytest 8+ | Python 3.11+ | Snyk | Docker + +**Connection to Previous Labs:** +- **Lab 1:** Test the endpoints you created +- **Lab 2:** Automate the Docker build/push workflow +- **Lab 4+:** This CI pipeline will run for all future labs + +--- + +## Tasks + +### Task 1 — Unit Testing (3 pts) + +**Objective:** Write comprehensive unit tests for your Python application to ensure reliability. + +**Requirements:** + +1. 
**Choose a Testing Framework** + - Research Python testing frameworks (pytest, unittest, etc.) + - Select one and justify your choice + - Install it in your `requirements.txt` or create `requirements-dev.txt` + +2. **Write Unit Tests** + - Create `app_python/tests/` directory + - Write tests for **all** your endpoints: + - `GET /` - Verify JSON structure and required fields + - `GET /health` - Verify health check response + - Test both successful responses and error cases + - Aim for meaningful test coverage (not just basic smoke tests) + +3. **Run Tests Locally** + - Verify all tests pass locally before CI setup + - Document how to run tests in your README + +
+💡 Testing Framework Guidance + +**Popular Python Testing Frameworks:** + +**pytest (Recommended):** +- Pros: Simple syntax, powerful fixtures, excellent plugin ecosystem +- Cons: Additional dependency +- Use case: Most modern Python projects + +**unittest:** +- Pros: Built into Python (no extra dependencies) +- Cons: More verbose, less modern features +- Use case: Minimal dependency projects + +**Key Testing Concepts to Research:** +- Test fixtures and setup/teardown +- Mocking external dependencies +- Testing HTTP endpoints (test client usage) +- Test coverage measurement +- Assertions and expected vs actual results + +**What Should You Test?** +- Correct HTTP status codes (200, 404, 500) +- Response data structure (JSON fields present) +- Response data types (strings, integers, etc.) +- Edge cases (invalid requests, missing data) +- Error handling (what happens when things fail?) + +**Questions to Consider:** +- How do you test a Flask/FastAPI app without starting the server? +- Should you test that `hostname` returns your actual hostname, or just that the field exists? +- How do you simulate different client IPs or user agents in tests? + +**Resources:** +- [Pytest Documentation](https://docs.pytest.org/) +- [Flask Testing](https://flask.palletsprojects.com/en/stable/testing/) +- [FastAPI Testing](https://fastapi.tiangolo.com/tutorial/testing/) +- [Python unittest](https://docs.python.org/3/library/unittest.html) + +**Anti-Patterns to Avoid:** +- Testing framework functionality instead of your code +- Tests that always pass regardless of implementation +- Tests with no assertions +- Tests that depend on external services + +
+ +**What to Document:** +- Your testing framework choice and why +- Test structure explanation +- How to run tests locally +- Terminal output showing all tests passing + +--- + +### Task 2 — GitHub Actions CI Workflow (4 pts) + +**Objective:** Create a GitHub Actions workflow that automatically tests your code and builds Docker images with proper versioning. + +**Requirements:** + +1. **Create Workflow File** + - Create `.github/workflows/python-ci.yml` in your repository + - Name your workflow descriptively + +2. **Implement Essential CI Steps** + + Your workflow must include these logical stages: + + **a) Code Quality & Testing:** + - Install dependencies + - Run a linter (pylint, flake8, black, ruff, etc.) + - Run your unit tests + + **b) Docker Build & Push with Versioning:** + - Authenticate with Docker Hub + - Build your Docker image + - Tag with proper version strategy (see versioning section below) + - Push to Docker Hub with multiple tags + +3. **Versioning Strategy** + + Choose **one** versioning approach and implement it: + + **Option A: Semantic Versioning (SemVer)** + - Version format: `v1.2.3` (major.minor.patch) + - Use git tags for releases + - Tag images like: `username/app:1.2.3`, `username/app:1.2`, `username/app:latest` + - **When to use:** Traditional software releases with breaking changes + + **Option B: Calendar Versioning (CalVer)** + - Version format: `2024.01.15` or `2024.01` (year.month.day or year.month) + - Based on release date + - Tag images like: `username/app:2024.01`, `username/app:latest` + - **When to use:** Time-based releases, continuous deployment + + **Required:** + - Document which strategy you chose and why + - Implement it in your CI workflow + - Show at least 2 tags per image (e.g., version + latest) + +4. **Workflow Triggers** + - Configure when the workflow runs (push, pull request, etc.) + - Consider which branches should trigger builds + +5. 
**Testing the Workflow** + - Push your workflow file and verify it runs + - Fix any issues that arise + - Ensure all steps complete successfully + - Verify Docker Hub shows your version tags + +
+💡 GitHub Actions Concepts + +**Core Concepts to Research:** + +**Workflow Anatomy:** +- `name` - What is your workflow called? +- `on` - When does it run? (push, pull_request, schedule, etc.) +- `jobs` - What work needs to be done? +- `steps` - Individual commands within a job +- `runs-on` - What OS environment? (ubuntu-latest, etc.) + +**Key Questions:** +- Should you run CI on every push, or only on pull requests? +- What happens if tests fail? Should the workflow continue? +- How do you access secrets (like Docker Hub credentials) securely? +- Why might you want multiple jobs vs multiple steps in one job? + +**Python CI Steps Pattern:** +```yaml +# This is a pattern, not exact copy-paste code +# Research the actual syntax and actions needed + +- Set up Python environment +- Install dependencies +- Run linter +- Run tests +``` + +**Docker CI Steps Pattern:** +```yaml +# This is a pattern, not exact copy-paste code +# Research the actual actions and their parameters + +- Log in to Docker Hub +- Extract metadata for tags +- Build and push Docker image +``` + +**Important Concepts:** +- **Actions Marketplace:** Reusable actions (actions/checkout@v4, actions/setup-python@v5, docker/build-push-action@v6) +- **Secrets:** How to store Docker Hub credentials securely +- **Job Dependencies:** Can one job depend on another succeeding? 
+- **Matrix Builds:** Testing multiple Python versions (optional but good to know) +- **Caching:** Speed up workflows by caching dependencies (we'll add this in Task 3) + +**Resources:** +- [GitHub Actions Documentation](https://docs.github.com/en/actions) +- [Building and Testing Python](https://docs.github.com/en/actions/automating-builds-and-tests/building-and-testing-python) +- [Publishing Docker Images](https://docs.docker.com/ci-cd/github-actions/) +- [GitHub Actions Marketplace](https://github.com/marketplace?type=actions) +- [Workflow Syntax](https://docs.github.com/en/actions/using-workflows/workflow-syntax-for-github-actions) + +**Security Best Practices:** +- Never hardcode passwords or tokens in workflow files +- Use GitHub Secrets for sensitive data +- Understand when secrets are exposed to pull requests from forks +- Use `secrets.GITHUB_TOKEN` for GitHub API access (auto-provided) + +**Docker Hub Authentication:** +You'll need to create a Docker Hub access token and add it as a GitHub Secret. Research: +- How to create Docker Hub access tokens +- How to add secrets to your GitHub repository +- How to reference secrets in workflow files (hint: `${{ secrets.NAME }}`) + +
+ +
+💡 Versioning Strategy Guidance + +**Semantic Versioning (SemVer):** + +**Format:** MAJOR.MINOR.PATCH (e.g., 1.2.3) +- **MAJOR:** Breaking changes (incompatible API changes) +- **MINOR:** New features (backward-compatible) +- **PATCH:** Bug fixes (backward-compatible) + +**Implementation Approaches:** +1. **Manual Git Tags:** Create git tags (v1.0.0) and reference in workflow +2. **Automated from Commits:** Parse conventional commits to bump version +3. **GitHub Releases:** Trigger on release creation + +**Docker Tagging Example:** +- `username/app:1.2.3` (full version) +- `username/app:1.2` (minor version, rolling) +- `username/app:1` (major version, rolling) +- `username/app:latest` (latest stable) + +**Pros:** Clear when breaking changes occur, industry standard for libraries +**Cons:** Requires discipline to follow rules correctly + +--- + +**Calendar Versioning (CalVer):** + +**Common Formats:** +- `YYYY.MM.DD` (e.g., 2024.01.15) - Daily releases +- `YYYY.MM.MICRO` (e.g., 2024.01.0) - Monthly with patch number +- `YYYY.0M` (e.g., 2024.01) - Monthly releases + +**Implementation Approaches:** +1. **Date-based:** Generate from current date in workflow +2. **Git SHA:** Combine with short commit SHA (2024.01-a1b2c3d) +3. 
**Build Number:** Use GitHub run number (2024.01.42) + +**Docker Tagging Example:** +- `username/app:2024.01` (month version) +- `username/app:2024.01.123` (with build number) +- `username/app:latest` (latest build) + +**Pros:** No ambiguity, good for continuous deployment, easier to remember +**Cons:** Doesn't indicate breaking changes + +--- + +**How to Implement in CI:** + +**Using docker/metadata-action:** +```yaml +# Pattern - research actual syntax +- name: Docker metadata + uses: docker/metadata-action + with: + # Define your tagging strategy here + # Can reference git tags, dates, commit SHAs +``` + +**Manual Tagging:** +```yaml +# Pattern - research actual syntax +- name: Generate version + run: echo "VERSION=$(date +%Y.%m.%d)" >> $GITHUB_ENV + +- name: Build and push + # Use ${{ env.VERSION }} in tags +``` + +**Questions to Consider:** +- How often will you release? (Daily? Per feature? Monthly?) +- Do users need to know about breaking changes explicitly? +- Are you building a library (use SemVer) or a service (CalVer works)? +- How will you track what's in each version? + +**Resources:** +- [Semantic Versioning](https://semver.org/) +- [Calendar Versioning](https://calver.org/) +- [Docker Metadata Action](https://github.com/docker/metadata-action) +- [Conventional Commits](https://www.conventionalcommits.org/) (for automated SemVer) + +
+ +
+💡 Debugging GitHub Actions + +**Common Issues & How to Debug:** + +**Workflow Won't Trigger:** +- Check your `on:` configuration +- Verify you pushed to the correct branch +- Look at Actions tab for filtering options + +**Steps Failing:** +- Click into the failed step to see full logs +- Check for typos in action names or parameters +- Verify secrets are configured correctly +- Test commands locally first + +**Docker Build Fails:** +- Ensure Dockerfile is in the correct location +- Check context path in build step +- Verify base image exists and is accessible +- Test Docker build locally first + +**Authentication Issues:** +- Verify secret names match exactly (case-sensitive) +- Check that Docker Hub token has write permissions +- Ensure you're using `docker/login-action` correctly + +**Debugging Techniques:** +- Add `run: echo "Debug message"` steps to understand workflow state +- Use `run: env` to see available environment variables +- Check Actions tab for detailed logs +- Enable debug logging (add `ACTIONS_RUNNER_DEBUG` secret = true) + +
+ +**What to Document:** +- Your workflow trigger strategy and reasoning +- Why you chose specific actions from the marketplace +- Your Docker tagging strategy (latest? version tags? commit SHA?) +- Link to successful workflow run in GitHub Actions tab +- Terminal output or screenshot of green checkmark + +--- + +### Task 3 — CI Best Practices & Security (3 pts) + +**Objective:** Optimize your CI workflow and add security scanning. + +**Requirements:** + +1. **Add Status Badge** + - Add a GitHub Actions status badge to your `app_python/README.md` + - The badge should show the current workflow status (passing/failing) + +2. **Implement Dependency Caching** + - Add caching for Python dependencies to speed up workflow + - Measure and document the speed improvement + +3. **Add Security Scanning with Snyk** + - Integrate Snyk vulnerability scanning into your workflow + - Configure it to check for vulnerabilities in your dependencies + - Document any vulnerabilities found and how you addressed them + +4. **Apply CI Best Practices** + - Research and implement at least 3 additional CI best practices + - Document which practices you applied and why they matter + +
+💡 CI Best Practices Guidance + +**Dependency Caching:** + +Caching speeds up workflows by reusing previously downloaded dependencies. + +**Key Concepts:** +- What should be cached? (pip packages, Docker layers, etc.) +- What's the cache key? (based on requirements.txt hash) +- When does cache become invalid? +- How much time does caching save? + +**Actions to Research:** +- `actions/cache` for general caching +- `actions/setup-python` has built-in cache support + +**Questions to Explore:** +- Where are Python packages stored that should be cached? +- How do you measure cache hit vs cache miss? +- What happens if requirements.txt changes? + +**Status Badges:** + +Show workflow status directly in your README. + +**Format Pattern:** +```markdown +![Workflow Name](https://github.com/username/repo/workflows/workflow-name/badge.svg) +``` + +Research how to: +- Get the correct badge URL for your workflow +- Make badges clickable (link to Actions tab) +- Display specific branch status + +**CI Best Practices to Consider:** + +Research and choose at least 3 to implement: + +1. **Fail Fast:** Stop workflow on first failure +2. **Matrix Builds:** Test multiple Python versions (3.12, 3.13) +3. **Job Dependencies:** Don't push Docker if tests fail +4. **Conditional Steps:** Only push on main branch +5. **Pull Request Checks:** Require passing CI before merge +6. **Workflow Concurrency:** Cancel outdated workflow runs +7. **Docker Layer Caching:** Cache Docker build layers +8. **Environment Variables:** Use env for repeated values +9. **Secrets Scanning:** Prevent committing secrets +10. 
**YAML Validation:** Lint your workflow files + +**Resources:** +- [GitHub Actions Best Practices](https://docs.github.com/en/actions/learn-github-actions/usage-limits-billing-and-administration#usage-limits) +- [Caching Dependencies](https://docs.github.com/en/actions/using-workflows/caching-dependencies-to-speed-up-workflows) +- [Security Hardening](https://docs.github.com/en/actions/security-guides/security-hardening-for-github-actions) + +
+ +
+💡 Snyk Integration Guidance + +**What is Snyk?** + +Snyk is a security tool that scans your dependencies for known vulnerabilities. + +**Key Concepts:** +- Vulnerability databases (CVEs) +- Severity levels (low, medium, high, critical) +- Automated dependency updates +- Security advisories + +**Integration Options:** + +1. **Snyk GitHub Action:** + - Use `snyk/actions` from GitHub Marketplace + - Requires Snyk API token (free tier available) + - Can fail builds on vulnerabilities + +2. **Snyk CLI in Workflow:** + - Install Snyk CLI in workflow + - Run `snyk test` command + - More flexible but requires setup + +**Setup Steps:** +1. Create free Snyk account +2. Get API token from Snyk dashboard +3. Add token as GitHub Secret +4. Add Snyk step to workflow +5. Configure severity threshold (what level fails the build?) + +**Questions to Explore:** +- Should every vulnerability fail your build? +- What if vulnerabilities have no fix available? +- How do you handle false positives? +- When should you break the build vs just warn? + +**Resources:** +- [Snyk GitHub Actions](https://github.com/snyk/actions) +- [Snyk Python Example](https://github.com/snyk/actions/tree/master/python) +- [Snyk Documentation](https://docs.snyk.io/integrations/ci-cd-integrations/github-actions-integration) + +**Common Issues:** +- Dependencies not installed before Snyk runs +- API token not configured correctly +- Overly strict severity settings breaking builds +- Virtual environment confusion + +**What to Document:** +- Your severity threshold decision and reasoning +- Any vulnerabilities found and your response +- Whether you fail builds on vulnerabilities or just warn + +
+ +**What to Document:** +- Status badge in README (visible proof it works) +- Caching implementation and speed improvement metrics +- CI best practices you applied with explanations +- Snyk integration results and vulnerability handling +- Terminal output showing improved workflow performance + +--- + +## Bonus Task — Multi-App CI with Path Filters + Test Coverage (2.5 pts) + +**Objective:** Set up CI for your compiled language app with intelligent path-based triggers AND add test coverage tracking. + +**Part 1: Multi-App CI (1.5 pts)** + +1. **Create Second CI Workflow** + - Create `.github/workflows/<lang>-ci.yml` for your Go/Rust/Java app + - Implement similar CI steps (lint, test, build Docker image) + - Use language-specific actions and best practices + - Apply versioning strategy (SemVer or CalVer) consistently + +2. **Implement Path-Based Triggers** + - Python workflow should only run when `app_python/` files change + - Compiled language workflow should only run when `app_<lang>/` files change + - Neither should run when only docs or other files change + +3. **Optimize for Multiple Apps** + - Ensure both workflows can run in parallel + - Consider using workflow templates (DRY principle) + - Document the benefits of path-based triggers + +**Part 2: Test Coverage Badge (1 pt)** + +4. **Add Coverage Tracking** + - Install coverage tool (`pytest-cov` for Python, coverage tool for your other language) + - Generate coverage reports in CI workflow + - Integrate with codecov.io or coveralls.io (free for public repos) + - Add coverage badge to README showing percentage + +5. **Coverage Goals** + - Document your current coverage percentage + - Identify what's not covered and why + - Set a coverage threshold in CI (e.g., fail if below 70%) + +
+💡 Path Filters & Multi-App CI + +**Why Path Filters?** + +In a monorepo with multiple apps, you don't want to run Python CI when only Go code changes. + +**Path Filter Syntax:** +```yaml +on: + push: + paths: + - 'app_python/**' + - '.github/workflows/python-ci.yml' +``` + +**Key Concepts:** +- Glob patterns for path matching +- When to include workflow file itself +- Exclude patterns (paths-ignore) +- How to test path filters + +**Questions to Explore:** +- Should changes to README.md trigger CI? +- Should changes to the root .gitignore trigger CI? +- What about changes to both apps in one commit? +- How do you test that path filters work correctly? + +**Multi-Language CI Patterns:** + +**For Go:** +- actions/setup-go +- golangci-lint for linting +- go test for testing +- Multi-stage Docker builds (from Lab 2 bonus) + +**For Rust:** +- actions-rs/toolchain +- cargo clippy for linting +- cargo test for testing +- cargo-audit for security + +**For Java:** +- actions/setup-java +- Maven or Gradle for build +- Checkstyle or SpotBugs for linting +- JUnit tests + +**Workflow Reusability:** + +Consider: +- Reusable workflows (call one workflow from another) +- Composite actions (bundle steps together) +- Workflow templates (DRY for similar workflows) + +**Resources:** +- [Path Filters](https://docs.github.com/en/actions/using-workflows/workflow-syntax-for-github-actions#onpushpull_requestpaths) +- [Reusable Workflows](https://docs.github.com/en/actions/using-workflows/reusing-workflows) +- [Starter Workflows](https://github.com/actions/starter-workflows/tree/main/ci) + +
+ +
+💡 Test Coverage Tracking + +**What is Test Coverage?** + +Coverage measures what percentage of your code is executed by your tests. High coverage = more code is tested. + +**Why Coverage Matters:** +- Identifies untested code paths +- Prevents regressions (changes breaking untested code) +- Increases confidence in refactoring +- Industry standard quality metric + +**Coverage Tools by Language:** + +**Python (pytest-cov):** +```bash +# Install +pip install pytest-cov + +# Run with coverage +pytest --cov=app_python --cov-report=xml --cov-report=term + +# Generates coverage.xml for upload +``` + +**Go (built-in):** +```bash +go test -coverprofile=coverage.out ./... +go tool cover -html=coverage.out +``` + +**Rust (tarpaulin):** +```bash +cargo install cargo-tarpaulin +cargo tarpaulin --out Xml +``` + +**Java (JaCoCo with Maven/Gradle):** +```bash +mvn test jacoco:report +# or +gradle test jacocoTestReport +``` + +**Integration Services:** + +**Codecov (Recommended):** +- Free for public repos +- Beautiful visualizations +- PR comments with coverage diff +- Setup: Sign in with GitHub, add repo, upload coverage report + +**Coveralls:** +- Alternative to Codecov +- Similar features +- Different UI + +**Coverage in CI Workflow:** +```yaml +# Pattern for Python (research actual syntax) +- name: Run tests with coverage + run: pytest --cov=. --cov-report=xml + +- name: Upload to Codecov + uses: codecov/codecov-action@v4 + with: + file: ./coverage.xml + token: ${{ secrets.CODECOV_TOKEN }} +``` + +**Coverage Badge:** +```markdown +![Coverage](https://codecov.io/gh/username/repo/branch/main/graph/badge.svg) +``` + +**Setting Coverage Thresholds:** + +You can fail CI if coverage drops below a threshold: + +```yaml +# In pytest.ini or pyproject.toml +[tool:pytest] +addopts = --cov=. --cov-fail-under=70 +``` + +**Questions to Consider:** +- What's a reasonable coverage target? (70%? 80%? 90%?) +- Should you aim for 100% coverage? 
(Usually no - diminishing returns) +- What code is OK to leave untested? (Error handlers, config, main) +- How do you test hard-to-reach code paths? + +**Best Practices:** +- Don't chase 100% coverage blindly +- Focus on testing critical business logic +- Integration points should have high coverage +- Simple getters/setters can be skipped +- Measure coverage trends, not just absolute numbers + +**Resources:** +- [Codecov Documentation](https://docs.codecov.com/) +- [pytest-cov Documentation](https://pytest-cov.readthedocs.io/) +- [Go Coverage](https://go.dev/blog/cover) +- [Cargo Tarpaulin](https://github.com/xd009642/tarpaulin) +- [JaCoCo](https://www.jacoco.org/) + +
+ +**What to Document:** +- Second workflow implementation with language-specific best practices +- Path filter configuration and testing proof +- Benefits analysis: Why path filters matter in monorepos +- Example showing workflows running independently +- Terminal output or Actions tab showing selective triggering +- **Coverage integration:** Screenshot/link to codecov/coveralls dashboard +- **Coverage analysis:** Current percentage, what's covered/not covered, your threshold + +--- + +## How to Submit + +1. **Create Branch:** + - Create a new branch called `lab03` + - Develop your CI workflows on this branch + +2. **Commit Work:** + - Add workflow files (`.github/workflows/`) + - Add test files (`app_python/tests/`) + - Add documentation (`app_python/docs/LAB03.md`) + - Commit with descriptive message following conventional commits + +3. **Verify CI Works:** + - Push to your fork and verify workflows run + - Check that all jobs pass + - Review workflow logs for any issues + +4. **Create Pull Requests:** + - **PR #1:** `your-fork:lab03` → `course-repo:master` + - **PR #2:** `your-fork:lab03` → `your-fork:master` + - CI should run automatically on your PRs + +--- + +## Acceptance Criteria + +### Main Tasks (10 points) + +**Unit Testing (3 pts):** +- [ ] Testing framework chosen with justification +- [ ] Tests exist in `app_python/tests/` directory +- [ ] All endpoints have test coverage +- [ ] Tests pass locally (terminal output provided) +- [ ] README updated with testing instructions + +**GitHub Actions CI (4 pts):** +- [ ] Workflow file exists at `.github/workflows/python-ci.yml` +- [ ] Workflow includes: dependency installation, linting, testing +- [ ] Workflow includes: Docker Hub login, build, and push +- [ ] Versioning strategy chosen (SemVer or CalVer) and implemented +- [ ] Docker images tagged with at least 2 tags (e.g., version + latest) +- [ ] Workflow triggers configured appropriately +- [ ] All workflow steps pass successfully +- [ ] Docker Hub shows 
versioned images
- [ ] Link to successful workflow run provided

**CI Best Practices (3 pts):**
- [ ] Status badge added to README and working
- [ ] Dependency caching implemented with performance metrics
- [ ] Snyk security scanning integrated
- [ ] At least 3 CI best practices applied
- [ ] Documentation complete (see Documentation Requirements section)

### Bonus Task (2.5 points)

**Part 1: Multi-App CI (1.5 pts)**
- [ ] Second workflow created for compiled language app (`.github/workflows/<language>-ci.yml`)
- [ ] Language-specific linting and testing implemented
- [ ] Versioning strategy applied to second app
- [ ] Path filters configured for both workflows
- [ ] Path filters tested and proven to work (workflows run selectively)
- [ ] Both workflows can run in parallel
- [ ] Documentation explains benefits and shows selective triggering

**Part 2: Test Coverage (1 pt)**
- [ ] Coverage tool integrated (`pytest-cov` or equivalent)
- [ ] Coverage reports generated in CI workflow
- [ ] Codecov or Coveralls integration complete
- [ ] Coverage badge added to README
- [ ] Coverage threshold set in CI (optional but recommended)
- [ ] Documentation includes coverage analysis (percentage, what's covered/not)

---

## Documentation Requirements

Create `app_python/docs/LAB03.md` with these sections:

### 1. Overview
- Testing framework used and why you chose it
- What endpoints/functionality your tests cover
- CI workflow trigger configuration (when does it run?)
- Versioning strategy chosen (SemVer or CalVer) and rationale

### 2. Workflow Evidence
```
Provide links/terminal output for:
- ✅ Successful workflow run (GitHub Actions link)
- ✅ Tests passing locally (terminal output)
- ✅ Docker image on Docker Hub (link to your image)
- ✅ Status badge working in README
```

### 3. 
Best Practices Implemented +Quick list with one-sentence explanations: +- **Practice 1:** Why it helps +- **Practice 2:** Why it helps +- **Practice 3:** Why it helps +- **Caching:** Time saved (before vs after) +- **Snyk:** Any vulnerabilities found? Your action taken + +### 4. Key Decisions +Answer these briefly (2-3 sentences each): +- **Versioning Strategy:** SemVer or CalVer? Why did you choose it for your app? +- **Docker Tags:** What tags does your CI create? (e.g., latest, version number, etc.) +- **Workflow Triggers:** Why did you choose those triggers? +- **Test Coverage:** What's tested vs not tested? + +### 5. Challenges (Optional) +- Any issues you encountered and how you fixed them +- Keep it brief - bullet points are fine + +--- + +## Rubric + +| Criteria | Points | Description | +|----------|--------|-------------| +| **Unit Testing** | 3 pts | Comprehensive tests, good coverage | +| **CI Workflow** | 4 pts | Complete, functional, automated | +| **Best Practices** | 3 pts | Optimized, secure, well-documented | +| **Bonus** | 2.5 pts | Multi-app CI with path filters | +| **Total** | 12.5 pts | 10 pts required + 2.5 pts bonus | + +**Grading:** +- **10/10:** All tasks complete, CI works flawlessly, clear documentation, meaningful tests +- **8-9/10:** CI works, good test coverage, best practices applied, solid documentation +- **6-7/10:** CI functional, basic tests, some best practices, minimal documentation +- **<6/10:** CI broken or missing steps, poor tests, incomplete work + +**Quick Checklist for Full Points:** +- ✅ Tests actually test your endpoints (not just imports) +- ✅ CI workflow runs and passes +- ✅ Docker image builds and pushes successfully +- ✅ At least 3 best practices applied (caching, Snyk, status badge, etc.) +- ✅ Documentation complete but concise (no essay needed!) +- ✅ Links/evidence provided (workflow runs, Docker Hub, etc.) + +**Documentation Should Take:** 15-30 minutes to write, 5 minutes to review + +--- + +## Resources + +
+📚 GitHub Actions Documentation + +- [GitHub Actions Quickstart](https://docs.github.com/en/actions/quickstart) +- [Workflow Syntax](https://docs.github.com/en/actions/using-workflows/workflow-syntax-for-github-actions) +- [Building and Testing Python](https://docs.github.com/en/actions/automating-builds-and-tests/building-and-testing-python) +- [Publishing Docker Images](https://docs.docker.com/ci-cd/github-actions/) +- [GitHub Actions Marketplace](https://github.com/marketplace?type=actions) + +
+ +
+🧪 Testing Resources + +- [Pytest Documentation](https://docs.pytest.org/) +- [Flask Testing Guide](https://flask.palletsprojects.com/en/stable/testing/) +- [FastAPI Testing Guide](https://fastapi.tiangolo.com/tutorial/testing/) +- [Python Testing Best Practices](https://realpython.com/python-testing/) + +
+ +
+🔒 Security & Quality + +- [Snyk GitHub Actions](https://github.com/snyk/actions) +- [Snyk Python Integration](https://docs.snyk.io/integrations/ci-cd-integrations/github-actions-integration) +- [GitHub Security Best Practices](https://docs.github.com/en/actions/security-guides/security-hardening-for-github-actions) +- [Dependency Scanning](https://docs.github.com/en/code-security/supply-chain-security) + +
+ +
+⚡ Performance & Optimization + +- [Caching Dependencies](https://docs.github.com/en/actions/using-workflows/caching-dependencies-to-speed-up-workflows) +- [Docker Build Cache](https://docs.docker.com/build/cache/) +- [Workflow Optimization](https://docs.github.com/en/actions/learn-github-actions/usage-limits-billing-and-administration) + +
+ +
+🛠️ CI/CD Tools + +- [act](https://github.com/nektos/act) - Run GitHub Actions locally +- [actionlint](https://github.com/rhysd/actionlint) - Lint workflow files +- [GitHub CLI](https://cli.github.com/) - Manage workflows from terminal + +
+ +--- + +## Looking Ahead + +- **Lab 4-6:** CI will validate your Terraform and Ansible code +- **Lab 7-8:** CI will run integration tests with logging/metrics +- **Lab 9-10:** CI will validate Kubernetes manifests and Helm charts +- **Lab 13:** ArgoCD will deploy what CI builds (GitOps!) +- **All Future Labs:** This pipeline is your safety net for changes + +--- + +**Good luck!** 🚀 + +> **Remember:** CI isn't about having green checkmarks—it's about catching problems before they reach production. Focus on meaningful tests and understanding why each practice matters. Think like a DevOps engineer: automate everything, fail fast, and learn from failures. diff --git a/labs/lab04.md b/labs/lab04.md index eefa858953..a98794f6e1 100644 --- a/labs/lab04.md +++ b/labs/lab04.md @@ -1,1510 +1,1510 @@ -# Lab 4 — Infrastructure as Code (Terraform & Pulumi) - -![difficulty](https://img.shields.io/badge/difficulty-beginner-success) -![topic](https://img.shields.io/badge/topic-Infrastructure%20as%20Code-blue) -![points](https://img.shields.io/badge/points-10%2B2.5-orange) -![tech](https://img.shields.io/badge/tech-Terraform%20%7C%20Pulumi-informational) - -> Provision cloud infrastructure using code with Terraform and Pulumi, comparing both approaches. - -## Overview - -Learn Infrastructure as Code (IaC) by creating virtual machines in the cloud using two popular tools: Terraform (declarative, HCL) and Pulumi (imperative, real programming languages). 
- -**What You'll Learn:** -- Terraform fundamentals and HCL syntax -- Pulumi fundamentals and infrastructure with code -- Cloud provider APIs and resources -- Infrastructure lifecycle management -- IaC best practices and validation -- Comparing IaC tools and approaches - -**Connection to Previous Labs:** -- **Lab 2:** Created Docker images - now we'll provision infrastructure to run them -- **Lab 3:** CI/CD for applications - now we'll add CI/CD for infrastructure -- **Lab 5:** Ansible will provision software on these VMs (you'll need a VM ready!) - -**Tech Stack:** Terraform 1.9+ | Pulumi 3.x | Yandex Cloud / AWS - -**Why Two Tools?** -By using both Terraform and Pulumi for the same task, you'll understand: -- Different IaC philosophies (declarative vs imperative) -- Tool trade-offs and use cases -- How to evaluate IaC tools for your needs - -**Important for Lab 5:** -The VM you create in this lab will be used in **Lab 5 (Ansible)** for configuration management. You have two options: -- **Option A (Recommended):** Keep your cloud VM running until you complete Lab 5 -- **Option B:** Use a local VM (see Local VM Alternative section below) - -If you choose to destroy your cloud VM after Lab 4, you can easily recreate it later using your Terraform/Pulumi code! 
- ---- - -## Important: Cloud Provider Selection - -### Recommended for Russia: Yandex Cloud - -Yandex Cloud offers free tier and is accessible in Russia: -- 1 VM with 20% vCPU, 1 GB RAM (free tier) -- 10 GB SSD storage -- No credit card required initially - -### Alternative Cloud Providers - -If Yandex Cloud is unavailable, choose any of these: - -**VK Cloud (Russia):** -- Russian cloud provider -- Free trial with bonus credits -- Good documentation in Russian - -**AWS (Amazon Web Services):** -- 750 hours/month free tier (t2.micro) -- Most popular globally -- Extensive documentation - -**GCP (Google Cloud Platform):** -- $300 free credits for 90 days -- Always-free tier for e2-micro -- Modern interface - -**Azure (Microsoft):** -- $200 free credits for 30 days -- Free tier for B1s instances -- Good Windows support - -**DigitalOcean:** -- Simple pricing and interface -- $200 free credits with GitHub Student Pack -- Beginner-friendly - -### Cost Management 🚨 - -**IMPORTANT - Read This:** -- ✅ **Use smallest/free tier instances only** -- ✅ **Run `terraform destroy` when done testing** -- ✅ **Consider keeping VM for Lab 5 to avoid recreation** -- ✅ **Set billing alerts if available** -- ✅ **If not using for Lab 5, delete resources after lab completion** -- ❌ **Never commit cloud credentials to Git** - ---- - -## Local VM Alternative - -If you cannot or prefer not to use cloud providers, you can use a local VM instead. This VM will need to meet specific requirements for Lab 5 (Ansible). 
- -### Option 1: VirtualBox/VMware VM - -**Requirements:** -- Ubuntu 24.04 LTS (recommended) or Ubuntu 22.04 LTS -- 1 GB RAM minimum (2 GB recommended) -- 10 GB disk space -- Network adapter in Bridged mode (or NAT with port forwarding) -- SSH server installed and configured -- Your SSH public key added to `~/.ssh/authorized_keys` -- Static or predictable IP address - -**Setup Steps:** -```bash -# Install SSH server (if not installed) -sudo apt update -sudo apt install openssh-server - -# Add your SSH public key -mkdir -p ~/.ssh -echo "your-public-key-here" >> ~/.ssh/authorized_keys -chmod 700 ~/.ssh -chmod 600 ~/.ssh/authorized_keys - -# Verify SSH access from your host machine -ssh username@vm-ip-address -``` - -### Option 2: Vagrant VM - -**Requirements:** -- Vagrant installed on your machine -- VirtualBox (or another Vagrant provider) - -**Basic Vagrantfile:** -```ruby -Vagrant.configure("2") do |config| - config.vm.box = "ubuntu/noble64" # Ubuntu 24.04 LTS - # Or use "ubuntu/jammy64" for Ubuntu 22.04 LTS - config.vm.network "private_network", ip: "192.168.56.10" - config.vm.provider "virtualbox" do |vb| - vb.memory = "2048" - end -end -``` - -### Option 3: WSL2 (Windows Subsystem for Linux) - -**Note:** WSL2 can work but has networking limitations. Bridged mode VM is preferred. - -**If using local VM:** -- You can skip Terraform/Pulumi cloud provider setup -- Document your local VM setup instead -- For Task 1, show VM creation (manual or Vagrant) -- For Task 2, you can skip Pulumi (or use Pulumi to manage Vagrant) -- Focus on understanding IaC concepts with cloud provider research - -**Recommended Approach:** -Even with a local VM, complete the Terraform/Pulumi tasks with a cloud provider to gain real IaC experience. You can destroy the cloud VM after Lab 4 and use your local VM for Lab 5. - ---- - -## Tasks - -### Task 1 — Terraform VM Creation (4 pts) - -**Objective:** Create a virtual machine using Terraform on your chosen cloud provider. 
- -**Requirements:** - -1. **Setup Terraform** - - Install Terraform CLI - - Choose and configure your cloud provider - - Set up authentication (access keys, service accounts, etc.) - - Initialize Terraform - -2. **Define Infrastructure** - - Create a `terraform/` directory with the following resources: - - **Minimum Required Resources:** - - **VM/Compute Instance** (smallest free tier size) - - **Network/VPC** (if required by provider) - - **Security Group/Firewall Rules:** - - Allow SSH (port 22) from your IP - - Allow HTTP (port 80) - - Allow custom port 5000 (for future app deployment) - - **Public IP Address** (to access VM remotely) - -3. **Configuration Best Practices** - - Use variables for configurable values (region, instance type, etc.) - - Use outputs to display important information (public IP, etc.) - - Add appropriate tags/labels for resource identification - - Use `.gitignore` for sensitive files - -4. **Apply Infrastructure** - - Run `terraform plan` to preview changes - - Review the plan carefully - - Apply infrastructure - - Verify VM is accessible via SSH - - Document the public IP and connection method - -5. **State Management** - - Keep state file local (for now) - - Understand what the state file contains - - **Never commit `terraform.tfstate` to Git** - -
-💡 Terraform Fundamentals - -**What is Terraform?** - -Terraform is a declarative IaC tool that lets you define infrastructure in configuration files (HCL - HashiCorp Configuration Language). - -**Key Concepts:** - -**Providers:** -- Plugins that interact with cloud APIs -- Each cloud has its own provider (yandex, aws, google, azurerm) -- Configure authentication and region - -**Resources:** -- Infrastructure components (VMs, networks, firewalls) -- Format: `resource "type" "name" { ... }` -- Each resource has required and optional arguments - -**Data Sources:** -- Query existing infrastructure -- Example: Find latest Ubuntu image ID -- Format: `data "type" "name" { ... }` - -**Variables:** -- Make configurations reusable -- Define in `variables.tf` -- Set values in `terraform.tfvars` (gitignored!) -- Reference: `var.variable_name` - -**Outputs:** -- Display important values after apply -- Example: VM public IP -- Define in `outputs.tf` - -**State File:** -- Tracks real infrastructure -- Maps config to reality -- **Never commit to Git** (contains sensitive data) -- Add to `.gitignore` - -**Typical Workflow:** -```bash -terraform init # Initialize provider plugins -terraform fmt # Format code -terraform validate # Check syntax -terraform plan # Preview changes -terraform apply # Create/update infrastructure -terraform destroy # Delete all infrastructure -``` - -**Resources:** -- [Terraform Documentation](https://developer.hashicorp.com/terraform/docs) -- [Terraform Registry](https://registry.terraform.io/) - Provider docs -- [HCL Syntax](https://developer.hashicorp.com/terraform/language/syntax) - -
- -
-☁️ Yandex Cloud Terraform Guide - -**Yandex Cloud Setup:** - -**Authentication:** -- Create service account in Yandex Cloud Console -- Generate authorized key (JSON) -- Set key file path or use environment variables - -**Provider Configuration Pattern:** -```hcl -terraform { - required_providers { - yandex = { - source = "yandex-cloud/yandex" - } - } -} - -provider "yandex" { - # Configuration here (zone, folder_id, etc.) -} -``` - -**Key Resources:** -- `yandex_compute_instance` - Virtual machine -- `yandex_vpc_network` - Virtual private cloud -- `yandex_vpc_subnet` - Subnet within VPC -- `yandex_vpc_security_group` - Firewall rules - -**Free Tier Instance:** -- Platform: standard-v2 -- Cores: 2 (core_fraction = 20%) -- Memory: 1 GB -- Boot disk: 10 GB HDD - -**SSH Access:** -- Add SSH public key to `metadata` -- Use `ssh-keys` metadata field -- Connect: `ssh @` - -**Resources:** -- [Yandex Cloud Terraform Provider](https://registry.terraform.io/providers/yandex-cloud/yandex/latest/docs) -- [Getting Started Guide](https://cloud.yandex.com/en/docs/tutorials/infrastructure-management/terraform-quickstart) -- [Compute Instance Example](https://registry.terraform.io/providers/yandex-cloud/yandex/latest/docs/resources/compute_instance) - -
- -
-☁️ AWS Terraform Guide - -**AWS Setup:** - -**Authentication:** -- Create IAM user with EC2 permissions -- Generate access key ID and secret access key -- Configure AWS CLI or use environment variables -- Never hardcode credentials - -**Provider Configuration Pattern:** -```hcl -terraform { - required_providers { - aws = { - source = "hashicorp/aws" - } - } -} - -provider "aws" { - region = var.region # e.g., "us-east-1" -} -``` - -**Key Resources:** -- `aws_instance` - EC2 instance -- `aws_vpc` - Virtual Private Cloud -- `aws_subnet` - Subnet within VPC -- `aws_security_group` - Firewall rules -- `aws_key_pair` - SSH key - -**Free Tier Instance:** -- Instance type: t2.micro -- AMI: Amazon Linux 2 or Ubuntu (find with data source) -- 750 hours/month free for 12 months -- 30 GB storage included - -**Data Source for AMI:** -Use `aws_ami` data source to find latest Ubuntu image dynamically - -**Resources:** -- [AWS Provider Documentation](https://registry.terraform.io/providers/hashicorp/aws/latest/docs) -- [EC2 Instance Resource](https://registry.terraform.io/providers/hashicorp/aws/latest/docs/resources/instance) -- [AWS Free Tier](https://aws.amazon.com/free/) - -
- -
-☁️ GCP Terraform Guide - -**GCP Setup:** - -**Authentication:** -- Create service account in Google Cloud Console -- Download JSON key file -- Set `GOOGLE_APPLICATION_CREDENTIALS` environment variable -- Enable Compute Engine API - -**Provider Configuration Pattern:** -```hcl -terraform { - required_providers { - google = { - source = "hashicorp/google" - } - } -} - -provider "google" { - project = var.project_id - region = var.region -} -``` - -**Key Resources:** -- `google_compute_instance` - VM instance -- `google_compute_network` - VPC network -- `google_compute_subnetwork` - Subnet -- `google_compute_firewall` - Firewall rules - -**Free Tier Instance:** -- Machine type: e2-micro -- Zone: us-central1-a (or other free tier zone) -- Always free (within limits) -- Boot disk: 30 GB standard persistent disk - -**Resources:** -- [Google Provider Documentation](https://registry.terraform.io/providers/hashicorp/google/latest/docs) -- [Compute Instance Resource](https://registry.terraform.io/providers/hashicorp/google/latest/docs/resources/compute_instance) -- [GCP Free Tier](https://cloud.google.com/free) - -
- -
-☁️ Other Cloud Providers - -**Azure:** -- Provider: `azurerm` -- Resource: `azurerm_linux_virtual_machine` -- Free tier: B1s instance -- [Azure Provider Docs](https://registry.terraform.io/providers/hashicorp/azurerm/latest/docs) - -**VK Cloud:** -- Based on OpenStack -- Provider: OpenStack provider -- [VK Cloud Documentation](https://mcs.mail.ru/help/) - -**DigitalOcean:** -- Provider: `digitalocean` -- Resource: `digitalocean_droplet` -- Simple and beginner-friendly -- [DigitalOcean Provider Docs](https://registry.terraform.io/providers/digitalocean/digitalocean/latest/docs) - -**Questions to Explore:** -- What's the smallest instance size for your provider? -- How do you find the right OS image ID? -- What authentication method does your provider use? -- How do you add SSH keys to instances? - -
- -
-🔒 Security Best Practices - -**Credentials Management:** - -**❌ NEVER DO THIS:** -```hcl -provider "aws" { - access_key = "AKIAIOSFODNN7EXAMPLE" # NEVER! - secret_key = "wJalrXUtnFEMI/K7MDENG/bPxRfiCYEXAMPLEKEY" # NEVER! -} -``` - -**✅ DO THIS INSTEAD:** - -**Option 1: Environment Variables** -```bash -export AWS_ACCESS_KEY_ID="your-key" -export AWS_SECRET_ACCESS_KEY="your-secret" -# Provider will auto-detect -``` - -**Option 2: Credentials File** -```bash -# ~/.aws/credentials (for AWS) -[default] -aws_access_key_id = your-key -aws_secret_access_key = your-secret -``` - -**Option 3: terraform.tfvars (gitignored)** -```hcl -# terraform.tfvars (add to .gitignore!) -access_key = "your-key" -secret_key = "your-secret" -``` - -**Files to Add to .gitignore:** -``` -# Terraform -*.tfstate -*.tfstate.* -.terraform/ -terraform.tfvars -*.tfvars -.terraform.lock.hcl - -# Cloud credentials -*.pem -*.key -*.json # Service account keys -credentials -``` - -**SSH Key Management:** -- Generate SSH key pair locally -- Add public key to cloud provider -- Keep private key secure (never commit) -- Use `chmod 600` on private key file - -**Security Group Rules:** -- Restrict SSH to your IP only (not 0.0.0.0/0) -- Only open ports you need -- Document why each port is open - -
- -
-📁 Terraform Project Structure - -**Recommended Structure:** - -``` -terraform/ -├── .gitignore # Ignore state, credentials -├── main.tf # Main resources -├── variables.tf # Input variables -├── outputs.tf # Output values -├── terraform.tfvars # Variable values (gitignored!) -└── README.md # Setup instructions -``` - -**What Goes in Each File:** - -**main.tf:** -- Provider configuration -- Resource definitions -- Data sources - -**variables.tf:** -- Variable declarations -- Descriptions -- Default values (non-sensitive only) - -**outputs.tf:** -- Important values to display -- VM IP addresses -- Connection strings - -**terraform.tfvars:** -- Actual variable values -- Secrets and credentials -- **MUST be in .gitignore** - -**Alternative: Single File** -For small projects, you can put everything in `main.tf`, but multi-file is more maintainable. - -
- -**What to Document:** -- Cloud provider chosen and why -- Terraform version used -- Resources created (VM size, region, etc.) -- Public IP address of created VM -- SSH connection command -- Terminal output from `terraform plan` and `terraform apply` -- Proof of SSH access to VM - ---- - -### Task 2 — Pulumi VM Creation (4 pts) - -**Objective:** Destroy the Terraform VM and recreate the same infrastructure using Pulumi. - -**Requirements:** - -1. **Cleanup Terraform Infrastructure** - - Run `terraform destroy` to delete all resources - - Verify all resources are deleted in cloud console - - Document the cleanup process - -2. **Setup Pulumi** - - Install Pulumi CLI - - Choose a programming language (Python recommended, or TypeScript, Go, C#, Java) - - Initialize a new Pulumi project - - Configure cloud provider - -3. **Recreate Same Infrastructure** - - Create a `pulumi/` directory with equivalent resources: - - **Same Resources as Task 1:** - - VM/Compute Instance (same size) - - Network/VPC - - Security Group/Firewall (same rules) - - Public IP Address - - **Goal:** Functionally identical infrastructure, different tool - -4. **Apply Infrastructure** - - Run `pulumi preview` to see planned changes - - Apply infrastructure with `pulumi up` - - Verify VM is accessible via SSH - - Document the public IP - -5. **Compare Experience** - - What was easier/harder than Terraform? - - How does the code differ? - - Which approach do you prefer and why? - -
-💡 Pulumi Fundamentals - -**What is Pulumi?** - -Pulumi is an imperative IaC tool that lets you write infrastructure using real programming languages (Python, TypeScript, Go, etc.). - -**Key Differences from Terraform:** - -| Aspect | Terraform | Pulumi | -|--------|-----------|--------| -| **Language** | HCL (declarative) | Python, JS, Go, etc. (imperative) | -| **State** | Local or remote state file | Pulumi Cloud (free tier) or self-hosted | -| **Logic** | Limited (count, for_each) | Full programming language | -| **Testing** | External tools | Native unit tests | -| **Secrets** | Plain in state | Encrypted by default | - -**Key Concepts:** - -**Resources:** -- Similar to Terraform, but defined in code -- Example (Python): `vm = compute.Instance("my-vm", ...)` - -**Stacks:** -- Like Terraform workspaces -- Separate environments (dev, staging, prod) -- Each has its own config and state - -**Outputs:** -- Return values from your program -- Example: `pulumi.export("ip", vm.public_ip)` - -**Config:** -- Per-stack configuration -- Set with: `pulumi config set key value` -- Access in code: `config.get("key")` - -**Typical Workflow:** -```bash -pulumi new