diff --git a/.github/workflows/python-ci.yml b/.github/workflows/python-ci.yml
new file mode 100644
index 0000000000..60cd483628
--- /dev/null
+++ b/.github/workflows/python-ci.yml
@@ -0,0 +1,106 @@
+name: Python CI & Docker Build
+
+on:
+  push:
+    branches: [ main, dev, lab3 ]
+    tags: [ 'v*' ]
+  pull_request:
+    branches: [ main ]
+
+# Least privilege: images are pushed to Docker Hub with repository secrets, not GITHUB_TOKEN.
+permissions:
+  contents: read
+
+jobs:
+  test:
+    name: Test & Lint
+    runs-on: ubuntu-latest
+    # One run per interpreter; versions stay quoted so "3.10" is not read as the float 3.1.
+    strategy:
+      matrix:
+        python-version: ["3.9", "3.10", "3.11"]
+
+    steps:
+    - name: Checkout code
+      uses: actions/checkout@v4
+    - name: Set up Python ${{ matrix.python-version }}
+      uses: actions/setup-python@v5
+      with:
+        python-version: ${{ matrix.python-version }}
+        # Restore pip's download cache between runs, keyed on the app requirements file.
+        cache: pip
+        cache-dependency-path: app_python/requirements.txt
+    - name: Install dependencies
+      run: |
+        python -m pip install --upgrade pip
+        pip install -r app_python/requirements.txt
+        pip install ruff pytest
+    # Ruff runs from the repository root, so it checks every Python file in the repo.
+    - name: Lint with Ruff
+      run: ruff check .
+    - name: Run tests
+      run: pytest app_python/tests/ --verbose -v
+    # Fails the job if any file would be rewritten by `ruff format`.
+    - name: Format check
+      run: ruff format --check .
+  
+  security:
+    name: Snyk Security Scan
+    runs-on: ubuntu-latest
+    if: github.event_name != 'pull_request'
+    defaults:
+      run:
+        working-directory: ./app_python  # applies to `run:` steps only, not to `uses:` steps
+    steps:
+    - uses: actions/checkout@v4
+    - name: Install dependencies
+      run: |
+        python -m pip install --upgrade pip
+        pip install -r requirements.txt
+    - name: Snyk CLI
+      uses: snyk/actions/python-3.11@master  # NOTE(review): mutable ref; consider pinning a release or SHA
+      env:
+        SNYK_TOKEN: ${{ secrets.SNYK_TOKEN }}
+      with:
+        args: --file=app_python/requirements.txt --severity-threshold=critical --skip-unresolved
+      continue-on-error: true  # advisory scan: findings are reported but never fail the job
+
+
+  docker:
+    name: Build & Push Docker
+    needs: [ test, security ] # Waits for both jobs; the Snyk step is continue-on-error, so scan findings do not block
+    runs-on: ubuntu-latest
+    if: github.event_name != 'pull_request'  # Dont push pr to docker hub
+
+    steps:
+    - name: Checkout code
+      uses: actions/checkout@v4
+    # Tags: latest + CalVer on the default branch, branch name on branch pushes, git tag on v* pushes.
+    - name: Docker meta
+      id: meta
+      uses: docker/metadata-action@v5
+      with:
+        images: ${{ secrets.DOCKER_USERNAME }}/testiks
+        tags: |
+          type=raw,value=latest,enable={{is_default_branch}}
+          type=raw,value={{date 'YYYY.MM'}},enable={{is_default_branch}}
+          type=ref,event=branch
+          type=ref,event=tag
+
+    - name: Set up Docker Buildx
+      uses: docker/setup-buildx-action@v3
+
+    - name: Login to Docker Hub
+      uses: docker/login-action@v3
+      with:
+        username: ${{ secrets.DOCKER_USERNAME }}
+        password: ${{ secrets.DOCKERHUB_TOKEN }}
+
+    - name: Build and push Docker image
+      uses: docker/build-push-action@v5
+      with:
+        context: ./app_python/
+        push: true
+        tags: ${{ steps.meta.outputs.tags }}
+        cache-from: type=gha
+        cache-to: type=gha,mode=max
diff --git a/.gitignore b/.gitignore
new file mode 100644
index 0000000000..205f63c513
--- /dev/null
+++ b/.gitignore
@@ -0,0 +1,8 @@
+test
+# Ignore dotfiles, but keep the repository's own dot-paths trackable.
+.*
+!.gitignore
+!.github/
+minikube*
+edge-api
+**/__pycache__/
\ No newline at end of file
diff --git a/README.md b/README.md
index 0b159ed716..371d51f456 100644
--- a/README.md
+++ b/README.md
@@ -1,81 +1,271 @@
-# DevOps Engineering Labs
+# DevOps Engineering: Core Practices
 
-## Introduction
+[![Labs](https://img.shields.io/badge/Labs-18-blue)](#labs)
+[![Exam](https://img.shields.io/badge/Exam-Optional-green)](#exam-alternative)
+[![Duration](https://img.shields.io/badge/Duration-18%20Weeks-lightgrey)](#course-roadmap)
 
-Welcome to the DevOps Engineering course labs! These hands-on labs are designed to guide you through various aspects of DevOps practices and principles. As you progress through the labs, you'll gain practical experience in application development, containerization, testing, infrastructure setup, CI/CD processes, and more.
+Master **production-grade DevOps practices** through hands-on labs. Build, containerize, deploy, monitor, and scale applications using industry-standard tools.
 
-## Lab Syllabus
+---
 
-Lab 1: Web Application Development
-Lab 2: Containerization
-Lab 3: Continuous Integration
-Lab 4: Infrastructure as Code & Terraform
-Lab 5: Configuration Management
-Lab 6: Ansible Automation
-Lab 7: Observability, Logging, Loki Stack
-Lab 8: Monitoring & Prometheus
-Lab 9: Kubernetes & Declarative Manifests
-Lab 10: Helm Charts & Library Charts
-Lab 11: Kubernetes Secrets Management (Vault, ConfigMaps)
-Lab 12: Kubernetes ConfigMaps & Environment Variables
-Lab 13: GitOps with ArgoCD
-Lab 14: StatefulSet Optimization
-Lab 15: Kubernetes Monitoring & Init Containers
-Lab 16: IPFS & Fleek Decentralization
+## Quick Start
 
-## Architecture
+1. **Fork** this repository
+2. **Clone** your fork locally
+3. **Start with Lab 1** and progress sequentially
+4. **Submit PRs** for each lab (details below)
 
-This repository has a master branch containing an introduction. Each new lab assignment will be added as a markdown file with a lab number.
+---
 
-## Rules
+## Course Roadmap
 
-To successfully complete the labs and pass the course, follow these rules:
+| Week | Lab | Topic | Key Technologies |
+|------|-----|-------|------------------|
+| 1 | 1 | Web Application Development | Python/Go, Best Practices |
+| 2 | 2 | Containerization | Docker, Multi-stage Builds |
+| 3 | 3 | Continuous Integration | GitHub Actions, Snyk |
+| 4 | 4 | Infrastructure as Code | Terraform, Cloud Providers |
+| 5 | 5 | Configuration Management | Ansible Basics |
+| 6 | 6 | Continuous Deployment | Ansible Advanced |
+| 7 | 7 | Logging | Promtail, Loki, Grafana |
+| 8 | 8 | Monitoring | Prometheus, Grafana |
+| 9 | 9 | Kubernetes Basics | Minikube, Deployments, Services |
+| 10 | 10 | Helm Charts | Templating, Hooks |
+| 11 | 11 | Secrets Management | K8s Secrets, HashiCorp Vault |
+| 12 | 12 | Configuration & Storage | ConfigMaps, PVCs |
+| 13 | 13 | GitOps | ArgoCD |
+| 14 | 14 | Progressive Delivery | Argo Rollouts |
+| 15 | 15 | StatefulSets | Persistent Storage, Headless Services |
+| 16 | 16 | Cluster Monitoring | Kube-Prometheus, Init Containers |
+| — | **Exam Alternative Labs** | | |
+| 17 | 17 | Edge Deployment | Fly.io, Global Distribution |
+| 18 | 18 | Decentralized Storage | 4EVERLAND, IPFS, Web3 |
 
-1. **Lab Dependency:** Complete the labs in order; each lab builds upon the previous one.
-2. **Submission and Grading:** Submit your solutions as pull requests (PRs) to the master branch of this repository. You need at least 6/10 points for each lab to pass.
-3. **Fork Repository:** Fork this repository to your workspace to create your own version for solving the labs.
-4. **Recommended Workflow:** Build your solutions incrementally. Complete lab N based on lab N-1.
-5. **PR Creation:** Create a PR from your fork to the master branch of this repository and from your fork's branch to your fork's master branch.
-6. **Wait for Grade:** Once your PR is created, wait for your lab to be reviewed and graded.
+---
 
-### Example for the first lab
+## Grading
 
-1. Fork this repository.
-2. Checkout to the lab1 branch.
-3. Complete the lab1 tasks.
-4. Push the code to your repository.
-5. Create a PR to the master branch of this repository from your fork's lab1 branch.
-6. Create a PR to the master branch of your repository from your lab1 branch.
-7. Wait for your grade.
+### Grade Composition
 
-## Grading and Grades Distribution
+| Component | Weight | Points |
+|-----------|--------|--------|
+| **Labs (16 required)** | 80% | 160 pts |
+| **Final Exam** | 20% | 40 pts |
+| **Bonus Tasks** | Extra | +40 pts max |
+| **Total** | 100% | 200 pts |
 
-Your final grade will be determined based on labs and a final exam:
+### Exam Alternative
 
-- Labs: 70% of your final grade.
-- Final Exam: 30% of your final grade.
+Don't want to take the exam? Complete **both** bonus labs:
 
-Grade ranges:
+| Lab | Topic | Points |
+|-----|-------|--------|
+| **Lab 17** | Fly.io Edge Deployment | 20 pts |
+| **Lab 18** | 4EVERLAND & IPFS | 20 pts |
 
-- [90-100] - A
-- [75-90) - B
-- [60-75) - C
-- [0-60) - D
+**Requirements:**
+- Complete both labs (17 + 18 = 40 pts, replaces exam)
+- Minimum 16/20 on each lab
+- Deadline: **1 week before exam date**
+- Can still take exam if you need more points for desired grade
 
-### Labs Grading
+<details>
+<summary>📊 Grade Scale</summary>
 
-Each lab is worth 10 points. Completing main tasks correctly earns you 10 points. Completing bonus tasks correctly adds 2.5 points. You can earn a maximum of 12.5 points per lab by completing all main and bonus tasks.
+| Grade | Points | Percentage |
+|-------|--------|------------|
+| **A** | 180-200+ | 90-100% |
+| **B** | 150-179 | 75-89% |
+| **C** | 120-149 | 60-74% |
+| **D** | 0-119 | 0-59% |
 
-Finishing all bonus tasks lets you skip the exam and grants you 5 extra points. Incomplete bonus tasks require you to take the exam, which could save you from failing it.
+**Minimum to Pass:** 120 points (60%)
 
->The labs account for 70% of your final grade. With 14 labs in total, each lab contributes 5% to your final grade. Completing all main tasks in a lab earns you the maximum 10 points, which corresponds to 5% of your final grade.
->If you successfully complete all bonus tasks, you'll earn an additional 2.5 points, totaling 12.5 points for that lab, or 6.25% of your final grade. Over the course of all 14 labs, the cumulative points from bonus tasks add up to 87.5% of your final grade.
->Additionally, a 5% bonus is granted for successfully finishing all bonus tasks, ensuring that if you successfully complete everything, your final grade will be 92.5%, which corresponds to an A grade.
+</details>
 
-## Deadlines and Labs Distribution
+<details>
+<summary>📈 Grade Examples</summary>
 
-Each week, two new labs will be available. You'll have one week to submit your solutions. Refer to Moodle for presentation slides and deadlines.
+**Scenario 1: Labs + Exam**
+```
+Labs: 16 × 9 = 144 pts
+Bonus: 5 labs × 2.5 = 12.5 pts
+Exam: 35/40 pts
+Total: 191.5 pts = 96% (A)
+```
 
-## Submission Policy
+**Scenario 2: Labs + Exam Alternative**
+```
+Labs: 16 × 9 = 144 pts
+Bonus: 8 labs × 2.5 = 20 pts
+Lab 17: 18 pts
+Lab 18: 17 pts
+Total: 199 pts = 99.5% (A)
+```
 
-Submitting your lab results on time is crucial for your grading. Late submissions receive a maximum score of 6 points for the corresponding lab. Remember, completing all labs is necessary to successfully pass the course.
+</details>
+
+---
+
+## Lab Structure
+
+Each lab is worth **10 points** (main tasks) + **2.5 points** (bonus).
+
+- **Minimum passing score:** 6/10 per lab
+- **Late submissions:** Max 6/10 (within 1 week)
+- **Very late (>1 week):** Not accepted
+
+<details>
+<summary>📋 Lab Categories</summary>
+
+**Foundation (Labs 1-2)**
+- Web app development
+- Docker containerization
+
+**CI/CD & Infrastructure (Labs 3-4)**
+- GitHub Actions
+- Terraform
+
+**Configuration Management (Labs 5-6)**
+- Ansible playbooks and roles
+
+**Observability (Labs 7-8)**
+- Loki logging stack
+- Prometheus monitoring
+
+**Kubernetes Core (Labs 9-12)**
+- K8s basics, Helm
+- Secrets, ConfigMaps
+
+**Advanced Kubernetes (Labs 13-16)**
+- ArgoCD, Argo Rollouts
+- StatefulSets, Monitoring
+
+**Exam Alternative (Labs 17-18)**
+- Fly.io, 4EVERLAND/IPFS
+
+</details>
+
+---
+
+## How to Submit
+
+```bash
+# 1. Create branch
+git checkout -b lab1
+
+# 2. Complete lab tasks
+
+# 3. Commit and push
+git add .
+git commit -m "Complete lab1"
+git push -u origin lab1
+
+# 4. Create TWO Pull Requests:
+#    PR #1: your-fork:lab1 → course-repo:master
+#    PR #2: your-fork:lab1 → your-fork:master
+```
+
+<details>
+<summary>📝 Submission Checklist</summary>
+
+- [ ] All main tasks completed
+- [ ] Documentation files created
+- [ ] Screenshots where required
+- [ ] Code tested and working
+- [ ] Markdown validated ([linter](https://dlaa.me/markdownlint/))
+- [ ] Both PRs created
+
+</details>
+
+---
+
+## Resources
+
+<details>
+<summary>🛠️ Required Tools</summary>
+
+| Tool | Purpose |
+|------|---------|
+| Git | Version control |
+| Docker | Containerization |
+| kubectl | Kubernetes CLI |
+| Helm | K8s package manager |
+| Minikube | Local K8s cluster |
+| Terraform | Infrastructure as Code |
+| Ansible | Configuration management |
+
+</details>
+
+<details>
+<summary>📚 Documentation Links</summary>
+
+**Core:**
+- [Docker](https://docs.docker.com/)
+- [Kubernetes](https://kubernetes.io/docs/)
+- [Helm](https://helm.sh/docs/)
+
+**CI/CD:**
+- [GitHub Actions](https://docs.github.com/en/actions)
+- [Terraform](https://www.terraform.io/docs)
+- [Ansible](https://docs.ansible.com/)
+
+**Observability:**
+- [Prometheus](https://prometheus.io/docs/)
+- [Grafana](https://grafana.com/docs/)
+
+**Advanced:**
+- [ArgoCD](https://argo-cd.readthedocs.io/)
+- [Argo Rollouts](https://argoproj.github.io/argo-rollouts/)
+- [HashiCorp Vault](https://developer.hashicorp.com/vault/docs)
+
+</details>
+
+<details>
+<summary>💡 Tips for Success</summary>
+
+1. **Start early** - Don't wait until deadline
+2. **Read instructions fully** before starting
+3. **Test everything** before submitting
+4. **Document as you go** - Don't leave it for the end
+5. **Ask questions early** - Don't wait until last minute
+6. **Use proper Git workflow** - Branches, commits, PRs
+
+</details>
+
+<details>
+<summary>🔧 Common Issues</summary>
+
+**Docker:**
+- Daemon not running → Start Docker Desktop
+- Permission denied → Add user to docker group
+
+**Minikube:**
+- Won't start → Try `--driver=docker`
+- Resource issues → Allocate more memory/CPU
+
+**Kubernetes:**
+- ImagePullBackOff → Check image name/registry
+- CrashLoopBackOff → Check logs: `kubectl logs <pod>`
+
+</details>
+
+---
+
+## Course Completion
+
+After completing all 16 core labs (+ optional Labs 17-18), you'll have:
+
+✅ Full-stack DevOps expertise
+✅ Production-ready portfolio with 16-18 projects
+✅ Container and Kubernetes mastery
+✅ CI/CD pipeline experience
+✅ Infrastructure as Code skills
+✅ Monitoring and observability knowledge
+✅ GitOps workflow experience
+
+---
+
+**Ready to begin? Start with [Lab 1](labs/lab01.md)!**
+
+Questions? Check the course Moodle page or ask during office hours.
diff --git a/ansible/ansible.cfg b/ansible/ansible.cfg
new file mode 100644
index 0000000000..f955730d83
--- /dev/null
+++ b/ansible/ansible.cfg
@@ -0,0 +1,11 @@
+[defaults]
+inventory = inventory/hosts.ini
+roles_path = roles
+host_key_checking = False
+remote_user = debil
+retry_files_enabled = False
+# NOTE(review): host_key_checking = False (above) skips SSH host-key verification - acceptable for a lab VM, confirm before wider use.
+[privilege_escalation]
+become = True
+become_method = sudo
+become_user = root
\ No newline at end of file
diff --git a/ansible/app_python/Dockerfile b/ansible/app_python/Dockerfile
new file mode 100644
index 0000000000..d82173a7d1
--- /dev/null
+++ b/ansible/app_python/Dockerfile
@@ -0,0 +1,22 @@
+FROM python:3.12-slim
+
+ENV PYTHONDONTWRITEBYTECODE=1 \
+    PYTHONUNBUFFERED=1
+
+# Non-root user
+RUN groupadd -r appuser && useradd -r -g appuser appuser
+
+# Install deps first
+WORKDIR /app
+COPY requirements.txt .
+RUN pip install --no-cache-dir -r requirements.txt
+
+# Copy the application last so code changes do not invalidate the dependency layer
+COPY app.py .
+RUN chown -R appuser:appuser /app
+USER appuser
+
+# app.py listens on PORT, which defaults to 5000
+EXPOSE 5000
+# Run app finally
+CMD ["python", "app.py"]
diff --git a/ansible/app_python/README.md b/ansible/app_python/README.md
new file mode 100644
index 0000000000..f122dfce25
--- /dev/null
+++ b/ansible/app_python/README.md
@@ -0,0 +1,55 @@
+# DevOps Info Service
+A lightweight demo Python web application that exposes system information via HTTP endpoints.
+
+### Prerequisites
+Python 3.10+
+Flask 3.1.0
+
+### Installation
+```bash
+python3 -m venv venv
+source venv/bin/activate
+pip install -r requirements.txt
+```
+
+### Running the Application
+```bash
+python3 app.py
+# Or with custom config
+PORT=8080 python3 app.py
+```
+
+### API Endpoints
+There are a few main endpoints:
+- `GET /` - Service and system information
+- `GET /health` - Health check.
+
+### Configuration
+
+| Variable | Value  | Purpose                                                 |
+| -------- | ------ | ------------------------------------------------------- |
+| `HOST`   | string | Address to bind the app to (default `0.0.0.0`)          |
+| `PORT`   | int    | Port the web application listens on (default `5000`)    |
+| `DEBUG`  | bool   | Enables debug mode when set to `true` (default `False`) |
+
+## Docker
+This application can be run in a containerized environment with Docker
+
+### Build the image locally
+To build the Docker image, use the Docker build command from the project directory, specifying the Dockerfile and an image name with a tag
+```bash
+cd app_python
+docker build -t <image-name> .
+```
+
+### Run a container
+To run the application, start a container from the built image and map the container port to a port on the host machine so the application can be accessed locally
+```bash
+docker run -p<any-port-on-your-machine>:5000 <created-image-name>
+```
+
+### Pull from Docker Hub
+The pre-built image is also available on Docker Hub and can be pulled using the standard Docker pull command with the repository name and desired tag
+```bash
+docker pull cacucoh/testiks:1.0
+```
\ No newline at end of file
diff --git a/ansible/app_python/app.py b/ansible/app_python/app.py
new file mode 100644
index 0000000000..9064052f8c
--- /dev/null
+++ b/ansible/app_python/app.py
@@ -0,0 +1,182 @@
+import os
+import logging
+import platform
+import socket
+from datetime import datetime, timezone
+
+import time
+from functools import wraps
+
+from flask import Flask, request, jsonify, Response
+from pythonjsonlogger import jsonlogger
+from prometheus_client import Counter, Histogram, Gauge, generate_latest, CONTENT_TYPE_LATEST
+
+# ----------------------
+# JSON Logging Setup
+# ----------------------
+# Root logger: records are formatted as JSON and written by a StreamHandler (stderr by default).
+logger = logging.getLogger()
+logHandler = logging.StreamHandler()
+formatter = jsonlogger.JsonFormatter(
+    fmt="%(asctime)s %(name)s %(levelname)s %(message)s"
+)
+logHandler.setFormatter(formatter)
+logger.addHandler(logHandler)
+logger.setLevel(logging.INFO)
+
+app = Flask(__name__)
+
+# Runtime settings come from the environment; DEBUG is on only for "true" (any case).
+HOST = os.getenv("HOST", "0.0.0.0")
+PORT = int(os.getenv("PORT", 5000))
+DEBUG = os.getenv("DEBUG", "False").lower() == "true"
+# Captured once at import time; get_uptime() measures from this instant.
+START_TIME = datetime.now(timezone.utc)
+
+# Prometheus metrics, updated by the track_metrics decorator.
+http_requests_total = Counter(
+    "http_requests_total",
+    "Total HTTP requests",
+    ["method", "endpoint", "status"],
+)
+# Duration of each decorated request, in seconds.
+http_request_duration_seconds = Histogram(
+    "http_request_duration_seconds",
+    "HTTP request duration",
+    ["method", "endpoint"],
+)
+# Decorated requests that have started but not yet finished.
+http_requests_in_progress = Gauge(
+    "http_requests_in_progress",
+    "HTTP requests currently being processed",
+)
+
+
+def track_metrics(func):
+    """Wrap a Flask view so each call updates the Prometheus request metrics.
+
+    Counts the request by method, path and status, observes its duration and
+    tracks it in the in-progress gauge. Exceptions propagate unchanged.
+    """
+    @wraps(func)
+    def wrapper(*args, **kwargs):
+        # Pre-set so `finally` still has a status when the view raises, including
+        # BaseExceptions (e.g. KeyboardInterrupt) that `except Exception` missed.
+        status = 500
+        http_requests_in_progress.inc()
+        started = time.perf_counter()  # monotonic, unaffected by wall-clock jumps
+        try:
+            response = func(*args, **kwargs)
+            # Return values without a status_code attribute are counted as 200.
+            status = getattr(response, "status_code", 200)
+            return response
+        finally:
+            elapsed = time.perf_counter() - started
+            labels = {"method": request.method, "endpoint": request.path}
+            http_requests_total.labels(status=str(status), **labels).inc()
+            http_request_duration_seconds.labels(**labels).observe(elapsed)
+            http_requests_in_progress.dec()
+    return wrapper
+
+
+def get_uptime():
+    """Return seconds elapsed since START_TIME plus an "H hours, M minutes" string."""
+    elapsed = int((datetime.now(timezone.utc) - START_TIME).total_seconds())
+    whole_hours, leftover = divmod(elapsed, 3600)
+    text = f"{whole_hours} hours, {leftover // 60} minutes"
+    return {"seconds": elapsed, "human": text}
+
+
+def get_system_info():
+    """Collect host facts: hostname, OS, architecture, CPU count, Python version."""
+    facts = {"hostname": socket.gethostname()}
+    facts["platform"] = platform.system()
+    facts["platform_version"] = platform.version()
+    facts["architecture"] = platform.machine()
+    facts["cpu_count"] = os.cpu_count()
+    facts["python_version"] = platform.python_version()
+    return facts
+
+
+@app.route("/health", methods=["GET"])
+@track_metrics
+def health():
+    """Health-check endpoint: report status, current UTC time and uptime in seconds."""
+    uptime = get_uptime()
+    payload = {
+        "status": "healthy",
+        "timestamp": datetime.now(timezone.utc).isoformat(),
+        "uptime_seconds": uptime["seconds"],
+    }
+    return jsonify(payload)
+
+@app.route("/ready")
+def ready():
+    """Always answer 200 "OK"; presumably the Kubernetes readiness-probe target."""
+    return "OK", 200
+
+
+@app.route("/metrics")
+def metrics():  # serves the output of prometheus_client.generate_latest()
+    return Response(generate_latest(), mimetype=CONTENT_TYPE_LATEST)
+
+
+@app.route("/", methods=["GET"])
+@track_metrics
+def default_route():
+    """Return service metadata, host facts, uptime and an echo of the request."""
+    logger.info(f"Request: {request.method} {request.path}")
+    uptime = get_uptime()
+
+    service = {
+        "name": "devops-info-service",
+        "version": "1.0.0",
+        "description": "DevOps course info service",
+        "framework": "Flask",
+    }
+    system = get_system_info()
+    runtime = {
+        "uptime_seconds": uptime["seconds"],
+        "uptime_human": uptime["human"],
+        "current_time": datetime.now(timezone.utc).isoformat(),
+        "timezone": "UTC",
+    }
+    caller = {
+        "client_ip": request.remote_addr,
+        "user_agent": request.headers.get("User-Agent"),
+        "method": request.method,
+        "path": request.path,
+    }
+    endpoints = [
+        {"path": "/", "method": "GET", "description": "Service information"},
+        {"path": "/health", "method": "GET", "description": "Health check"},
+    ]
+    body = {"service": service, "system": system, "runtime": runtime}
+    body.update({"request": caller, "endpoints": endpoints})
+    return jsonify(body)
+
+
+@app.errorhandler(404)
+def not_found(error):
+    """Answer 404 errors with a fixed JSON body; the error object is unused."""
+    body = {"error": "Not Found", "message": "Endpoint does not exist"}
+    return jsonify(body), 404
+
+
+@app.errorhandler(500)
+def internal_error(error):
+    """Answer 500 errors with a generic JSON body."""
+    # The error object is ignored, so no exception detail reaches the client.
+    body = {
+        "error": "Internal Server Error",
+        "message": "An unexpected error occurred",
+    }
+    return jsonify(body), 500
+
+
+if __name__ == "__main__":  # direct execution only; importing the module (e.g. in tests) skips this
+    logger.info("[+] Starting...")
+    try:
+        app.run(host=HOST, port=PORT, debug=DEBUG)  # Flask's built-in server; blocks until stopped
+    finally:
+        logger.info("[i] Shutting down")  # logged even when run() exits via an exception
diff --git a/ansible/app_python/docs/LAB03.md b/ansible/app_python/docs/LAB03.md
new file mode 100644
index 0000000000..a37f83c334
--- /dev/null
+++ b/ansible/app_python/docs/LAB03.md
@@ -0,0 +1,85 @@
+# LAB03 — Continuous Integration (CI/CD)
+[![Python CI & Docker Build](https://github.com/CacucoH/DevOps-Core-Course/actions/workflows/python-ci.yml/badge.svg)](https://github.com/CacucoH/DevOps-Core-Course/actions/workflows/python-ci.yml)
+
+## 1. Unit testing
+### 1.1 Testing framework choice
+To complete this lab I selected **pytest**:
+- Supports fixtures
+- Simple to use
+- Easily integrates with Flask
+
+#### 1.2 Tests structure explanation:
+- `test_root_endpoint_success`: Verifies GET / returns 200 status, checks complete JSON structure (service, system, runtime, request, endpoints fields), validates data types (str, int, list), and mocks uptime/system_info for consistent testing.
+- `test_health_endpoint_success`: Tests GET /health returns 200 status, confirms health JSON structure (status, timestamp, uptime_seconds), verifies string/integer data types.
+- `test_nonexistent_endpoint_404`: Ensures non-existent endpoint /nonexistent returns 404 status with correct error JSON structure ("Not Found" message).
+- `test_root_wrong_method_405`: Confirms POST to root / (unsupported method) returns 405 status code.
+- `test_health_wrong_method_405`: Verifies POST to /health (unsupported method) returns 405 status code.
+- `test_unsupported_methods_405`: Parametrized test checking PUT, DELETE, PATCH methods on various endpoints all return 405 status.
+- `test_empty_request_data`: Edge case test ensuring basic GET / works without additional request data, validates client_ip presence in response.
+- `test_with_headers`: Edge case testing custom User-Agent header, confirms request parsing correctly extracts and returns header value in JSON.
+
+#### 1.3 Running tests locally
+Execute (in main project directory)
+```bash
+pytest
+```
+All tests should pass
+![all tests passing](./screenshots/lab3/tests.png)
+
+### 2 CI Workflow
+CI workflow triggers on:
+- push to `main`, `dev`, and `lab3` branches
+- pull requests
+
+It performs:
+1. Linting (ruff)
+2. Testing (pytest)
+3. Coverage generation
+4. Docker build & push
+5. Snyk security scan
+
+
+## 2. Versioning Strategy
+I have chosen Calendar Versioning (CalVer YYYY.MM):
+- Format: 2026.02 (current month) + latest
+- Implementation: docker/metadata-action@v5 with type=raw,value={{date 'YYYY.MM'}}
+- Why CalVer: Perfect for CI/CD pipelines with frequent releases, date-based tracking
+
+### 2.1 Key Implementation Highlights
+CI Stages:
+1. Test job (matrix: Python 3.9-3.11)
+   - Ruff linting + formatting
+   - Pytest unit tests
+2. Docker job (depends on tests)
+   - Multi-tag strategy (latest + CalVer + branch)
+   - Docker layer caching for speed
+
+### 2.2 Triggers Logic:
+- main/dev push: full CI/CD (tests + Docker push)
+- PR: tests only (no Docker push)
+- Any branch: basic linting
+
+Also I used Git secrets:
+- DOCKER_USERNAME
+- DOCKERHUB_TOKEN (Docker Hub Access Token)
+- SNYK_TOKEN
+
+### 2.3 Evidence
+
+#### - [👉 Link to successful CI (full lab done)](https://github.com/CacucoH/DevOps-Core-Course/actions/runs/21959626699)
+#### - Tests passing locally:
+![all tests passing](./screenshots/lab3/tests.png)
+#### - [Docker image on Docker Hub](https://hub.docker.com/r/cacucoh/testiks) 
+
+
+## 3. Best Practices Implemented
+1. Matrix Testing: Tests Python 3.9-3.11 in parallel across multiple jobs, ensuring cross-version compatibility
+2. Job Dependencies: Docker build only runs after the test and security jobs finish successfully (needs: [test, security]), preventing broken images from being pushed
+3. Docker Layer Caching: cache-from/to: type=gha reduces build time from 5+ minutes to ~30 seconds on repeat runs
+4. Caching: Pip dependencies cached, so: 3min to 15sec speedup; Docker layers sped up from 5min to 30sec
+
+## 4. Key Decisions
+- Versioning Strategy: CalVer (YYYY.MM) chosen over SemVer because this is a CI/CD pipeline with frequent automated releases—dates provide instant temporal context without manual version management.
+- Docker Tags: Creates username/app:latest (production), username/app:2026.02 (monthly archive), username/app:main (branch tracking)—multiple tags enable flexible deployments and rollbacks.
+- Workflow Triggers: push to main/dev → full CI/CD; pull_request → tests only; all branches → linting—balances automation with safety (no Docker push from PRs/forks).
+- Test Coverage: Unit tests via pytest + linting/formatting via ruff cover code quality; integration/E2E tests and security scanning deferred to future tasks.
diff --git a/ansible/app_python/docs/screenshots/lab2/build.png b/ansible/app_python/docs/screenshots/lab2/build.png
new file mode 100644
index 0000000000..2bcd5dba45
Binary files /dev/null and b/ansible/app_python/docs/screenshots/lab2/build.png differ
diff --git a/ansible/app_python/docs/screenshots/lab2/curl.png b/ansible/app_python/docs/screenshots/lab2/curl.png
new file mode 100644
index 0000000000..90bc56653d
Binary files /dev/null and b/ansible/app_python/docs/screenshots/lab2/curl.png differ
diff --git a/ansible/app_python/docs/screenshots/lab2/images.png b/ansible/app_python/docs/screenshots/lab2/images.png
new file mode 100644
index 0000000000..0ceb08ec99
Binary files /dev/null and b/ansible/app_python/docs/screenshots/lab2/images.png differ
diff --git a/ansible/app_python/docs/screenshots/lab2/push.png b/ansible/app_python/docs/screenshots/lab2/push.png
new file mode 100644
index 0000000000..274af9a019
Binary files /dev/null and b/ansible/app_python/docs/screenshots/lab2/push.png differ
diff --git a/ansible/app_python/docs/screenshots/lab2/run.png b/ansible/app_python/docs/screenshots/lab2/run.png
new file mode 100644
index 0000000000..703e3f363c
Binary files /dev/null and b/ansible/app_python/docs/screenshots/lab2/run.png differ
diff --git a/ansible/app_python/docs/screenshots/lab3/tests.png b/ansible/app_python/docs/screenshots/lab3/tests.png
new file mode 100644
index 0000000000..628dd59d64
Binary files /dev/null and b/ansible/app_python/docs/screenshots/lab3/tests.png differ
diff --git a/ansible/app_python/requirements.txt b/ansible/app_python/requirements.txt
new file mode 100644
index 0000000000..9fdfd1b2ba
--- /dev/null
+++ b/ansible/app_python/requirements.txt
@@ -0,0 +1,3 @@
+Flask==3.1.2
+python-json-logger>=2.0.7,<4  # bounded: app.py imports the legacy pythonjsonlogger.jsonlogger module
+prometheus_client==0.23.1
\ No newline at end of file
diff --git a/ansible/app_python/tests/__init__.py b/ansible/app_python/tests/__init__.py
new file mode 100644
index 0000000000..e69de29bb2
diff --git a/ansible/app_python/tests/app_test.py b/ansible/app_python/tests/app_test.py
new file mode 100644
index 0000000000..033a4a8263
--- /dev/null
+++ b/ansible/app_python/tests/app_test.py
@@ -0,0 +1,123 @@
+import pytest
+from unittest.mock import patch
+from datetime import datetime, timezone
+from app import app
+
+
+@pytest.fixture
+def client():  # yields a Flask test client with TESTING mode switched on
+    app.config.update(TESTING=True)
+    with app.test_client() as test_client:
+        yield test_client
+
+
+@patch("app.get_uptime")
+@patch("app.get_system_info")
+@patch("app.datetime")
+def test_root_endpoint_success(mock_datetime, mock_system_info, mock_uptime, client):
+    """GET / answers 200 with all five sections and the expected value types.
+
+    Uptime, system info and the clock are mocked so the payload is deterministic.
+    """
+    # app.datetime is patched, so now() must hand back a real datetime for isoformat().
+    mock_datetime.now.return_value = datetime(2026, 2, 11, 22, 46, tzinfo=timezone.utc)
+    mock_uptime.return_value = {"seconds": 3600, "human": "1 hours, 0 minutes"}
+    mock_system_info.return_value = {
+        "hostname": "test-host",
+        "platform": "Linux",
+        "platform_version": "5.15",
+        "architecture": "x86_64",
+        "cpu_count": 4,
+        "python_version": "3.11.0",
+    }
+
+    response = client.get("/")
+    assert response.status_code == 200
+
+    data = response.get_json()
+    # Every top-level section must be present.
+    for section in ("service", "system", "runtime", "request", "endpoints"):
+        assert section in data
+
+    # Spot-check value types inside the sections.
+    assert isinstance(data["service"]["name"], str)
+    assert isinstance(data["system"]["cpu_count"], int)
+    assert isinstance(data["runtime"]["uptime_seconds"], int)
+    assert isinstance(data["endpoints"], list)
+    assert len(data["endpoints"]) == 2
+
+
+@patch("app.get_uptime")
+def test_health_endpoint_success(mock_uptime, client):
+    """GET /health answers 200 with status, timestamp and uptime fields."""
+    mock_uptime.return_value = {"seconds": 7200, "human": "2 hours, 0 minutes"}
+
+    response = client.get("/health")
+    assert response.status_code == 200
+
+    body = response.get_json()
+    assert body["status"] == "healthy"
+    # Only the types are checked: the timestamp comes from the real clock.
+    assert isinstance(body["timestamp"], str)
+    assert isinstance(body["uptime_seconds"], int)
+
+
+def test_nonexistent_endpoint_404(client):
+    """An unknown path answers 404 with the JSON body from the not_found handler."""
+    response = client.get("/nonexistent")
+    assert response.status_code == 404
+
+    payload = response.get_json()
+    assert payload["error"] == "Not Found"
+    message = payload["message"]
+    assert isinstance(message, str)
+    assert message == "Endpoint does not exist"
+
+
+def test_root_wrong_method_405(client):
+    """POST to / is rejected with 405 because the route only registers GET."""
+    # No mocks are set up: only the status code of the rejection is checked.
+    status = client.post("/").status_code
+    assert status == 405
+
+
+def test_health_wrong_method_405(client):
+    """POST to /health is rejected with 405 because the route only registers GET."""
+    # No mocks are set up: only the status code of the rejection is checked.
+    status = client.post("/health").status_code
+    assert status == 405
+
+
+# @patch('app.get_uptime', side_effect=Exception("Uptime calculation failed"))
+# def test_internal_server_error_500(mock_uptime, client):
+#     """Test for internal server error response, status 500, data structure."""
+#     response = client.get('/')
+
+#     assert response.status_code == 500
+
+#     data = response.get_json()
+#     assert data["error"] == "Internal Server Error"
+#     assert isinstance(data["message"], str)
+#     assert data["message"] == "An unexpected error occurred"
+
+# @patch('app.socket.gethostname', side_effect=Exception("Hostname resolution failed"))
+# def test_system_info_error_500(client):
+#     """Test for get_system_info error - 500."""
+#     response = client.get('/')
+
+#     assert response.status_code == 500
+
+
+def test_empty_request_data(client):
+    """Edge case: a bare GET / with no custom headers still reports client_ip."""
+    reply = client.get("/")
+    assert reply.status_code == 200
+    assert "client_ip" in reply.get_json()["request"]
+
+
+def test_with_headers(client):
+    """Edge case: the request's User-Agent header is echoed back in the payload."""
+    agent = "TestAgent/1.0"
+    reply = client.get("/", headers={"User-Agent": agent})
+    echoed = reply.get_json()["request"]["user_agent"]
+    assert echoed == agent
diff --git a/ansible/docs/LAB05.md b/ansible/docs/LAB05.md
new file mode 100644
index 0000000000..e99f13bc13
--- /dev/null
+++ b/ansible/docs/LAB05.md
@@ -0,0 +1,237 @@
+# Lab 5 — Ansible Fundamentals
+
+### Architecture Overview
+#### Ansible Version Used
+Installed on Linux using apt
+
+```bash
+$ ansible --version       
+ansible [core 2.20.1]
+  config file = None
+  configured module search path = ['/home/segfault/.ansible/plugins/modules', '/usr/share/ansible/plugins/modules']
+  ansible python module location = /usr/lib/python3/dist-packages/ansible
+  ansible collection location = /home/segfault/.ansible/collections:/usr/share/ansible/collections
+  executable location = /usr/bin/ansible
+  python version = 3.13.11 (main, Dec  8 2025, 11:43:54) [GCC 15.2.0] (/usr/bin/python3)
+  jinja version = 3.1.6
+  pyyaml version = 6.0.3 (with libyaml v0.2.5)
+```
+
+### Target VM
+
+I used the VM that I created in the previous lab:
+- Debian 13 (6.12.63 amd-64)
+- 4 GB RAM
+- 10 GB disk space
+- Network adapter in Bridged mode
+- Static IP (192.168.1.145)
+- SSH server is installed and configured
+- Public SSH key added to `~/.ssh/authorized_keys`
+
+Ansible connects via SSH using key-based auth
+
+### Ansible Project Structure
+The project follows a role-based architecture:
+```
+ansible/
+├── inventory/
+│   └── hosts.ini
+├── roles/
+│   ├── common/
+│   ├── docker/
+│   └── app_deploy/
+├── playbooks/
+│   ├── provision.yml
+│   └── deploy.yml
+├── group_vars/
+│   └── all.yml (Vault encrypted)
+├── ansible.cfg
+└── docs/LAB05.md
+```
+
+### Why Roles Instead of Monolithic Playbooks?
+**Because roles improve modularity, reusability, and maintainability**
+
+Instead of putting everything in one large playbook, roles let you split infrastructure into logical components (e.g., web server, database, users). Each role has a defined structure (tasks, vars, handlers), which makes the code easier to read and manage
+
+### Connectivity check:
+
+![alt text](./img/ping.png)
+
+![connect](./img/rce.png)
+
+This confirms that the SSH connection works correctly for Ansible
+
+### Roles
+#### Common
+##### Purpose
+Provides baseline system configuration (packages, users, timezone, basic security settings, updates)
+
+##### Variables
+- common_packages – list of packages to install (default: basic utilities)
+- timezone – system timezone (default: UTC)
+- common_create_user – whether to create a deploy user (default: true)
+```
+common_packages:
+  - python3-pip
+  - curl
+  - git
+  - vim
+  - htop
+timezone: "UTC"
+```
+
+##### Handlers
+- Restart SSH
+- Reload systemd
+
+##### Dependencies
+- None
+
+#### Docker
+##### Purpose
+Installs and configures Docker engine and related components.
+
+##### Variables (key examples)
+- docker_version – Docker package version (default: latest)
+- docker_users – list of users added to docker group
+- docker_daemon_options – custom daemon.json configuration
+
+##### Handlers
+- Restart Docker
+```
+- name: Restart Docker
+  service:
+    name: docker
+    state: restarted
+```
+
+##### Dependencies
+May depend on common (for base packages and users)
+
+#### App_deploy
+##### Purpose
+Deploys and configures the application (pulls image, runs container, sets environment variables).
+
+#### Variables
+- app_image – Docker image name
+- app_tag – image tag (default: latest)
+- app_env – environment variables
+- app_port – exposed port
+```
+restart_policy: unless-stopped
+env_vars: {}
+```
+
+##### Handlers
+- Restart application container
+- Reload reverse proxy (if applicable)
+```
+- name: Restart application container
+  community.docker.docker_container:
+    name: "{{ app_container_name }}"
+    state: started
+    restart: true
+```
+
+##### Dependencies
+- Depends on docker
+- May depend on common
+
+### Idempotency Demonstration
+#### Run playbook first time
+
+![alt text](./img/first.png)
+
+Observe:
+- New packages installed
+- Docker installed
+- Docker started
+- User added to docker group
+
+#### Run playbook second time
+
+![alt text](./img/second.png)
+
+
+On the second run of the playbook, all tasks showed changed = 0 because the system was already in the desired state
+
+#### Analysis
+
+- First run:
+Tasks that installed packages (common_packages, Docker packages), updated the apt cache, created users/groups, and set the timezone all showed changed = 1 because these actions modified the system to reach the desired state
+
+- Second run:
+All tasks showed changed = 0 because the system was already in the desired state. Nothing needed to be updated or modified
+
+#### Explanation of Idempotency
+The roles are idempotent because:
+- Stateful modules were used (apt: state=present, service: state=started, user: state=present) rather than shell commands
+- Variables define the desired state (package lists, timezone, users), so tasks only act when the system differs from that state
+- Handlers (like Docker restart) only trigger when notified
+
+
+### Ansible Vault
+Sensitive data stored in `group_vars/all.yml` file
+
+I created it using:
+```bash
+ansible-vault create group_vars/all.yml
+```
+
+All of its contents are encrypted:
+```
+$ANSIBLE_VAULT;1.1;AES256
+62613132333831643565386162386637626234636236356236353639353632626364363137633265
+3864393263303166333738663434653033333636643261310a373832303831613239616636393234
+36383830643236666232633936613439653836333832376330393665633134623333653662336264
+3836626638303961660a326533376539663131623337643230366238323638303562633563393062
+63663538316636643732396435643262656566666136336564373531343834326235653164643063...
+```
+
+#### Stored Secrets
+- DH username
+- DH access token
+- App configuration
+
+#### Why Vault Is Important
+- Prevents credential exposure in Git
+- Secure automation
+
+The Vault password is entered interactively during the deploy process:
+```bash
+ansible-playbook playbooks/deploy.yml --ask-vault-pass
+```
+
+
+### Deployment Verification
+
+Deploy terminal output:
+![alt text](./img/deployed.png)
+
+Checking `docker ps` on the remote VM:
+![alt text](./img/docekrps.png)
+
+Check if server is up:
+![alt text](./img/healthcheck.png)
+
+### Key decisions
+
+Why use roles instead of plain playbooks?
+- Roles structure playbooks into modular, logical units, making them easier to read, maintain, and scale
+
+How do roles improve reusability?
+- Roles encapsulate tasks, defaults, handlers, and variables, allowing the same logic to be applied across multiple projects or environments
+
+What makes a task idempotent?
+- A task is idempotent if running it multiple times results in the same system state, with changes applied only when necessary
+
+How do handlers improve efficiency?
+- Handlers run only when notified by tasks, avoiding unnecessary service restarts and reducing redundant operations
+
+Why is Ansible Vault necessary?
+- Vault secures sensitive data like passwords, tokens, and keys, keeping credentials encrypted while still usable in playbooks
+
+### Challenges
+- Docker repository on Debian 13 required using Debian 12 repo to avoid missing Release files
+- Missing variables (e.g., docker_image_tag) caused container creation errors — fixed by defining defaults or vault variables
\ No newline at end of file
diff --git a/ansible/docs/LAB06.md b/ansible/docs/LAB06.md
new file mode 100644
index 0000000000..25d153dea2
--- /dev/null
+++ b/ansible/docs/LAB06.md
@@ -0,0 +1,324 @@
+# Lab 6 — Advanced Ansible & CI/CD
+
+### Task 1: Blocks & Tags
+#### Implementation Details
+In this task, I refactored Ansible roles using blocks and tags to make the playbooks easier to read and manage. Blocks were used to group related tasks together and apply common settings such as become, when, and tags. Error handling was added using rescue blocks, and always blocks were used to run tasks that should execute regardless of success or failure
+
+#### Tag Strategy
+
+The following tags were used:
+- common – entire common role
+- packages – package installation tasks
+- users – user management tasks
+- docker – entire docker role
+- docker_install – Docker installation tasks
+- docker_config – Docker configuration tasks
+
+These tags allow specific tasks to be executed when running the playbook
+
+#### Evidence
+
+List all tags:
+```bash
+ansible-playbook playbooks/provision.yml --list-tags
+```
+Example output:
+```bash
+play #1 (webservers): Provision web servers   TAGS: []
+      TASK TAGS: [common, docker, docker_config, docker_install, packages, users]
+```
+Run only Docker tasks:
+```bash
+ansible-playbook playbooks/provision.yml --tags "docker"
+```
+Run only package tasks:
+```bash
+ansible-playbook playbooks/provision.yml --tags "packages"
+```
+Run only Docker installation:
+```bash
+ansible-playbook playbooks/provision.yml --tags "docker_install"
+```
+Skip the common role:
+```bash
+ansible-playbook playbooks/provision.yml --skip-tags "common"
+```
+
+#### Tags listing
+
+![alt text](./img/lab6_oleg.png)
+
+#### Second run
+![alt text](./img/lab6_2ndrun.png)
+
+#### Docker-tasks execution
+
+![alt text](./img/lab6_outp.png)
+
+#### Research Answers
+
+##### What happens if the rescue block also fails?
+If the rescue block fails, the playbook will fail. However, the always section will still run
+
+##### Can you have nested blocks?
+Yes, Ansible supports nested blocks. A block can contain another block if more complex task grouping is needed
+
+##### How do tags inherit in blocks?
+Tags applied to a block are automatically applied to all tasks inside that block. This means you do not need to add the same tag to every task  
+
+### Task 2: Upgrade to Docker Compose
+#### Implementation Details
+
+In this task, I upgraded app deployment from `docker run` to Docker Compose. Docker Compose allows the container configuration to be written in a file instead of long command-line commands. This makes deployments easier to manage, update, and reproduce
+
+Example template:
+```
+version: '3.8'
+
+services:
+  {{ app_name }}:
+    image: {{ docker_image }}:{{ docker_tag }}
+    container_name: {{ app_name }}
+    ports:
+      - "{{ app_port }}:{{ app_internal_port }}"
+    environment:
+      APP_NAME: "{{ app_name }}"
+      APP_PORT: "{{ app_internal_port }}"
+    restart: unless-stopped
+```
+
+This allows the application configuration to be changed easily by modifying variables
+
+#### Role Dependency
+The testiks role depends on the docker role so Docker is installed before deploying the application
+
+File `roles/testiks/meta/main.yml`
+Example configuration:
+```yml
+---
+dependencies:
+  - role: docker
+```
+This ensures Docker is always installed before attempting to deploy containers
+
+#### Before / After Comparison
+
+##### Before
+```bash
+docker run -d \
+-p 8000:8000 \
+--name devops-app \
+your_dockerhub_username/devops-info-service:latest
+```
+
+This approach requires long commands and is harder to maintain or update
+
+##### After (Docker Compose):
+```yml
+services:
+  devops-app:
+    image: your_dockerhub_username/devops-info-service:latest
+    ports:
+      - "8000:8000"
+    restart: unless-stopped
+```
+Using Docker Compose provides a declarative configuration, meaning the desired state of the container is defined in a file
+
+Advantages of this approach:
+- easier configuration management
+- reusable templates with variables
+- better support for multi-container setups
+- simpler updates and redeployments
+
+#### Evidence
+```bash
+$ ansible-playbook playbooks/deploy.yml --become-password-file .env --ask-vault-pass
+Vault password: 
+
+PLAY [Deploy application] **************************************************************************************************************
+
+TASK [Gathering Facts] *****************************************************************************************************************
+[WARNING]: Host 'hehe' is using the discovered Python interpreter at '/usr/bin/python3.12', but future installation of another Python interpreter could cause a different interpreter to be discovered. See https://docs.ansible.com/ansible-core/2.20/reference_appendices/interpreter_discovery.html for more information.
+ok: [hehe]
+
+TASK [docker : Install required system packages] ***************************************************************************************
+ok: [hehe]
+
+TASK [docker : Create keyrings directory] **********************************************************************************************
+ok: [hehe]
+
+TASK [docker : Add Docker GPG key] *****************************************************************************************************
+ok: [hehe]
+
+TASK [docker : Add Docker repository] **************************************************************************************************
+ok: [hehe]
+
+TASK [docker : Install Docker packages] ************************************************************************************************
+ok: [hehe]
+
+TASK [docker : Ensure Docker service is enabled] ***************************************************************************************
+ok: [hehe]
+
+TASK [docker : Add user to docker group] ***********************************************************************************************
+ok: [hehe]
+
+TASK [docker : Install python docker module] *******************************************************************************************
+ok: [hehe]
+
+TASK [testiks : Create application directory] ******************************************************************************************
+changed: [hehe]
+
+TASK [testiks : Template docker-compose.yml] *******************************************************************************************
+changed: [hehe]
+
+TASK [testiks : Login to Docker Hub] ***************************************************************************************************
+changed: [hehe]
+
+TASK [testiks : Start containers with Docker Compose] **********************************************************************************
+changed: [hehe]
+
+PLAY RECAP *****************************************************************************************************************************
+hehe              : ok=15   changed=4    unreachable=0    failed=0    skipped=0    rescued=0    ignored=0   
+```
+
+#### Accessibility Verification
+```bash
+┌──(segfault㉿aboltus2)-[~/Downloads]
+└─$ ssh debil@192.168.0.152
+debil@192.168.0.152's password: 
+Linux hehe 6.12.73+deb13-amd64 #1 SMP PREEMPT_DYNAMIC Debian 6.12.73-1 (2026-02-17) x86_64
+
+The programs included with the Debian GNU/Linux system are free software;
+the exact distribution terms for each program are described in the
+individual files in /usr/share/doc/*/copyright.
+
+Debian GNU/Linux comes with ABSOLUTELY NO WARRANTY, to the extent
+permitted by applicable law.
+Last login: Thu Mar  5 20:38:39 2026 from 192.168.0.145
+debil@hehe:~$ docker ps
+CONTAINER ID   IMAGE                 COMMAND           CREATED         STATUS         PORTS                              NAMES
+d3ec91cbb47e   cacucoh/testiks:1.0   "python app.py"   4 minutes ago   Up 4 minutes   0.0.0.0:5000->5000/tcp, 8000/tcp   TESTIKS
+debil@hehe:~$ 
+debil@hehe:~$ curl -s http://localhost:5000/ | jq .
+{
+  "endpoints": [
+    {
+      "description": "Service information",
+      "method": "GET",
+      "path": "/"
+    },
+    {
+      "description": "Health check",
+      "method": "GET",
+      "path": "/health"
+    }
+  ],
+  "request": {
+    "client_ip": "172.17.0.1",
+    "method": "GET",
+    "path": "/",
+    "user_agent": "curl/8.14.1"
+  },
+  "runtime": {
+    "current_time": "2026-03-05T20:46:09.269567+00:00",
+    "timezone": "UTC",
+    "uptime_human": "49 hours, 27 minutes",
+    "uptime_seconds": 178058
+  },
+  "service": {
+    "description": "DevOps course info service",
+    "framework": "Flask",
+    "name": "devops-info-service",
+    "version": "1.0.0"
+  },
+  "system": {
+    "architecture": "x86_64",
+    "cpu_count": 1,
+    "hostname": "d3ec91cbb47e",
+    "platform": "Linux",
+    "platform_version": "#1 SMP PREEMPT_DYNAMIC Debian 6.12.73-1 (2026-02-17)",
+    "python_version": "3.12.12"
+  }
+}
+
+```
+
+### Task 4: CI/CD
+#### GitHub Actions Workflow
+
+#### Secrets
+These secrets are in GitHub repository settings:
+- ANSIBLE_VAULT_PASSWORD
+- SSH_PRIVATE_KEY
+- SERVER_IP
+
+```yml
+name: Ansible Deployment
+
+on:
+  push:
+    branches: [ main, master, ci-cd ]
+    paths:
+      - 'ansible/**'
+      - '.github/workflows/ansible-deploy.yml'
+  workflow_dispatch:  # manual trigger
+
+jobs:
+  deploy:
+    runs-on: ubuntu-latest
+    
+    steps:
+    - name: Checkout code
+      uses: actions/checkout@v3
+      
+    - name: Set up Python
+      uses: actions/setup-python@v4
+      with:
+        python-version: '3.12'
+        
+    - name: Install Ansible & dependencies
+      run: |
+        python -m pip install --upgrade pip
+        pip install ansible ansible-lint  # community.docker ships inside the ansible package
+        ansible --version
+        
+    - name: Create Vault password file
+      run: echo "${{ secrets.ANSIBLE_VAULT_PASSWORD }}" > .vault_pass
+
+    - name: Setup SSH key
+      run: |
+        mkdir -p ~/.ssh
+        echo "${{ secrets.SSH_PRIVATE_KEY }}" > ~/.ssh/id_ed25519
+        chmod 600 ~/.ssh/id_ed25519
+        ssh-keyscan -H ${{ secrets.SERVER_IP }} >> ~/.ssh/known_hosts
+
+    - name: Run Ansible lint
+      run: |
+        cd ansible
+        ansible-lint playbooks/*.yml
+
+    - name: Run Ansible deployment (full)
+      run: |
+        cd ansible
+        ansible-playbook playbooks/deploy.yml \
+          -i inventory/hosts.ini \
+          --vault-password-file ../.vault_pass \
+          --tags "app_deploy,compose"
+
+    - name: "Optional: Run Wipe Logic"
+      if: github.event.inputs.run_wipe == 'true'
+      run: |
+        cd ansible
+        ansible-playbook playbooks/deploy.yml \
+          -i inventory/hosts.ini \
+          --vault-password-file ../.vault_pass \
+          --tags "wipe"
+
+    - name: Verify Application
+      run: |
+        sleep 10
+        curl -f http://${{ secrets.SERVER_IP }}:5000 || exit 1
+        curl -f http://${{ secrets.SERVER_IP }}:5000/health || exit 1
+```
+
+### Documentation
\ No newline at end of file
diff --git a/ansible/docs/img/deployed.png b/ansible/docs/img/deployed.png
new file mode 100644
index 0000000000..52f5e3eb52
Binary files /dev/null and b/ansible/docs/img/deployed.png differ
diff --git a/ansible/docs/img/docekrps.png b/ansible/docs/img/docekrps.png
new file mode 100644
index 0000000000..f60802d6a3
Binary files /dev/null and b/ansible/docs/img/docekrps.png differ
diff --git a/ansible/docs/img/first.png b/ansible/docs/img/first.png
new file mode 100644
index 0000000000..36f2ea4550
Binary files /dev/null and b/ansible/docs/img/first.png differ
diff --git a/ansible/docs/img/healthcheck.png b/ansible/docs/img/healthcheck.png
new file mode 100644
index 0000000000..d75e5f4865
Binary files /dev/null and b/ansible/docs/img/healthcheck.png differ
diff --git a/ansible/docs/img/lab6_2ndrun.png b/ansible/docs/img/lab6_2ndrun.png
new file mode 100644
index 0000000000..380f3a1b98
Binary files /dev/null and b/ansible/docs/img/lab6_2ndrun.png differ
diff --git a/ansible/docs/img/lab6_oleg.png b/ansible/docs/img/lab6_oleg.png
new file mode 100644
index 0000000000..c9f5f39065
Binary files /dev/null and b/ansible/docs/img/lab6_oleg.png differ
diff --git a/ansible/docs/img/lab6_outp.png b/ansible/docs/img/lab6_outp.png
new file mode 100644
index 0000000000..e73c0c6b4b
Binary files /dev/null and b/ansible/docs/img/lab6_outp.png differ
diff --git a/ansible/docs/img/ping.png b/ansible/docs/img/ping.png
new file mode 100644
index 0000000000..3ae37999b1
Binary files /dev/null and b/ansible/docs/img/ping.png differ
diff --git a/ansible/docs/img/rce.png b/ansible/docs/img/rce.png
new file mode 100644
index 0000000000..30352dda0a
Binary files /dev/null and b/ansible/docs/img/rce.png differ
diff --git a/ansible/docs/img/second.png b/ansible/docs/img/second.png
new file mode 100644
index 0000000000..c60eb2f7fd
Binary files /dev/null and b/ansible/docs/img/second.png differ
diff --git a/ansible/group_vars/all.yml b/ansible/group_vars/all.yml
new file mode 100644
index 0000000000..c9cc532b92
--- /dev/null
+++ b/ansible/group_vars/all.yml
@@ -0,0 +1,17 @@
+$ANSIBLE_VAULT;1.1;AES256
+30346539663138386333633962306237623637376138663438333761656537636430336230313165
+6430653163363662373437343666626234396333653339660a366463646631653133366536393166
+65323862666636386338396131613939383936353661343065623736313737613631643636393239
+6634636465393533390a643239313037303564623139363231323537323864353432353838666136
+34643031306365623332623438656137623365666531363334373665616238653836353730326334
+35336665663630346662393936633736393939363632643831316435633633616366373363666438
+32376537303937303366643163616566633334396234376361383637343536376331356233343134
+38386639393865346638373231323238633363353335343730333038613439643535353366313931
+63306639303037633039316336613966313034343166623163613433626539396535303138666166
+34636533616336653530343933336438316539356162616335666365323539643563393931383334
+37326563303031623839333236383262613839326462313738396635636166663139653036383866
+36616636333338393233336665363439306664333661663532303263356435333436613133346232
+62303334653165373733356162323663633466316564363438623865633036386239343038373763
+62636137303639313033616539643731303434633462613264656534393837303065386636386535
+62363038663564316234643964373162353461373962633036303536326631623533653366653765
+31313931663163656634
diff --git a/ansible/inventory/hosts.ini b/ansible/inventory/hosts.ini
new file mode 100644
index 0000000000..35c9b8379c
--- /dev/null
+++ b/ansible/inventory/hosts.ini
@@ -0,0 +1,2 @@
+[webservers]
+hehe ansible_host=192.168.0.152 ansible_user=debil ansible_ssh_private_key_file=~/.ssh/temp
diff --git a/ansible/playbooks/deploy.yml b/ansible/playbooks/deploy.yml
new file mode 100644
index 0000000000..b77f528c7a
--- /dev/null
+++ b/ansible/playbooks/deploy.yml
@@ -0,0 +1,7 @@
+---
+- name: Deploy application
+  hosts: webservers
+  become: true
+
+  roles:
+    - app_deploy
\ No newline at end of file
diff --git a/ansible/playbooks/provision.yml b/ansible/playbooks/provision.yml
new file mode 100644
index 0000000000..17d437513f
--- /dev/null
+++ b/ansible/playbooks/provision.yml
@@ -0,0 +1,8 @@
+---
+- name: Provision web servers
+  hosts: webservers
+  become: true
+
+  roles:
+    - common
+    - docker
\ No newline at end of file
diff --git a/ansible/playbooks/site.yml b/ansible/playbooks/site.yml
new file mode 100644
index 0000000000..e69de29bb2
diff --git a/ansible/roles/app_deploy/defaults/main.yml b/ansible/roles/app_deploy/defaults/main.yml
new file mode 100644
index 0000000000..b257cd7417
--- /dev/null
+++ b/ansible/roles/app_deploy/defaults/main.yml
@@ -0,0 +1,3 @@
+restart_policy: unless-stopped
+env_vars: {}
+docker_image: ""
\ No newline at end of file
diff --git a/ansible/roles/app_deploy/handlers/main.yml b/ansible/roles/app_deploy/handlers/main.yml
new file mode 100644
index 0000000000..9c835acaa9
--- /dev/null
+++ b/ansible/roles/app_deploy/handlers/main.yml
@@ -0,0 +1,5 @@
+- name: Restart application container
+  community.docker.docker_container:
+    name: "{{ app_container_name }}"
+    state: started
+    restart: true
\ No newline at end of file
diff --git a/ansible/roles/app_deploy/tasks/main.yml b/ansible/roles/app_deploy/tasks/main.yml
new file mode 100644
index 0000000000..77a28b4638
--- /dev/null
+++ b/ansible/roles/app_deploy/tasks/main.yml
@@ -0,0 +1,59 @@
+# Never echo vaulted secrets to the log; just fail early if one is missing.
+- name: Verify DockerHub credentials are defined
+  ansible.builtin.assert:
+    that: ["dockerhub_username is defined", "dockerhub_password is defined"]
+    quiet: true
+
+- name: Docker login with Vault
+  block:
+    - name: Log in to Docker Hub
+      community.docker.docker_login:
+        username: "{{ dockerhub_username }}"
+        password: "{{ dockerhub_password }}"
+  tags:
+    - docker
+
+- name: Set docker_image full name
+  set_fact:
+    docker_image_full: "{{ dockerhub_username }}/{{ app_name }}"
+
+- name: Pull Docker image
+  community.docker.docker_image:
+    name: "{{ docker_image_full }}"
+    tag: "{{ docker_image_tag }}"
+    source: pull
+
+- name: Stop existing container
+  community.docker.docker_container:
+    name: "{{ app_container_name }}"
+    state: stopped
+  ignore_errors: yes
+
+- name: Remove old container
+  community.docker.docker_container:
+    name: "{{ app_container_name }}"
+    state: absent
+  ignore_errors: yes
+
+- name: Run new container
+  community.docker.docker_container:
+    name: "{{ app_container_name }}"
+    image: "{{ docker_image_full }}:{{ docker_image_tag }}"
+    state: started
+    restart_policy: "{{ restart_policy }}"
+    ports:
+      - "{{ app_port }}:{{ app_port }}"
+    env: "{{ env_vars }}"
+  notify: Restart application container
+
+- name: Wait for application to start
+  wait_for:
+    host: 127.0.0.1
+    port: "{{ app_port }}"
+    delay: 5
+    timeout: 30
+
+- name: Check health endpoint
+  uri:
+    url: "http://127.0.0.1:{{ app_port }}/health"
+    status_code: 200
\ No newline at end of file
diff --git a/ansible/roles/common/defaults/main.yml b/ansible/roles/common/defaults/main.yml
new file mode 100644
index 0000000000..0ae0d191b6
--- /dev/null
+++ b/ansible/roles/common/defaults/main.yml
@@ -0,0 +1,9 @@
+---
+common_packages:
+  - python3-pip
+  - curl
+  - git
+  - vim
+  - htop
+
+timezone: "UTC"
\ No newline at end of file
diff --git a/ansible/roles/common/tasks/main.yml b/ansible/roles/common/tasks/main.yml
new file mode 100644
index 0000000000..ff61b48805
--- /dev/null
+++ b/ansible/roles/common/tasks/main.yml
@@ -0,0 +1,65 @@
+---
+# roles/common/tasks/main.yml
+
+- name: Package management tasks
+  block:
+
+    - name: Update apt cache
+      apt:
+        update_cache: yes
+
+    # Use the role default list (common_packages in defaults/main.yml) so the
+    # set of packages has a single source of truth and can be overridden
+    # from inventory or group_vars without editing this task.
+    # The default list also includes python3-pip.
+    - name: Install common packages
+      apt:
+        name: "{{ common_packages }}"
+        state: present
+
+  rescue:
+
+    - name: Fix apt cache if update fails
+      command: apt-get update --fix-missing
+
+  always:
+
+    - name: Log package block completion
+      copy:
+        content: "Package block executed at {{ ansible_date_time.iso8601 }}"
+        dest: /tmp/common_packages_done.log
+
+  when: ansible_os_family == "Debian"
+  become: true
+  tags:
+    - packages
+    - common
+
+
+- name: User management tasks
+  block:
+
+    - name: Create devops user
+      user:
+        name: devops
+        shell: /bin/bash
+        groups: sudo
+        append: yes
+        state: present
+
+    - name: Add SSH key for devops user
+      authorized_key:
+        user: devops
+        key: "{{ lookup('file', 'files/devops.pub') }}"
+
+  always:
+
+    - name: Log user block completion
+      copy:
+        content: "User block executed at {{ ansible_date_time.iso8601 }}"
+        dest: /tmp/common_users_done.log
+
+  become: true
+  tags:
+    - users
+    - common
\ No newline at end of file
diff --git a/ansible/roles/docker/defaults/main.yml b/ansible/roles/docker/defaults/main.yml
new file mode 100644
index 0000000000..d3de4c96fe
--- /dev/null
+++ b/ansible/roles/docker/defaults/main.yml
@@ -0,0 +1,8 @@
+---
+docker_packages:
+  - docker-ce
+  - docker-ce-cli
+  - containerd.io
+
+docker_users:
+  - "{{ ansible_user }}"
\ No newline at end of file
diff --git a/ansible/roles/docker/handlers/main.yml b/ansible/roles/docker/handlers/main.yml
new file mode 100644
index 0000000000..f5700a7c2d
--- /dev/null
+++ b/ansible/roles/docker/handlers/main.yml
@@ -0,0 +1,4 @@
+- name: restart docker
+  service:
+    name: docker
+    state: restarted
\ No newline at end of file
diff --git a/ansible/roles/docker/tasks/main.yml b/ansible/roles/docker/tasks/main.yml
new file mode 100644
index 0000000000..113a27f02a
--- /dev/null
+++ b/ansible/roles/docker/tasks/main.yml
@@ -0,0 +1,92 @@
+---
+- name: Docker installation
+  block:
+
+    - name: Update apt cache
+      apt:
+        update_cache: yes
+
+    - name: Install required dependencies
+      apt:
+        name:
+          - ca-certificates
+          - curl
+          - gnupg
+        state: present
+        update_cache: yes
+
+    - name: Download Docker GPG key
+      ansible.builtin.get_url:
+        url: "https://download.docker.com/linux/{{ ansible_distribution | lower }}/gpg"
+        dest: /tmp/docker.gpg
+        mode: '0644'
+    # Dearmor the key into the keyring path that the repo entry's signed-by uses.
+    - name: Install Docker GPG key
+      ansible.builtin.command: "gpg --dearmor -o /etc/apt/keyrings/docker.gpg /tmp/docker.gpg"
+      args:
+        creates: /etc/apt/keyrings/docker.gpg
+
+    - name: Add Docker repository
+      apt_repository:
+        repo: "deb [signed-by=/etc/apt/keyrings/docker.gpg] https://download.docker.com/linux/{{ ansible_distribution | lower }} {{ ansible_distribution_release }} stable"
+        state: present
+
+    - name: Install Docker
+      apt:
+        name:
+          - docker-ce
+          - docker-ce-cli
+          - containerd.io
+        state: present
+        update_cache: yes
+
+  rescue:
+
+    - name: Wait before retrying
+      pause:
+        seconds: 10
+
+    - name: Retry apt update
+      apt:
+        update_cache: yes
+
+  always:
+
+    - name: Ensure Docker service is running
+      service:
+        name: docker
+        state: started
+        enabled: yes
+
+  become: true
+  tags:
+    - docker
+    - docker_install
+
+
+- name: Docker configuration
+  block:
+
+    - name: Add devops user to docker group
+      user:
+        name: devops
+        groups: docker
+        append: yes
+
+    - name: Create Docker config directory
+      file:
+        path: /etc/docker
+        state: directory
+        mode: '0755'
+
+  always:
+
+    - name: Verify Docker service enabled
+      service:
+        name: docker
+        enabled: yes
+
+  become: true
+  tags:
+    - docker
+    - docker_config
\ No newline at end of file
diff --git a/k8s/HELM.md b/k8s/HELM.md
new file mode 100644
index 0000000000..33d7238c6f
--- /dev/null
+++ b/k8s/HELM.md
@@ -0,0 +1,719 @@
+# Helm Package Manager — Lab 10
+
+## Task 1 — Helm Fundamentals
+
+### Installation
+
+I installed Helm 4 directly from the apt package manager and verified the version:
+
+```
+$ sudo apt install helm
+$ helm version
+version.BuildInfo{Version:"v4.1.3", GitCommit:"c94d381b03be117e7e57908edbf642104e00eb8f", GitTreeState:"clean", GoVersion:"go1.26.1", KubeClientVersion:"v1.35"}
+```
+
+Helm 4 is the current major release (November 2025). It keeps backward compatibility with Helm 3 charts (`apiVersion: v2`) and, like Helm 3, needs no in-cluster Tiller component — the client talks to the Kubernetes API directly.
+
+### Exploring a Public Chart
+
+I added the Prometheus Community repository and inspected its chart metadata:
+
+```
+$ helm repo add prometheus-community https://prometheus-community.github.io/helm-charts
+$ helm repo update
+$ helm show chart prometheus-community/prometheus
+annotations:
+  artifacthub.io/license: Apache-2.0
+apiVersion: v2
+appVersion: v3.11.0
+dependencies:
+- condition: alertmanager.enabled
+  name: alertmanager
+  repository: https://prometheus-community.github.io/helm-charts
+  version: 1.34.*
+- condition: kube-state-metrics.enabled
+  name: kube-state-metrics
+  repository: https://prometheus-community.github.io/helm-charts
+  version: 7.2.*
+- condition: prometheus-node-exporter.enabled
+  name: prometheus-node-exporter
+  repository: https://prometheus-community.github.io/helm-charts
+  version: 4.52.*
+- condition: prometheus-pushgateway.enabled
+  name: prometheus-pushgateway
+  repository: https://prometheus-community.github.io/helm-charts
+  version: 3.6.*
+description: Prometheus is a monitoring system and time series database.
+home: https://prometheus.io/
+keywords:
+- monitoring
+- prometheus
+kubeVersion: '>=1.19.0-0'
+maintainers:
+- email: gianrubio@gmail.com
+  name: gianrubio
+name: prometheus
+type: application
+version: 28.15.0
+```
+
+Inspecting this chart showed how real-world charts manage multi-component applications via sub-chart dependencies and conditions.
+
+### Why Helm Matters
+
+Without Helm every environment requires its own copy of manifests with values edited by hand. Helm solves this with Go templating: one chart can be installed into dev with 1 replica and relaxed resource limits, or into prod with 5 replicas and tighter limits, by just passing a different values file. It also provides versioned rollbacks and lifecycle hooks for free.
+
+---
+
+## 1. Chart Overview
+
+### Chart Structure
+
+I created the chart in `k8s/testiks/` using `helm create k8s/testiks` as a scaffold, then replaced the generated templates with ones based on the Lab 9 manifests.
+
+```
+k8s/testiks/
+├── Chart.yaml                          # chart metadata
+├── values.yaml                         # default configuration
+├── values-dev.yaml                     # development overrides
+├── values-prod.yaml                    # production overrides
+└── templates/
+    ├── _helpers.tpl                    # named template definitions
+    ├── deployment.yaml                 # Deployment resource
+    ├── service.yaml                    # Service resource
+    ├── NOTES.txt                       # post-install usage message
+    └── hooks/
+        ├── pre-install-job.yaml        # pre-install hook Job
+        └── post-install-job.yaml       # post-install hook Job
+```
+
+### Key Template Files
+
+**`Chart.yaml`** — chart metadata with `apiVersion: v2` (Helm 3+), semantic version, and app version:
+
+```yaml
+apiVersion: v2
+name: testiks
+description: Helm chart for py web application
+type: application
+version: 0.1.0
+appVersion: "1.0.0"
+keywords:
+  - python
+  - web
+maintainers:
+  - name: CacucoH
+    email: dfffd7800@gmail.com
+```
+
+**`_helpers.tpl`** — named templates called with `include` across all resources:
+- `testiks.fullname` — `<release>-<chart>`, truncated to 63 characters
+- `testiks.labels` — full set of `app.kubernetes.io/*` labels
+- `testiks.selectorLabels` — subset used in `matchLabels` and pod labels
+
+**`deployment.yaml`** — all per-environment values (replicas, image, resources, probe timing) are read from `.Values` via Go templates.
+
+**`service.yaml`** — `type`, `port`, and `nodePort` all come from `.Values.service`; `nodePort` is only emitted when `service.type == NodePort`.
+
+**`hooks/pre-install-job.yaml`** and **`hooks/post-install-job.yaml`** — Kubernetes Jobs managed by Helm outside the normal release resources.
+
+### Values Organisation Strategy
+
+Values are grouped by concern rather than by Kubernetes kind, making environment overrides intuitive:
+
+```yaml
+replicaCount: 3
+
+image:
+  repository: cacucoh/testiks
+  tag: "1.0.0"
+  pullPolicy: IfNotPresent
+
+containerPort: 5000
+
+service:
+  type: NodePort
+  port: 80
+  targetPort: 5000
+  nodePort: 30081
+
+resources:
+  requests:
+    cpu: 100m
+    memory: 128Mi
+  limits:
+    cpu: 250m
+    memory: 256Mi
+
+livenessProbe:
+  httpGet:
+    path: /health
+    port: 5000
+  initialDelaySeconds: 15
+  periodSeconds: 10
+  timeoutSeconds: 2
+  failureThreshold: 3
+
+readinessProbe:
+  httpGet:
+    path: /health
+    port: 5000
+  initialDelaySeconds: 5
+  periodSeconds: 5
+  timeoutSeconds: 2
+  failureThreshold: 3
+
+hooks:
+  deleteAfterSuccess: true
+```
+
+---
+
+## 2. Configuration Guide
+
+### Important Values
+
+| Value | Default | Purpose |
+|---|---|---|
+| `replicaCount` | `3` | Number of pod replicas |
+| `image.repository` | `cacucoh/testiks` | Container image name |
+| `image.tag` | `1.0.0` | Image tag; falls back to `appVersion` |
+| `image.pullPolicy` | `IfNotPresent` | Pull policy |
+| `containerPort` | `5000` | Port the application listens on |
+| `service.type` | `NodePort` | `NodePort` for local, `LoadBalancer` for cloud |
+| `service.port` | `80` | Service port |
+| `service.nodePort` | `30081` | Fixed NodePort (only applied when type is NodePort) |
+| `resources.requests.*` | see above | Scheduler resource requests |
+| `resources.limits.*` | see above | Runtime resource caps |
+| `livenessProbe.*` | see above | Liveness check path, port, and timing |
+| `readinessProbe.*` | see above | Readiness check path, port, and timing |
+| `hooks.deleteAfterSuccess` | `true` | Delete hook Jobs after successful completion |
+
+### Environment Customization
+
+**`values-dev.yaml`** — minimal footprint, fixed NodePort, `latest` tag:
+
+```yaml
+replicaCount: 1
+
+image:
+  tag: "latest"
+  pullPolicy: Always
+
+service:
+  type: NodePort
+  nodePort: 30081
+
+resources:
+  requests:
+    cpu: 50m
+    memory: 64Mi
+  limits:
+    cpu: 100m
+    memory: 128Mi
+
+livenessProbe:
+  initialDelaySeconds: 5
+  periodSeconds: 10
+
+readinessProbe:
+  initialDelaySeconds: 3
+  periodSeconds: 5
+```
+
+**`values-prod.yaml`** — high-availability, LoadBalancer, pinned tag:
+
+```yaml
+replicaCount: 5
+
+image:
+  tag: "1.0.0"
+  pullPolicy: IfNotPresent
+
+service:
+  type: LoadBalancer
+
+resources:
+  requests:
+    cpu: 200m
+    memory: 256Mi
+  limits:
+    cpu: 500m
+    memory: 512Mi
+
+livenessProbe:
+  initialDelaySeconds: 30
+  periodSeconds: 5
+
+readinessProbe:
+  initialDelaySeconds: 10
+  periodSeconds: 3
+```
+
+### Example Installations
+
+```bash
+# Development
+helm install dev ./k8s/testiks \
+  -f k8s/testiks/values-dev.yaml \
+  --namespace lab10-dev --create-namespace
+
+# Production
+helm install prod ./k8s/testiks \
+  -f k8s/testiks/values-prod.yaml \
+  --namespace lab10-prod --create-namespace
+
+# Single value override without a file
+helm install dev ./k8s/testiks \
+  -f k8s/testiks/values-dev.yaml \
+  --set replicaCount=2 \
+  --namespace lab10-dev --create-namespace
+```
+
+---
+
+## 3. Hook Implementation
+
+### What I Implemented and Why
+
+**Pre-install hook** (`templates/hooks/pre-install-job.yaml`) — a `busybox` Job that runs before any chart resources are created. It prints the release name and namespace as a validation step. In a real scenario this slot would hold a database schema migration or secrets check.
+
+**Post-install hook** (`templates/hooks/post-install-job.yaml`) — a `curlimages/curl` Job that polls `GET /health` on the newly installed Service with a retry loop (30 attempts, 2 s apart). Helm only marks the release `deployed` after this Job completes successfully, giving an automated smoke test.
+
+### Execution Order and Weights
+
+| Hook | `helm.sh/hook` | Weight | Image |
+|---|---|---|---|
+| Pre-install | `pre-install` | `-5` | `busybox:1.36` |
+| Post-install | `post-install` | `5` | `curlimages/curl:8.5.0` |
+
+Lower weight executes first. Pre-install and post-install are separate lifecycle phases so they cannot race, but explicit weights make the order unambiguous when adding more hooks later.
+
+### Deletion Policies
+
+Both hooks use `"helm.sh/hook-delete-policy": hook-succeeded` by default, which deletes the Job as soon as it completes successfully, keeping the namespace clean. Setting `hooks.deleteAfterSuccess: false` in values switches to `before-hook-creation`, leaving Jobs around for debugging.
+
+---
+
+## 4. Installation Evidence
+
+### Cluster Setup
+
+```text
+$ kubectl config current-context
+minikube
+
+$ kubectl cluster-info
+Kubernetes control plane is running at https://127.0.0.1:65035
+CoreDNS is running at https://127.0.0.1:65035/api/v1/namespaces/kube-system/services/kube-dns:dns/proxy
+
+$ kubectl get nodes
+NAME       STATUS   ROLES           AGE   VERSION
+minikube   Ready    control-plane   8d    v1.32.0
+```
+
+### Development Install
+
+```text
+$ helm install dev ./k8s/testiks \
+  -f k8s/testiks/values-dev.yaml \
+  --namespace lab10-dev --create-namespace
+NAME: dev
+LAST DEPLOYED: Thu Apr  2 19:39:50 2026
+NAMESPACE: lab10-dev
+STATUS: deployed
+REVISION: 1
+TEST SUITE: None
+NOTES:
+1. Get the application URL by running these commands:
+  export NODE_PORT=$(kubectl get --namespace lab10-dev -o jsonpath="{.spec.ports[0].nodePort}" services dev-testiks)
+  export NODE_IP=$(kubectl get nodes --namespace lab10-dev -o jsonpath="{.items[0].status.addresses[0].address}")
+  echo http://$NODE_IP:$NODE_PORT/health
+
+Release: dev
+Namespace: lab10-dev
+```
+
+```text
+$ helm list -n lab10-dev
+NAME  NAMESPACE  REVISION  UPDATED                              STATUS    CHART          APP VERSION
+dev   lab10-dev  1         2026-04-02 19:39:50.110994 +0300    deployed  testiks-0.1.0  1.0.0
+```
+
+```text
+$ kubectl get all -n lab10-dev
+NAME                                       READY   STATUS    RESTARTS   AGE
+pod/dev-testiks-84579bd9bb-8mnkp           1/1     Running   0          62s
+
+NAME                          TYPE       CLUSTER-IP       EXTERNAL-IP   PORT(S)        AGE
+service/dev-testiks           NodePort   10.103.117.200   <none>        80:30081/TCP   62s
+
+NAME                              READY   UP-TO-DATE   AVAILABLE   AGE
+deployment.apps/dev-testiks       1/1     1            1           62s
+
+NAME                                         DESIRED   CURRENT   READY   AGE
+replicaset.apps/dev-testiks-84579bd9bb       1         1         1       62s
+```
+
+### Hook Execution
+
+With default `hooks.deleteAfterSuccess: true` the hook Jobs disappear after success. I reinstalled with `hooks.deleteAfterSuccess: false` to inspect them:
+
+```text
+$ kubectl get jobs -n lab10-dev
+NAME                            STATUS     COMPLETIONS   DURATION   AGE
+dev-testiks-pre-install         Complete   1/1           3s         15s
+dev-testiks-post-install        Complete   1/1           4s         12s
+```
+
+```text
+$ kubectl describe job dev-testiks-pre-install -n lab10-dev
+Name:             dev-testiks-pre-install
+Namespace:        lab10-dev
+Annotations:      helm.sh/hook: pre-install
+                  helm.sh/hook-weight: -5
+Pods Statuses:    0 Active / 1 Succeeded / 0 Failed
+Start Time:       Thu, 02 Apr 2026 19:48:28 +0300
+Completed At:     Thu, 02 Apr 2026 19:48:31 +0300
+Duration:         3s
+Events:
+  Normal  SuccessfulCreate  22s  job-controller  Created pod: dev-testiks-pre-install-q8xgb
+  Normal  Completed         19s  job-controller  Job completed
+```
+
+```text
+$ kubectl logs -n lab10-dev job/dev-testiks-pre-install
+pre-install: release=dev ns=lab10-dev
+pre-install OK
+```
+
+```text
+$ kubectl logs -n lab10-dev job/dev-testiks-post-install
+post-install: smoke GET http://dev-testiks.lab10-dev.svc.cluster.local:80/health
+{"status":"healthy","timestamp":"2026-04-02T16:48:32.488027+00:00","uptime_seconds":507}
+post-install OK
+```
+
+### Production Install
+
+```text
+$ helm install prod ./k8s/testiks \
+  -f k8s/testiks/values-prod.yaml \
+  --namespace lab10-prod --create-namespace
+NAME: prod
+LAST DEPLOYED: Thu Apr  2 19:51:57 2026
+NAMESPACE: lab10-prod
+STATUS: deployed
+REVISION: 1
+```
+
+```text
+$ kubectl get all -n lab10-prod
+NAME                                          READY   STATUS    RESTARTS   AGE
+pod/prod-testiks-05dff54df9-b77f4             1/1     Running   0          75s
+pod/prod-testiks-05dff54df9-lf2j2             1/1     Running   0          75s
+pod/prod-testiks-05dff54df9-q54dt             1/1     Running   0          75s
+pod/prod-testiks-05dff54df9-sw95m             1/1     Running   0          75s
+pod/prod-testiks-05dff54df9-z45wb             1/1     Running   0          75s
+
+NAME                          TYPE           CLUSTER-IP       EXTERNAL-IP   PORT(S)        AGE
+service/prod-testiks          LoadBalancer   10.103.135.218   <pending>     80:31854/TCP   75s
+
+NAME                              READY   UP-TO-DATE   AVAILABLE   AGE
+deployment.apps/prod-testiks      5/5     5            5           75s
+
+NAME                                         DESIRED   CURRENT   READY   AGE
+replicaset.apps/prod-testiks-05dff54df9      5         5         5       75s
+```
+
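+`EXTERNAL-IP` stays `<pending>` in minikube because nothing provisions a load balancer there (unless `minikube tunnel` is running), so I accessed the service via port-forward: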
+
+```bash
+kubectl port-forward -n lab10-prod svc/prod-testiks 8080:80
+```
+
+---
+
+## 5. Operations
+
+### Install
+
+```bash
+# Dev
+helm install dev ./k8s/testiks \
+  -f k8s/testiks/values-dev.yaml \
+  --namespace lab10-dev --create-namespace
+
+# Prod
+helm install prod ./k8s/testiks \
+  -f k8s/testiks/values-prod.yaml \
+  --namespace lab10-prod --create-namespace
+```
+
+### Upgrade
+
+```bash
+helm upgrade prod ./k8s/testiks \
+  -f k8s/testiks/values-prod.yaml \
+  --namespace lab10-prod
+```
+
+```text
+Release "prod" has been upgraded. Happy Helming!
+NAME: prod
+LAST DEPLOYED: Thu Apr  2 19:54:16 2026
+NAMESPACE: lab10-prod
+STATUS: deployed
+REVISION: 2
+```
+
+### Rollback
+
+```bash
+helm history dev -n lab10-dev
+helm rollback dev 1 -n lab10-dev
+```
+
+### Uninstall
+
+```bash
+helm uninstall dev  -n lab10-dev
+helm uninstall prod -n lab10-prod
+```
+
+---
+
+## 6. Testing & Validation
+
+### Lint
+
+```text
+$ helm lint ./k8s/testiks
+==> Linting ./k8s/testiks
+[INFO] Chart.yaml: icon is recommended
+1 chart(s) linted, 0 chart(s) failed
+
+$ helm lint ./k8s/testiks -f k8s/testiks/values-dev.yaml
+==> Linting ./k8s/testiks
+[INFO] Chart.yaml: icon is recommended
+1 chart(s) linted, 0 chart(s) failed
+
+$ helm lint ./k8s/testiks -f k8s/testiks/values-prod.yaml
+==> Linting ./k8s/testiks
+[INFO] Chart.yaml: icon is recommended
+1 chart(s) linted, 0 chart(s) failed
+```
+
+### Template Rendering
+
+Dev environment (1 replica, `latest` tag, NodePort):
+
+```text
+$ helm template dev ./k8s/testiks -f k8s/testiks/values-dev.yaml -n lab10-dev
+---
+# Source: testiks/templates/deployment.yaml
+apiVersion: apps/v1
+kind: Deployment
+metadata:
+  name: dev-testiks
+  labels:
+    helm.sh/chart: testiks-0.1.0
+    app.kubernetes.io/name: testiks
+    app.kubernetes.io/instance: dev
+    app.kubernetes.io/version: "1.0.0"
+    app.kubernetes.io/managed-by: Helm
+spec:
+  replicas: 1
+  selector:
+    matchLabels:
+      app.kubernetes.io/name: testiks
+      app.kubernetes.io/instance: dev
+  strategy:
+    type: RollingUpdate
+    rollingUpdate:
+      maxSurge: 1
+      maxUnavailable: 0
+  template:
+    metadata:
+      labels:
+        app.kubernetes.io/name: testiks
+        app.kubernetes.io/instance: dev
+    spec:
+      securityContext:
+        seccompProfile:
+          type: RuntimeDefault
+      containers:
+        - name: testiks
+          image: "cacucoh/testiks:latest"
+          imagePullPolicy: Always
+          ports:
+            - name: http
+              containerPort: 5000
+              protocol: TCP
+          resources:
+            limits:
+              cpu: 100m
+              memory: 128Mi
+            requests:
+              cpu: 50m
+              memory: 64Mi
+          securityContext:
+            runAsUser: 10001
+            runAsGroup: 10001
+            runAsNonRoot: true
+            allowPrivilegeEscalation: false
+            capabilities:
+              drop:
+                - ALL
+          livenessProbe:
+            httpGet:
+              path: /health
+              port: 5000
+            initialDelaySeconds: 5
+            periodSeconds: 10
+            timeoutSeconds: 2
+            failureThreshold: 3
+          readinessProbe:
+            httpGet:
+              path: /health
+              port: 5000
+            initialDelaySeconds: 3
+            periodSeconds: 5
+            timeoutSeconds: 2
+            failureThreshold: 3
+---
+# Source: testiks/templates/service.yaml
+apiVersion: v1
+kind: Service
+metadata:
+  name: dev-testiks
+  labels:
+    helm.sh/chart: testiks-0.1.0
+    app.kubernetes.io/name: testiks
+    app.kubernetes.io/instance: dev
+    app.kubernetes.io/version: "1.0.0"
+    app.kubernetes.io/managed-by: Helm
+spec:
+  type: NodePort
+  selector:
+    app.kubernetes.io/name: testiks
+    app.kubernetes.io/instance: dev
+  ports:
+    - name: http
+      protocol: TCP
+      port: 80
+      targetPort: http
+      nodePort: 30081
+```
+
+### Dry-Run
+
+```text
+$ helm install dev-dryrun ./k8s/testiks \
+  -f k8s/testiks/values-dev.yaml \
+  --namespace lab-dryrun --create-namespace \
+  --dry-run=client
+NAME: dev-dryrun
+LAST DEPLOYED: Thu Apr  2 19:53:17 2026
+NAMESPACE: lab-dryrun
+STATUS: pending-install
+REVISION: 1
+TEST SUITE: None
+HOOKS:
+---
+# Source: testiks/templates/hooks/pre-install-job.yaml
+apiVersion: batch/v1
+kind: Job
+metadata:
+  name: "dev-dryrun-testiks-pre-install"
+  annotations:
+    helm.sh/hook: pre-install
+    helm.sh/hook-weight: "-5"
+    helm.sh/hook-delete-policy: hook-succeeded
+  labels:
+    helm.sh/chart: testiks-0.1.0
+    app.kubernetes.io/name: testiks
+    app.kubernetes.io/instance: dev-dryrun
+    app.kubernetes.io/version: "1.0.0"
+    app.kubernetes.io/managed-by: Helm
+spec:
+  backoffLimit: 2
+  template:
+    metadata:
+      labels:
+        app.kubernetes.io/managed-by: Helm
+        helm.sh/hook: pre-install
+    spec:
+      restartPolicy: Never
+      containers:
+        - name: pre-install
+          image: busybox:1.36
+          command:
+            - sh
+            - -c
+            - |
+              set -e
+              echo "pre-install: release=dev-dryrun ns=lab-dryrun"
+              echo "pre-install OK"
+---
+# Source: testiks/templates/hooks/post-install-job.yaml
+apiVersion: batch/v1
+kind: Job
+metadata:
+  name: "dev-dryrun-testiks-post-install"
+  annotations:
+    helm.sh/hook: post-install
+    helm.sh/hook-weight: "5"
+    helm.sh/hook-delete-policy: hook-succeeded
+  labels:
+    helm.sh/chart: testiks-0.1.0
+    app.kubernetes.io/name: testiks
+    app.kubernetes.io/instance: dev-dryrun
+    app.kubernetes.io/version: "1.0.0"
+    app.kubernetes.io/managed-by: Helm
+spec:
+  backoffLimit: 3
+  template:
+    metadata:
+      labels:
+        app.kubernetes.io/managed-by: Helm
+        helm.sh/hook: post-install
+    spec:
+      restartPolicy: Never
+      containers:
+        - name: post-install
+          image: "curlimages/curl:8.5.0"
+          command:
+            - sh
+            - -c
+            - |
+              set -e
+              URL="http://dev-dryrun-testiks.lab-dryrun.svc.cluster.local:80/health"
+              echo "post-install: smoke GET $URL"
+              i=0
+              while [ "$i" -lt 30 ]; do
+                if curl -fsS --connect-timeout 3 --max-time 10 "$URL"; then
+                  echo "post-install OK"
+                  exit 0
+                fi
+                i=$((i + 1))
+                echo "post-install: retry $i/30"
+                sleep 2
+              done
+              echo "post-install: health check failed" >&2
+              exit 1
+```
+
+### Application Accessibility
+
+```text
+$ curl -sS -i localhost:8080/health
+HTTP/1.1 200 OK
+Server: Werkzeug/3.1.7 Python/3.13.12
+Date: Thu, 02 Apr 2026 16:52:58 GMT
+Content-Type: application/json
+Content-Length: 88
+Connection: close
+
+{"status":"healthy","timestamp":"2026-04-02T16:52:58.654555+00:00","uptime_seconds":41}
+```
diff --git a/k8s/README.md b/k8s/README.md
new file mode 100644
index 0000000000..0c2db86455
--- /dev/null
+++ b/k8s/README.md
@@ -0,0 +1,160 @@
+## Lab 9 — Kubernetes Fundamentals
+
+The system architecture is based on a Deployment named `testiks`:
+- Workload: `Deployment/testiks`
+- Replicas: **three Pods** by default (scaled to 5 later); process listens on **TCP 5000**
+- Service exposure: `Service/testiks` of type **NodePort**
+
+Communications diagram:
+
+```mermaid
+flowchart TB
+    Service["testiks service<br/>type: NodePort<br/>80 → targetPort: http (5000)<br/>nodePort: 30080"]
+    Deployment["Deployment<br/>replicas: 3<br/>strategy: RollingUpdate"]
+
+    Pod1["Pod<br/>:5000"]
+    Pod2["Pod<br/>:5000"]
+    Pod3["Pod<br/>:5000"]
+
+    Service -->|selector: app=testiks| Deployment
+    Deployment --> Pod1
+    Deployment --> Pod2
+    Deployment --> Pod3
+```
+
+## Manifest Files
+
+| File             | Usage                                                                                                                                                                                                                              |
+| ---------------- | ---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
+| `deployment.yml` | Creates and manages the application Pods; creates the `Deployment` and defines replica count, rolling update strategy, resource requests/limits. Performs healthchecks: `livenessProbe` on `/health`, `readinessProbe` on `/ready` |
+| `service.yml`    | Creates a `Service` of type NodePort, selects Pods using the Deployment label selector, exposes port `80` and routes to container `targetPort: 5000`                                                                               |
+
+Key choices:
+- `replicas: 3` provides basic high availability even on a single-node local cluster.
+- `maxUnavailable: 0` keeps all existing Pods serving traffic during rollout (when readiness passes).
+- requests/limits are small but realistic for a lightweight Flask app.
+- `port: 80` is convenient for clients; application stays on `5000`.
+- NodePort allows access via `minikube service ... --url`.
+
+## Deployment Evidence
+
+### Cluster objects
+![](./img/pods.png)
+
+### Detailed pods + services
+
+![](./img/detailed.png)
+
+### Deployment description
+```
+└─$ kubectl describe deployment testiks            
+Name:                   testiks
+Namespace:              default
+CreationTimestamp:      Thu, 26 Mar 2026 12:49:02 +0300
+Labels:                 app=testiks
+                        component=api
+Annotations:            deployment.kubernetes.io/revision: 16
+Selector:               app=testiks
+Replicas:               3 desired | 3 updated | 3 total | 3 available | 0 unavailable
+StrategyType:           RollingUpdate
+MinReadySeconds:        0
+RollingUpdateStrategy:  0 max unavailable, 1 max surge
+Pod Template:
+  Labels:       app=testiks
+                component=api
+  Annotations:  kubectl.kubernetes.io/restartedAt: 2026-03-26T13:30:43+03:00
+  Containers:
+   app:
+    Image:      cacucoh/testiks:lab9
+    Port:       5000/TCP
+    Host Port:  0/TCP
+    Limits:
+      cpu:     500m
+      memory:  256Mi
+    Requests:
+      cpu:      100m
+      memory:   128Mi
+    Liveness:   http-get http://:http/health delay=15s timeout=3s period=10s #success=1 #failure=3
+    Readiness:  http-get http://:http/ready delay=5s timeout=2s period=5s #success=1 #failure=3
+    Environment:
+      PORT:        5000
+    Mounts:        <none>
+  Volumes:         <none>
+  Node-Selectors:  <none>
+  Tolerations:     <none>
+Conditions:
+  Type           Status  Reason
+  ----           ------  ------
+  Available      True    MinimumReplicasAvailable
+  Progressing    True    NewReplicaSetAvailable
+OldReplicaSets:  testiks-6dd7b49449 (0/0 replicas created), testiks-6c99d58d4d (0/0 replicas created), testiks-7f5cfd8947 (0/0 replicas created), testiks-7cb7974599 (0/0 replicas created), testiks-849474fb78 (0/0 replicas created), testiks-5dcd66d7c6 (0/0 replicas created), testiks-559cd698df (0/0 replicas created), testiks-6c8fdf9559 (0/0 replicas created), testiks-6f96859f5b (0/0 replicas created), testiks-6c976bcf57 (0/0 replicas created)
+NewReplicaSet:   testiks-764db4db6 (3/3 replicas created)
+Events:
+  Type    Reason             Age                   From                   Message
+  ----    ------             ----                  ----                   -------
+  Normal  ScalingReplicaSet  44m                   deployment-controller  Scaled up replica set testiks-c65d77cf5 from 0 to 3
+  Normal  ScalingReplicaSet  42m                   deployment-controller  Scaled up replica set testiks-7d66876995 from 0 to 1
+  Normal  ScalingReplicaSet  39m                   deployment-controller  Scaled down replica set testiks-c65d77cf5 from 3 to 2
+  Normal  ScalingReplicaSet  39m                   deployment-controller  Scaled up replica set testiks-7c7fbdfbf4 from 0 to 1
+  Normal  ScalingReplicaSet  37m                   deployment-controller  Scaled down replica set testiks-c65d77cf5 from 2 to 1
+  Normal  ScalingReplicaSet  37m                   deployment-controller  Scaled up replica set testiks-698df5d97c from 0 to 1
+  Normal  ScalingReplicaSet  31m                   deployment-controller  Scaled down replica set testiks-c65d77cf5 from 1 to 0
+  Normal  ScalingReplicaSet  31m                   deployment-controller  Scaled up replica set testiks-6dd7b49449 from 0 to 1
+  Normal  ScalingReplicaSet  30m                   deployment-controller  Scaled down replica set testiks-7d66876995 from 1 to 0
+  Normal  ScalingReplicaSet  30m                   deployment-controller  Scaled up replica set testiks-6c99d58d4d from 0 to 1
+  Normal  ScalingReplicaSet  18m                   deployment-controller  Scaled down replica set testiks-7c7fbdfbf4 from 1 to 0
+  Normal  ScalingReplicaSet  18m                   deployment-controller  Scaled up replica set testiks-7f5cfd8947 from 0 to 1
+  Normal  ScalingReplicaSet  15m                   deployment-controller  Scaled down replica set testiks-698df5d97c from 1 to 0
+  Normal  ScalingReplicaSet  15m                   deployment-controller  Scaled up replica set testiks-7cb7974599 from 0 to 1
+  Normal  ScalingReplicaSet  14m                   deployment-controller  Scaled down replica set testiks-6dd7b49449 from 1 to 0
+  Normal  ScalingReplicaSet  14m                   deployment-controller  Scaled up replica set testiks-849474fb78 from 0 to 1
+  Normal  ScalingReplicaSet  12m                   deployment-controller  Scaled down replica set testiks-6c99d58d4d from 1 to 0
+  Normal  ScalingReplicaSet  12m                   deployment-controller  Scaled up replica set testiks-5dcd66d7c6 from 0 to 1
+  Normal  ScalingReplicaSet  12m                   deployment-controller  Scaled down replica set testiks-7f5cfd8947 from 1 to 0
+  Normal  ScalingReplicaSet  2m30s (x14 over 12m)  deployment-controller  (combined from similar events): Scaled down replica set testiks-6c976bcf57 from 1 to 0
+```
+### Endpoints
+```
+└─$ kubectl get endpoints testiks
+
+Warning: v1 Endpoints is deprecated in v1.33+; use discovery.k8s.io/v1 EndpointSlice
+
+NAME                  ENDPOINTS                                                        AGE
+testiks               10.244.0.41:5000,10.244.0.42:5000,10.244.0.43:5000 + 2 more...   17m
+
+NAME                        ADDRESSTYPE   PORTS   ENDPOINTS                                         AGE
+testiks-8lkwr               IPv4          5000    10.244.0.41,10.244.0.42,10.244.0.43 + 2 more...   17m
+```
+
+### Curl tests
+![](./img/curl.png)
+
+### Scaling to 5 pods
+![](./img/scale.png)
+```
+kubectl scale deployment testiks --replicas=5
+kubectl rollout restart deployment/testiks
+kubectl rollout status deployment/testiks
+kubectl get pods
+```
+
+### Rollback
+![](./img/rollback.png)
+
+## 5. Production Considerations
+**Health checks:** **Liveness** probes call **`/health`** so Kubernetes restarts the container if the HTTP server stops responding while the process is still running. **Readiness** probes call **`/ready`** so traffic is only sent to Pods that report ready, which avoids routing to Pods that are still starting or temporarily overloaded.
+
+**Resource limits:** Limits (**256Mi** memory, **500m** CPU) bound worst-case usage on shared nodes. Requests (**128Mi**, **100m**) reserve a minimum so the scheduler does not overcommit the node. Values are conservative for a small API and would be raised after measuring steady-state and peak load.
+
+**Improvements for a real production environment**:
+- Add **startupProbe** for slow-start applications.
+- Add `PodDisruptionBudget` to preserve availability during voluntary disruptions.
+- Use `HorizontalPodAutoscaler` (HPA) based on CPU/RPS.
+- Use private registry + `imagePullSecrets`, pin image tags (no `latest`), sign images.
+- Use namespaces, NetworkPolicies, and secrets management (e.g., External Secrets/Vault).
+
+**Monitoring and observability:** The application exposes **Prometheus metrics** at `/metrics` for request rates, latency, and errors. Cluster-level metrics come from **kube-state-metrics** and **cAdvisor** when integrated with Prometheus. Logs can be collected with a node agent and centralized (for example **Loki**) for correlation with metric alerts.
+
+### Challenges & Solutions
+
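+**Docker image issues:** I pushed changes to my Python app (added the `/ready` endpoint), but Kubernetes kept running the old code. With `imagePullPolicy: IfNotPresent`, a node that already has an image with the requested tag does not pull it again, so the rebuilt image was never fetched. Building and pushing the image under a new tag (`lab9`) and updating the Deployment solved the problem.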
\ No newline at end of file
diff --git a/k8s/deployment.yml b/k8s/deployment.yml
new file mode 100644
index 0000000000..7f2abf3e7f
--- /dev/null
+++ b/k8s/deployment.yml
@@ -0,0 +1,67 @@
+apiVersion: apps/v1
+kind: Deployment
+metadata:
+  name: testiks
+  labels:
+    app: testiks
+    component: api
+spec:
+  replicas: 3
+  selector:
+    matchLabels:
+      app: testiks  # must match the Pod template labels below
+  strategy:
+    type: RollingUpdate
+    rollingUpdate:
+      maxUnavailable: 0  # never drop below the desired replica count during a rollout
+      maxSurge: 1  # at most one extra Pod above the replica count while rolling
+  template:
+    metadata:
+      labels:
+        app: testiks
+        component: api
+    spec:
+      securityContext:  # Pod-level identity: unprivileged UID/GID 1000
+        runAsNonRoot: true
+        runAsUser: 1000
+        runAsGroup: 1000
+        fsGroup: 1000
+      containers:
+        - name: app
+          image: cacucoh/testiks:lab9
+          imagePullPolicy: IfNotPresent
+          ports:
+            - name: http  # both probes below refer to this port by name
+              containerPort: 5000
+              protocol: TCP
+          env:
+            - name: PORT
+              value: '5000'  # quoted: env values must be strings
+          securityContext:
+            allowPrivilegeEscalation: false
+            capabilities:
+              drop:
+                - ALL
+          resources:
+            limits:
+              cpu: 500m
+              memory: 256Mi
+            requests:
+              cpu: 100m
+              memory: 128Mi
+          readinessProbe:  # gates Service traffic to the Pod
+            httpGet:
+              path: /ready
+              port: http
+            initialDelaySeconds: 5
+            periodSeconds: 5
+            timeoutSeconds: 2
+            failureThreshold: 3
+          livenessProbe:  # restarts the container after repeated failures
+            httpGet:
+              path: /health
+              port: http
+            initialDelaySeconds: 15
+            periodSeconds: 10
+            timeoutSeconds: 3
+            failureThreshold: 3
\ No newline at end of file
diff --git a/k8s/img/curl.png b/k8s/img/curl.png
new file mode 100644
index 0000000000..4d34a7296c
Binary files /dev/null and b/k8s/img/curl.png differ
diff --git a/k8s/img/detailed.png b/k8s/img/detailed.png
new file mode 100644
index 0000000000..a3519d5583
Binary files /dev/null and b/k8s/img/detailed.png differ
diff --git a/k8s/img/pods.png b/k8s/img/pods.png
new file mode 100644
index 0000000000..2a28ee99b1
Binary files /dev/null and b/k8s/img/pods.png differ
diff --git a/k8s/img/rollback.png b/k8s/img/rollback.png
new file mode 100644
index 0000000000..2a9510e821
Binary files /dev/null and b/k8s/img/rollback.png differ
diff --git a/k8s/img/scale.png b/k8s/img/scale.png
new file mode 100644
index 0000000000..9ad947e1ee
Binary files /dev/null and b/k8s/img/scale.png differ
diff --git a/k8s/service.yml b/k8s/service.yml
new file mode 100644
index 0000000000..d91419e221
--- /dev/null
+++ b/k8s/service.yml
@@ -0,0 +1,16 @@
+apiVersion: v1
+kind: Service
+metadata:
+  name: testiks
+  labels:
+    app: testiks
+spec:
+  type: NodePort  # exposes the Service on a static port of every node
+  selector:
+    app: testiks  # traffic goes to pods carrying this label
+  ports:
+    - name: http
+      protocol: TCP
+      port: 80  # port the Service listens on inside the cluster
+      targetPort: http  # resolved to the pod's container port named "http"
+      nodePort: 30080  # fixed node port; must be free on the cluster
\ No newline at end of file
diff --git a/k8s/testiks/Chart.yaml b/k8s/testiks/Chart.yaml
new file mode 100644
index 0000000000..6e658a2710
--- /dev/null
+++ b/k8s/testiks/Chart.yaml
@@ -0,0 +1,12 @@
+apiVersion: v2  # chart API version used by Helm 3 and later
+name: testiks
+description: Helm chart for py web application
+type: application
+version: 0.1.0  # chart version; rendered into the helm.sh/chart label
+appVersion: "1.0.0"  # app version; default image tag when image.tag is empty
+keywords:
+  - python
+  - web
+maintainers:
+  - name: CacucoH
+    email: dfffd7800@gmail.com
diff --git a/k8s/testiks/HELM.md b/k8s/testiks/HELM.md
new file mode 100644
index 0000000000..ce82315fb8
--- /dev/null
+++ b/k8s/testiks/HELM.md
@@ -0,0 +1,586 @@
+## Helm Package Manager (Lab 10)
+### Chart structure
+
+This Helm chart follows a standard and production-ready structure for deploying a Kubernetes application. Below is an explanation of each component and its purpose.
+
+### Root Directory
+
+```
+testiks/
+├── Chart.yaml
+├── values.yaml
+├── values-dev.yaml
+├── values-prod.yaml
+└── templates/
+  ├── _helpers.tpl
+  ├── deployment.yaml
+  ├── service.yaml
+  ├── hooks/pre-install-job.yaml
+  └── hooks/post-install-job.yaml
+```
+
+### Files and their purpose
+charts/: Directory containing any dependencies
+
+
+Chart.yaml:
+- This file contains metadata about the Helm chart
+Purpose:
+- Defines chart name, version, and description
+- Specifies chart type (application or library)
+- Provides application version
+
+
+values.yaml:
+- The values.yaml file defines default configuration values used across templates.
+Purpose:
+
+- Centralized configuration management
+- Allows easy customization without modifying templates
+- Supports overrides via CLI or environment-specific files
+
+_helpers.tpl:
+- Contains reusable template definitions.
+Purpose:
+- Avoid duplication
+- Standardize naming and labels
+- Improve maintainability
+
+deployment.yaml:
+- Defines the Kubernetes Deployment resource.
+Purpose:
+- Deploys the application pods
+- Configures replicas, rolling updates, and container settings
+- Uses values from values.yaml for dynamic configuration
+
+hooks/post-install-job.yaml:
+- Defines a Helm post-install hook
+Purpose:
+- Executes after installation completes
+- Used for smoke tests or notifications
+
+## Task 1
+
+```
+$ sudo apt install helm
+$ helm version
+version.BuildInfo{Version:"v4.1.3", GitCommit:"c94d381b03be117e7e57908edbf642104e00eb8f", GitTreeState:"clean", GoVersion:"go1.26.1", KubeClientVersion:"v1.35"}
+```
+
+I started by creating a Helm chart in the k8s/ directory for my application. To do this, I ran the following command:
+```
+helm create k8s/testiks
+```
+This generated the basic Helm chart structure with all the necessary files and directories. I then updated the Chart.yaml to include the metadata for my chart:
+```
+apiVersion: v2
+name: testiks
+description: Helm chart for py web application
+type: application
+version: 0.1.0
+appVersion: "1.0.0"
+```
+The name field is set to testiks, and I chose 0.1.0 as the chart version. The appVersion is set to "1.0.0" to represent the version of my Python app.
+
+Prometheus repo:
+```
+$ helm show chart prometheus-community/prometheus
+annotations:
+  artifacthub.io/license: Apache-2.0
+  artifacthub.io/links: |
+    - name: Chart Source
+      url: https://github.com/prometheus-community/helm-charts
+    - name: Upstream Project
+      url: https://github.com/prometheus/prometheus
+apiVersion: v2
+appVersion: v3.11.0
+dependencies:
+- condition: alertmanager.enabled
+  name: alertmanager
+  repository: https://prometheus-community.github.io/helm-charts
+  version: 1.34.*
+- condition: kube-state-metrics.enabled
+  name: kube-state-metrics
+  repository: https://prometheus-community.github.io/helm-charts
+  version: 7.2.*
+- condition: prometheus-node-exporter.enabled
+  name: prometheus-node-exporter
+  repository: https://prometheus-community.github.io/helm-charts
+  version: 4.52.*
+- condition: prometheus-pushgateway.enabled
+  name: prometheus-pushgateway
+  repository: https://prometheus-community.github.io/helm-charts
+  version: 3.6.*
+description: Prometheus is a monitoring system and time series database.
+home: https://prometheus.io/
+icon: https://raw.githubusercontent.com/prometheus/prometheus.github.io/master/assets/prometheus_logo-cb55bb5c346.png
+keywords:
+- monitoring
+- prometheus
+kubeVersion: '>=1.19.0-0'
+maintainers:
+- email: gianrubio@gmail.com
+  name: gianrubio
+  url: https://github.com/gianrubio
+- email: zanhsieh@gmail.com
+  name: zanhsieh
+  url: https://github.com/zanhsieh
+- email: miroslav.hadzhiev@gmail.com
+  name: Xtigyro
+  url: https://github.com/Xtigyro
+- email: naseem@transit.app
+  name: naseemkullah
+  url: https://github.com/naseemkullah
+- email: rootsandtrees@posteo.de
+  name: zeritti
+  url: https://github.com/zeritti
+name: prometheus
+sources:
+- https://github.com/prometheus/alertmanager
+- https://github.com/prometheus/prometheus
+- https://github.com/prometheus/pushgateway
+- https://github.com/prometheus/node_exporter
+- https://github.com/kubernetes/kube-state-metrics
+type: application
+version: 28.15.0
+```
+
+### Why Helm matters
+Helm simplifies Kubernetes application management by providing a package manager for deploying, managing, and scaling applications. It allows you to define reusable and customizable Kubernetes manifests using charts, making deployments consistent across environments. Helm also offers versioning, rollback capabilities, dependency management, and automation, ensuring easier and more reliable application management on Kubernetes.
+
+## Task 2
+
+Important Values:
+- replicaCount: number of pod replicas
+- image.repository / image.tag: container image source
+- containerPort: container listening port
+- service.type: NodePort for local access, LoadBalancer for production-style exposure
+- service.nodePort: fixed local NodePort for dev install
+- resources.requests / resources.limits: scheduler and runtime resource boundaries
+- livenessProbe / readinessProbe: health-check timings and paths
+- hooks.deleteAfterSuccess: removes the hook Jobs once they succeed
+
+### Environment Customization
+
+Two environment-specific configuration files are used:
+- Development (values-dev.yaml)
+    - 1 replica
+    - Lower resource usage
+    - NodePort service
+    - Latest image tag
+
+- Production (values-prod.yaml)
+    - 5 replicas
+    - Higher resource limits
+    - LoadBalancer service
+    - Fixed image version
+
+### Install example
+Development:
+```
+helm install testiks . -f values-dev.yaml
+```
+Production:
+```
+helm upgrade testiks . -f values-prod.yaml
+```
+
+## Task 3
+
+Two Helm hooks are implemented:
+1. Pre-install Hook
+- Runs before chart installation
+- Purpose: simulate pre-deployment validation
+
+2. Post-install Hook
+- Runs after deployment
+- Purpose: simulate smoke testing
+
+| | Pre-install | Post-install |
+|---|-------------|--------------|
+| Kind | Job | Job |
+| `helm.sh/hook` | `pre-install` | `post-install` |
+| `helm.sh/hook-weight` | `-5` | `5` |
+| `helm.sh/hook-delete-policy` | includes `hook-succeeded` when `hooks.deleteAfterSuccess` is true; otherwise `before-hook-creation` | same |
+
+
+### Operations
+```
+helm uninstall dev -n lab10-dev
+helm uninstall prod -n lab10-prod
+helm upgrade dev ./k8s/testiks -f k8s/testiks/values-dev.yaml -n lab10-dev
+helm history dev -n lab10-dev
+helm rollback dev <rev> -n lab10-dev
+```
+
+## Installation evidence
+
+```text
+$ helm lint ./k8s/testiks
+==> Linting ./k8s/testiks
+[INFO] Chart.yaml: icon is recommended
+1 chart(s) linted, 0 chart(s) failed
+```
+
+```text
+$ kubectl config current-context
+minikube
+
+$ kubectl cluster-info
+Kubernetes control plane is running at https://127.0.0.1:65035
+CoreDNS is running at https://127.0.0.1:65035/api/v1/namespaces/kube-system/services/kube-dns:dns/proxy
+
+$ kubectl get nodes
+NAME       STATUS   ROLES           AGE   VERSION
+minikube   Ready    control-plane   8d    v1.32.0
+```
+
+```bash
+helm template dev ./k8s/testiks -f k8s/testiks/values-dev.yaml -n lab10-dev
+helm template prod ./k8s/testiks -f k8s/testiks/values-prod.yaml -n lab10-prod
+```
+
+```text
+$ helm template dev ./k8s/testiks -f k8s/testiks/values-dev.yaml -n lab10-dev 2>&1 | head -42
+---
+# Source: testiks/templates/deployment.yaml
+apiVersion: apps/v1
+kind: Deployment
+metadata:
+  name: dev-testiks
+  labels:
+    helm.sh/chart: testiks-0.1.0
+    app.kubernetes.io/name: testiks
+    app.kubernetes.io/instance: dev
+    app.kubernetes.io/version: "1.0.0"
+    app.kubernetes.io/managed-by: Helm
+spec:
+  replicas: 1
+  selector:
+    matchLabels:
+      app.kubernetes.io/name: testiks
+      app.kubernetes.io/instance: dev
+  strategy:
+    type: RollingUpdate
+    rollingUpdate:
+      maxSurge: 1
+      maxUnavailable: 0
+  template:
+    metadata:
+      labels:
+        app.kubernetes.io/name: testiks
+        app.kubernetes.io/instance: dev
+    spec:
+      containers:
+        - name: testiks
+          image: "cacucoh/testiks:latest"
+          imagePullPolicy: Always
+          ports:
+            - name: http
+              containerPort: 5000
+              protocol: TCP
+```
+
+```text
+$ helm install dev ./k8s/testiks \
+  -f k8s/testiks/values-dev.yaml \
+  --namespace lab10-dev --create-namespace
+NAME: dev
+LAST DEPLOYED: Thu Apr  2 19:39:50 2026
+NAMESPACE: lab10-dev
+STATUS: deployed
+REVISION: 1
+TEST SUITE: None
+NOTES:
+1. Get the application URL by running these commands:
+  export NODE_PORT=$(kubectl get --namespace lab10-dev -o jsonpath="{.spec.ports[0].nodePort}" services dev-testiks)
+  export NODE_IP=$(kubectl get nodes --namespace lab10-dev -o jsonpath="{.items[0].status.addresses[0].address}")
+  echo http://$NODE_IP:$NODE_PORT/health
+
+Release: dev
+Namespace: lab10-dev
+```
+
+```text
+$ helm list -n lab10-dev
+NAME    NAMESPACE       REVISION        UPDATED                                 STATUS        CHART                            APP VERSION
+dev     lab10-dev       1               2026-04-02 19:39:50.110994 +0300 MSK    deployed      testiks-0.1.0        1.0.0
+```
+
+```text
+$ kubectl get all -n lab10-dev
+NAME                                           READY   STATUS    RESTARTS   AGE
+pod/dev-testiks-84579bd9bb-8mnkp   1/1     Running   0          62s
+
+NAME                              TYPE       CLUSTER-IP       EXTERNAL-IP   PORT(S)        AGE
+service/dev-testiks   NodePort   10.103.117.200   <none>        80:30081/TCP   62s
+
+NAME                                      READY   UP-TO-DATE   AVAILABLE   AGE
+deployment.apps/dev-testiks   1/1     1            1           62s
+
+NAME                                                 DESIRED   CURRENT   READY   AGE
+replicaset.apps/dev-testiks-84579bd9bb   1         1         1       62s
+```
+
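+With the default `hooks.deleteAfterSuccess: true`, hook Jobs are removed after they succeed, so `kubectl get jobs` returns nothing. To keep the Jobs for inspection, reinstall with an extra values file (`values-hooks-keep.yaml`, which is expected to set `hooks.deleteAfterSuccess: false`):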
+
+```bash
+helm uninstall dev -n lab10-dev
+helm install dev ./k8s/testiks \
+  -f k8s/testiks/values-dev.yaml \
+  -f k8s/testiks/values-hooks-keep.yaml \
+  --namespace lab10-dev
+kubectl get jobs -n lab10-dev
+kubectl describe job dev-testiks-pre-install -n lab10-dev
+kubectl describe job dev-testiks-post-install -n lab10-dev
+kubectl logs -n lab10-dev job/dev-testiks-pre-install
+kubectl logs -n lab10-dev job/dev-testiks-post-install
+```
+
+```text
+$ helm install dev ./k8s/testiks \
+  -f k8s/testiks/values-dev.yaml \
+  -f k8s/testiks/values-hooks-keep.yaml \
+  --namespace lab10-dev
+NAME: dev
+LAST DEPLOYED: Thu Apr  2 19:48:28 2026
+NAMESPACE: lab10-dev
+STATUS: deployed
+REVISION: 1
+```
+
+```text
+$ kubectl get jobs -n lab10-dev
+NAME                                   STATUS     COMPLETIONS   DURATION   AGE
+dev-testiks-post-install   Complete   1/1           4s         12s
+dev-testiks-pre-install    Complete   1/1           3s         15s
+```
+
+```text
+$ kubectl describe job dev-testiks-pre-install -n lab10-dev
+Name:             dev-testiks-pre-install
+Namespace:        lab10-dev
+Selector:         batch.kubernetes.io/controller-uid=b3df58aa-361f-48fd-8b38-934fa4dbe167
+Labels:           app.kubernetes.io/instance=dev
+                  app.kubernetes.io/managed-by=Helm
+                  app.kubernetes.io/name=testiks
+                  app.kubernetes.io/version=1.0.0
+                  helm.sh/chart=testiks-0.1.0
+Annotations:      helm.sh/hook: pre-install
+                  helm.sh/hook-weight: -5
+Parallelism:      1
+Completions:      1
+Completion Mode:  NonIndexed
+Suspend:          false
+Backoff Limit:    2
+Start Time:       Thu, 02 Apr 2026 19:48:28 +0300
+Completed At:     Thu, 02 Apr 2026 19:48:31 +0300
+Duration:         3s
+Pods Statuses:    0 Active (0 Ready) / 1 Succeeded / 0 Failed
+Pod Template:
+  Labels:  app.kubernetes.io/managed-by=Helm
+           batch.kubernetes.io/controller-uid=b3df58aa-361f-48fd-8b38-934fa4dbe167
+           batch.kubernetes.io/job-name=dev-testiks-pre-install
+           controller-uid=b3df58aa-361f-48fd-8b38-934fa4dbe167
+           helm.sh/hook=pre-install
+           job-name=dev-testiks-pre-install
+  Containers:
+   pre-install:
+    Image:      busybox:1.36
+    Command:
+      sh
+      -c
+      set -e
+      echo "pre-install: release=dev ns=lab10-dev"
+      echo "pre-install OK"
+    Environment:   <none>
+    Mounts:        <none>
+  Volumes:         <none>
+  Node-Selectors:  <none>
+  Tolerations:     <none>
+Events:
+  Type    Reason            Age   From            Message
+  ----    ------            ----  ----            -------
+  Normal  SuccessfulCreate  22s   job-controller  Created pod: dev-testiks-pre-install-q8xgb
+  Normal  Completed         19s   job-controller  Job completed
+```
+
+```text
+$ kubectl logs -n lab10-dev job/dev-testiks-pre-install
+pre-install: release=dev ns=lab10-dev
+pre-install OK
+```
+
+```text
+$ kubectl logs -n lab10-dev job/dev-testiks-post-install
+post-install: smoke GET http://dev-testiks.lab10-dev.svc.cluster.local:80/health
+{"status":"healthy","timestamp":"2026-04-02T16:48:32.488027+00:00","uptime_seconds":507}
+post-install OK
+```
+
+Production install (`values-prod.yaml`):
+
+```text
+$ helm list -n lab10-prod
+NAME    NAMESPACE       REVISION        UPDATED                                 STATUS  CHART                          APP VERSION
+prod    lab10-prod      1               2026-04-02 19:51:57.134345 +0300 MSK    failed  testiks-0.1.0      1.0.0
+```
+
+```text
+$ kubectl get all -n lab10-prod
+NAME                                              READY   STATUS      RESTARTS   AGE
+pod/prod-testiks-05dff54df9-b77f4     0/1     Running     0          40s
+pod/prod-testiks-05dff54df9-lf2j2     0/1     Running     0          40s
+pod/prod-testiks-05dff54df9-q54dt     0/1     Running     0          40s
+pod/prod-testiks-05dff54df9-sw95m     1/1     Running     0          40s
+pod/prod-testiks-05dff54df9-z45wb     1/1     Running     0          40s
+pod/prod-testiks-post-install-t4c9p   0/1     Completed   0          40s
+
+NAME                               TYPE           CLUSTER-IP       EXTERNAL-IP   PORT(S)        AGE
+service/prod-testiks   LoadBalancer   10.103.135.218   <pending>     80:31854/TCP   40s
+
+NAME                                       READY   UP-TO-DATE   AVAILABLE   AGE
+deployment.apps/prod-testiks   2/5     5            2           40s
+
+NAME                                                  DESIRED   CURRENT   READY   AGE
+replicaset.apps/prod-testiks-05dff54df9   5         5         2       40s
+
+NAME                                              STATUS     COMPLETIONS   DURATION   AGE
+job.batch/prod-testiks-post-install   Complete   1/1           30s        40s
+```
+
+```text
+$ kubectl get svc -n lab10-prod
+NAME                       TYPE           CLUSTER-IP       EXTERNAL-IP   PORT(S)        AGE
+prod-testiks   LoadBalancer   10.103.135.218   <pending>     80:31854/TCP   47s
+```
+
+```bash
+kubectl port-forward -n lab10-prod svc/prod-testiks 8080:80
+```
+
+```text
+$ kubectl rollout status deployment/prod-testiks -n lab10-prod
+deployment "prod-testiks" successfully rolled out
+
+$ helm upgrade prod ./k8s/testiks -f k8s/testiks/values-prod.yaml -n lab10-prod
+Release "prod" has been upgraded. Happy Helming!
+NAME: prod
+LAST DEPLOYED: Thu Apr  2 19:54:16 2026
+NAMESPACE: lab10-prod
+STATUS: deployed
+REVISION: 2
+TEST SUITE: None
+NOTES:
+1. Get the application URL by running these commands:
+  NOTE: It may take a few minutes for the LoadBalancer IP to be available.
+        Watch status: kubectl get svc -w prod-testiks
+  export SERVICE_IP=$(kubectl get svc --namespace lab10-prod prod-testiks -o jsonpath='{.status.loadBalancer.ingress[0].ip}')
+  echo http://$SERVICE_IP:80/health
+
+Release: prod
+Namespace: lab10-prod
+```
+
+The following `helm list -A` was captured before `helm upgrade prod`; the upgrade transcript above records `prod` at revision 2 `deployed`.
+
+```text
+$ helm list -A
+NAME    NAMESPACE       REVISION        UPDATED                                 STATUS        CHART                            APP VERSION
+dev     default         1               2026-04-02 19:38:26.499655 +0300 MSK    failed        testiks-0.1.0        1.0.0
+dev     lab10-dev       1               2026-04-02 19:48:28.029525 +0300 MSK    deployed      testiks-0.1.0        1.0.0
+prod    lab10-prod      1               2026-04-02 19:51:57.134345 +0300 MSK    failed        testiks-0.1.0        1.0.0
+```
+
+```bash
+helm uninstall dev -n default
+```
+
+## Testing and validation
+
+```bash
+helm lint ./k8s/testiks
+helm template dev ./k8s/testiks -f k8s/testiks/values-dev.yaml -n lab10-dev
+helm install dev-dryrun ./k8s/testiks \
+  -f k8s/testiks/values-dev.yaml \
+  --namespace lab-dryrun --create-namespace \
+  --dry-run=client
+```
+
+```text
+$ helm install dev-dryrun ./k8s/testiks \
+  -f k8s/testiks/values-dev.yaml \
+  --namespace lab-dryrun --create-namespace \
+  --dry-run=client 2>&1 | head -80
+NAME: dev-dryrun
+LAST DEPLOYED: Thu Apr  2 19:53:17 2026
+NAMESPACE: lab-dryrun
+STATUS: pending-install
+REVISION: 1
+TEST SUITE: None
+HOOKS:
+---
+# Source: testiks/templates/hooks/post-install-job.yaml
+apiVersion: batch/v1
+kind: Job
+metadata:
+  name: dev-dryrun-testiks-post-install
+  annotations:
+    helm.sh/hook: post-install
+    helm.sh/hook-weight: "5"
+    helm.sh/hook-delete-policy: hook-succeeded
+  labels:
+    helm.sh/chart: testiks-0.1.0
+    app.kubernetes.io/name: testiks
+    app.kubernetes.io/instance: dev-dryrun
+    app.kubernetes.io/version: "1.0.0"
+    app.kubernetes.io/managed-by: Helm
+spec:
+  backoffLimit: 3
+  template:
+    metadata:
+      labels:
+        app.kubernetes.io/managed-by: Helm
+        helm.sh/hook: post-install
+    spec:
+      restartPolicy: Never
+      containers:
+        - name: post-install
+          image: "curlimages/curl:8.5.0"
+          command:
+            - sh
+            - -c
+            - |
+              set -e
+              URL="http://dev-dryrun-testiks.lab-dryrun.svc.cluster.local:80/health"
+              echo "post-install: smoke GET $URL"
+              i=0
+              while [ "$i" -lt 30 ]; do
+                if curl -fsS --connect-timeout 3 --max-time 10 "$URL"; then
+                  echo "post-install OK"
+                  exit 0
+                fi
+                i=$((i + 1))
+                echo "post-install: retry $i/30"
+                sleep 2
+              done
+              echo "post-install: health check failed" >&2
+              exit 1
+```
+
+```text
+$ curl -sS -i localhost:8080/health
+
+HTTP/1.1 200 OK
+Server: Werkzeug/3.1.7 Python/3.13.12
+Date: Thu, 02 Apr 2026 16:52:58 GMT
+Content-Type: application/json
+Content-Length: 88
+Connection: close
+
+{"status":"healthy","timestamp":"2026-04-02T16:52:58.654555+00:00","uptime_seconds":41}
+```
+
+```bash
+curl "$(minikube service dev-testiks -n lab10-dev --url)/health"
+```
\ No newline at end of file
diff --git a/k8s/testiks/deployment.yml b/k8s/testiks/deployment.yml
new file mode 100644
index 0000000000..78ec4c61c1
--- /dev/null
+++ b/k8s/testiks/deployment.yml
@@ -0,0 +1,73 @@
+apiVersion: apps/v1  # NOTE(review): plain manifest in the chart root; Helm renders only templates/
+kind: Deployment
+metadata:
+  name: testiks
+  labels:
+    app: testiks
+    app.kubernetes.io/name: testiks
+    app.kubernetes.io/component: web
+    app.kubernetes.io/part-of: devops-core-course
+spec:
+  replicas: 3
+  minReadySeconds: 5  # a new pod must stay ready this long before it counts as available
+  revisionHistoryLimit: 5  # old ReplicaSets kept for rollback
+  selector:
+    matchLabels:
+      app: testiks  # must match the pod template labels below
+  strategy:
+    type: RollingUpdate
+    rollingUpdate:
+      maxSurge: 1  # at most one extra pod during a rollout
+      maxUnavailable: 0  # never go below the desired replica count
+  template:
+    metadata:
+      labels:
+        app: testiks
+        app.kubernetes.io/name: testiks
+        app.kubernetes.io/component: web
+        app.kubernetes.io/part-of: devops-core-course
+    spec:
+      securityContext:
+        seccompProfile:
+          type: RuntimeDefault  # container runtime's default seccomp filter
+      containers:
+        - name: testiks
+          image: testiks:lab09  # NOTE(review): no registry prefix — presumably a locally loaded image; confirm
+          imagePullPolicy: IfNotPresent
+          ports:
+            - name: http
+              containerPort: 5000
+          env:
+            - name: PORT
+              value: "5000"
+          resources:
+            requests:
+              cpu: 100m
+              memory: 128Mi
+            limits:
+              cpu: 250m
+              memory: 256Mi
+          securityContext:
+            runAsUser: 10001
+            runAsGroup: 10001
+            runAsNonRoot: true
+            allowPrivilegeEscalation: false
+            capabilities:
+              drop:
+                - ALL
+          readinessProbe:
+            httpGet:
+              path: /health
+              port: http  # the named container port declared above
+            initialDelaySeconds: 5
+            periodSeconds: 5
+            timeoutSeconds: 2
+            failureThreshold: 3
+          livenessProbe:
+            httpGet:
+              path: /health
+              port: http  # the named container port declared above
+            initialDelaySeconds: 15
+            periodSeconds: 10
+            timeoutSeconds: 2
+            failureThreshold: 3
\ No newline at end of file
diff --git a/k8s/testiks/service.yml b/k8s/testiks/service.yml
new file mode 100644
index 0000000000..e55c7b045a
--- /dev/null
+++ b/k8s/testiks/service.yml
@@ -0,0 +1,19 @@
+apiVersion: v1  # NOTE(review): plain manifest in the chart root; Helm renders only templates/
+kind: Service
+metadata:
+  name: testiks
+  labels:
+    app: testiks
+    app.kubernetes.io/name: testiks
+    app.kubernetes.io/component: web
+    app.kubernetes.io/part-of: devops-core-course
+spec:
+  type: NodePort
+  selector:
+    app: testiks  # traffic goes to pods carrying this label
+  ports:
+    - name: http
+      protocol: TCP
+      port: 80
+      targetPort: http  # resolved to the pod's container port named "http"
+      nodePort: 30080  # the chart's values.yaml uses 30081 instead
\ No newline at end of file
diff --git a/k8s/testiks/templates/NOTES.txt b/k8s/testiks/templates/NOTES.txt
new file mode 100644
index 0000000000..43246accac
--- /dev/null
+++ b/k8s/testiks/templates/NOTES.txt
@@ -0,0 +1,14 @@
+1. Get the application URL by running these commands:
+{{- if eq .Values.service.type "NodePort" }}
+  export NODE_PORT=$(kubectl get --namespace {{ .Release.Namespace }} -o jsonpath="{.spec.ports[0].nodePort}" services {{ include "testiks.fullname" . }})
+  export NODE_IP=$(kubectl get nodes --namespace {{ .Release.Namespace }} -o jsonpath="{.items[0].status.addresses[0].address}")
+  echo http://$NODE_IP:$NODE_PORT/health
+{{- else if eq .Values.service.type "LoadBalancer" }}
+  NOTE: It may take a few minutes for the LoadBalancer IP to be available.
+        Watch status: kubectl get svc --namespace {{ .Release.Namespace }} -w {{ include "testiks.fullname" . }}
+  export SERVICE_IP=$(kubectl get svc --namespace {{ .Release.Namespace }} {{ include "testiks.fullname" . }} -o jsonpath='{.status.loadBalancer.ingress[0].ip}')
+  echo http://$SERVICE_IP:{{ .Values.service.port }}/health
+{{- end }}
+
+Release: {{ .Release.Name }}
+Namespace: {{ .Release.Namespace }}
diff --git a/k8s/testiks/templates/_helpers.tpl b/k8s/testiks/templates/_helpers.tpl
new file mode 100644
index 0000000000..3c2a31c442
--- /dev/null
+++ b/k8s/testiks/templates/_helpers.tpl
@@ -0,0 +1,43 @@
+{{/*
+Expand the name of the chart: .Values.nameOverride when set, otherwise .Chart.Name, truncated to 63 characters with a trailing "-" removed.
+*/}}
+{{- define "testiks.name" -}}
+{{- default .Chart.Name .Values.nameOverride | trunc 63 | trimSuffix "-" }}
+{{- end }}
+
+{{/*
+Create a default fully qualified app name: .Values.fullnameOverride when set, otherwise "<release name>-<chart name or nameOverride>"; either form is truncated to 63 characters with a trailing "-" removed.
+*/}}
+{{- define "testiks.fullname" -}}
+{{- if .Values.fullnameOverride }}
+{{- .Values.fullnameOverride | trunc 63 | trimSuffix "-" }}
+{{- else }}
+{{- $name := default .Chart.Name .Values.nameOverride }}
+{{- printf "%s-%s" .Release.Name $name | trunc 63 | trimSuffix "-" }}
+{{- end }}
+{{- end }}
+
+{{/*
+Create chart name and version as used by the chart label: "<chart name>-<chart version>" with "+" replaced by "_", truncated to 63 characters with a trailing "-" removed.
+*/}}
+{{- define "testiks.chart" -}}
+{{- printf "%s-%s" .Chart.Name .Chart.Version | replace "+" "_" | trunc 63 | trimSuffix "-" }}
+{{- end }}
+
+{{/*
+Common labels: the chart label, the selector labels, the quoted app version and the managing service; used for metadata.labels of the Deployment, the Service and the hook Jobs.
+*/}}
+{{- define "testiks.labels" -}}
+helm.sh/chart: {{ include "testiks.chart" . }}
+{{ include "testiks.selectorLabels" . }}
+app.kubernetes.io/version: {{ .Chart.AppVersion | quote }}
+app.kubernetes.io/managed-by: {{ .Release.Service }}
+{{- end }}
+
+{{/*
+Selector labels (chart name plus release instance): used for the Deployment selector, the pod template labels and the Service selector.
+*/}}
+{{- define "testiks.selectorLabels" -}}
+app.kubernetes.io/name: {{ include "testiks.name" . }}
+app.kubernetes.io/instance: {{ .Release.Name }}
+{{- end }}
diff --git a/k8s/testiks/templates/deployment.yaml b/k8s/testiks/templates/deployment.yaml
new file mode 100644
index 0000000000..09bcf9acc8
--- /dev/null
+++ b/k8s/testiks/templates/deployment.yaml
@@ -0,0 +1,46 @@
+apiVersion: apps/v1
+kind: Deployment
+metadata:
+  name: {{ include "testiks.fullname" . }}
+  labels:
+    {{- include "testiks.labels" . | nindent 4 }}
+spec:
+  replicas: {{ .Values.replicaCount }}
+  selector:
+    matchLabels:
+      {{- include "testiks.selectorLabels" . | nindent 6 }}
+  strategy:
+    type: RollingUpdate
+    rollingUpdate:
+      maxSurge: 1  # at most one extra pod during a rollout
+      maxUnavailable: 0  # never go below the desired replica count
+  template:
+    metadata:
+      labels:
+        {{- include "testiks.selectorLabels" . | nindent 8 }}
+    spec:
+      securityContext:
+        seccompProfile:
+          type: RuntimeDefault
+      containers:
+        - name: {{ .Chart.Name }}
+          image: "{{ .Values.image.repository }}:{{ .Values.image.tag | default .Chart.AppVersion }}"  # tag falls back to the chart's appVersion
+          imagePullPolicy: {{ .Values.image.pullPolicy }}
+          ports:
+            - name: http  # port name the Service's targetPort refers to
+              containerPort: {{ .Values.containerPort }}
+              protocol: TCP
+          resources:
+            {{- toYaml .Values.resources | nindent 12 }}
+          securityContext:
+            runAsUser: 10001
+            runAsGroup: 10001
+            runAsNonRoot: true
+            allowPrivilegeEscalation: false
+            capabilities:
+              drop:
+                - ALL
+          livenessProbe:
+            {{- toYaml .Values.livenessProbe | nindent 12 }}
+          readinessProbe:
+            {{- toYaml .Values.readinessProbe | nindent 12 }}
diff --git a/k8s/testiks/templates/hooks/post-install-job.yaml b/k8s/testiks/templates/hooks/post-install-job.yaml
new file mode 100644
index 0000000000..99eb9ae2e4
--- /dev/null
+++ b/k8s/testiks/templates/hooks/post-install-job.yaml
@@ -0,0 +1,41 @@
+apiVersion: batch/v1
+kind: Job  # post-install hook: smoke test that polls the Service's /health endpoint
+metadata:
+  name: "{{ include "testiks.fullname" . }}-post-install"
+  labels:
+    {{- include "testiks.labels" . | nindent 4 }}
+  annotations:
+    "helm.sh/hook": post-install
+    "helm.sh/hook-weight": "5"
+    "helm.sh/hook-delete-policy": "before-hook-creation{{ if .Values.hooks.deleteAfterSuccess }},hook-succeeded{{ end }}"  # always replace a Job left over from a failed run
+spec:
+  backoffLimit: 3
+  template:
+    metadata:
+      labels:
+        app.kubernetes.io/managed-by: Helm
+        helm.sh/hook: post-install
+    spec:
+      restartPolicy: Never
+      containers:
+        - name: post-install
+          image: "curlimages/curl:8.5.0"
+          command:
+            - sh
+            - -c
+            - |
+              set -e
+              URL="http://{{ include "testiks.fullname" . }}.{{ .Release.Namespace }}.svc.cluster.local:{{ .Values.service.port }}/health"
+              echo "post-install: smoke GET $URL"
+              i=0
+              while [ "$i" -lt 30 ]; do
+                if curl -fsS --connect-timeout 3 --max-time 10 "$URL"; then
+                  echo "post-install OK"
+                  exit 0
+                fi
+                i=$((i + 1))
+                echo "post-install: retry $i/30"
+                sleep 2
+              done
+              echo "post-install: health check failed" >&2
+              exit 1
diff --git a/k8s/testiks/templates/hooks/pre-install-job.yaml b/k8s/testiks/templates/hooks/pre-install-job.yaml
new file mode 100644
index 0000000000..08c582166f
--- /dev/null
+++ b/k8s/testiks/templates/hooks/pre-install-job.yaml
@@ -0,0 +1,29 @@
+apiVersion: batch/v1
+kind: Job  # pre-install hook: prints the release name and namespace, then exits
+metadata:
+  name: "{{ include "testiks.fullname" . }}-pre-install"
+  labels:
+    {{- include "testiks.labels" . | nindent 4 }}
+  annotations:
+    "helm.sh/hook": pre-install
+    "helm.sh/hook-weight": "-5"
+    "helm.sh/hook-delete-policy": "before-hook-creation{{ if .Values.hooks.deleteAfterSuccess }},hook-succeeded{{ end }}"  # always replace a Job left over from a failed run
+spec:
+  backoffLimit: 2
+  template:
+    metadata:
+      labels:
+        app.kubernetes.io/managed-by: Helm
+        helm.sh/hook: pre-install
+    spec:
+      restartPolicy: Never
+      containers:
+        - name: pre-install
+          image: busybox:1.36
+          command:
+            - sh
+            - -c
+            - |
+              set -e
+              echo "pre-install: release={{ .Release.Name }} ns={{ .Release.Namespace }}"
+              echo "pre-install OK"
diff --git a/k8s/testiks/templates/service.yaml b/k8s/testiks/templates/service.yaml
new file mode 100644
index 0000000000..f3299537b5
--- /dev/null
+++ b/k8s/testiks/templates/service.yaml
@@ -0,0 +1,18 @@
+apiVersion: v1
+kind: Service
+metadata:
+  name: {{ include "testiks.fullname" . }}
+  labels:
+    {{- include "testiks.labels" . | nindent 4 }}
+spec:
+  type: {{ .Values.service.type }}
+  selector:
+    {{- include "testiks.selectorLabels" . | nindent 4 }}
+  ports:
+    - name: http
+      protocol: TCP
+      port: {{ .Values.service.port }}
+      targetPort: http  # the Deployment's named container port, not .Values.service.targetPort
+      {{- if and (eq .Values.service.type "NodePort") .Values.service.nodePort }}
+      nodePort: {{ .Values.service.nodePort }}  # only pinned for NodePort services with a value set
+      {{- end }}
diff --git a/k8s/testiks/values-dev.yaml b/k8s/testiks/values-dev.yaml
new file mode 100644
index 0000000000..47363925f6
--- /dev/null
+++ b/k8s/testiks/values-dev.yaml
@@ -0,0 +1,25 @@
+replicaCount: 1
+
+image:
+  tag: "latest"  # mutable tag, paired with pullPolicy: Always below
+  pullPolicy: Always
+
+service:
+  type: NodePort
+  nodePort: 30081
+
+resources:
+  requests:
+    cpu: 50m
+    memory: 64Mi
+  limits:
+    cpu: 100m
+    memory: 128Mi
+
+livenessProbe:  # only timings are overridden; httpGet is merged in from values.yaml
+  initialDelaySeconds: 5
+  periodSeconds: 10
+
+readinessProbe:  # only timings are overridden; httpGet is merged in from values.yaml
+  initialDelaySeconds: 3
+  periodSeconds: 5
diff --git a/k8s/testiks/values-prod.yaml b/k8s/testiks/values-prod.yaml
new file mode 100644
index 0000000000..10ecf11523
--- /dev/null
+++ b/k8s/testiks/values-prod.yaml
@@ -0,0 +1,24 @@
+replicaCount: 5
+
+image:
+  tag: "1.0.0"  # pinned release tag
+  pullPolicy: IfNotPresent
+
+service:
+  type: LoadBalancer  # templates/service.yaml sets nodePort only for NodePort, so the default nodePort is ignored
+
+resources:
+  requests:
+    cpu: 200m
+    memory: 256Mi
+  limits:
+    cpu: 500m
+    memory: 512Mi
+
+livenessProbe:  # only timings are overridden; httpGet is merged in from values.yaml
+  initialDelaySeconds: 30
+  periodSeconds: 5
+
+readinessProbe:  # only timings are overridden; httpGet is merged in from values.yaml
+  initialDelaySeconds: 10
+  periodSeconds: 3
diff --git a/k8s/testiks/values.yaml b/k8s/testiks/values.yaml
new file mode 100644
index 0000000000..c413a1e7f2
--- /dev/null
+++ b/k8s/testiks/values.yaml
@@ -0,0 +1,43 @@
+replicaCount: 3  # chart defaults; values-dev.yaml and values-prod.yaml override a subset of these keys
+
+image:
+  repository: cacucoh/testiks
+  tag: "1.0.0"  # quoted so the version stays a string
+  pullPolicy: IfNotPresent
+
+containerPort: 5000  # same number as the probe ports below
+
+service:
+  type: NodePort
+  port: 80  # rendered as the Service port in templates/service.yaml
+  targetPort: 5000  # NOTE(review): templates/service.yaml targets the named port "http" and does not read this key - confirm it is used elsewhere
+  nodePort: 30081  # used by templates/service.yaml only while type is NodePort
+
+resources:
+  requests:
+    cpu: 100m
+    memory: 128Mi
+  limits:
+    cpu: 250m
+    memory: 256Mi
+
+livenessProbe:
+  httpGet:
+    path: /health
+    port: 5000  # numeric port, matches containerPort above
+  initialDelaySeconds: 15
+  periodSeconds: 10
+  timeoutSeconds: 2
+  failureThreshold: 3
+
+readinessProbe:
+  httpGet:
+    path: /health  # same endpoint as the liveness probe
+    port: 5000
+  initialDelaySeconds: 5
+  periodSeconds: 5
+  timeoutSeconds: 2
+  failureThreshold: 3
+
+hooks:
+  deleteAfterSuccess: true  # presumably read by the hook templates to set a delete policy - confirm
diff --git a/lab1.md b/lab1.md
deleted file mode 100644
index 30b74c95f5..0000000000
--- a/lab1.md
+++ /dev/null
@@ -1,65 +0,0 @@
-# Lab 1: Web Application Development
-
-## Overview
-
-In this lab assignment, you will develop a simple web application using Python and best practices. You will also have the opportunity to create a bonus web application using a different programming language. Follow the tasks below to complete the lab assignment.
-
-## Task 1: Python Web Application
-
-**6 Points:**
-
-1. Create `app_python` Folder:
-   - Create a folder named `app_python` to contain your Python web application files.
-   - Inside the `app_python` folder, create a file named `PYTHON.md`.
-
-2. Develop and Test Python Web Application:
-   - Develop a Python web application that displays the current time in Moscow.
-   - Choose a suitable framework for your web application and justify your choice in the `PYTHON.md` file.
-   - Implement best practices in your code and follow coding standards.
-   - Test your application to ensure the displayed time updates upon page refreshing.
-
-## Task 2: Well Decorated Description
-
-**4 Points:**
-
-1. Update `PYTHON.md`:
-   - Describe best practices applied in the web application.
-   - Explain how you followed coding standards, implemented testing, and ensured code quality.
-
-2. Create `README.md` in `app_python` folder:
-   - Use a Markdown template to document the Python web application.
-
-3. Ensure:
-   - Maintain a clean `.gitignore` file.
-   - Use a concise `requirements.txt` file for required dependencies.
-
-### List of Requirements
-
-- MSK Time timezone set up
-- 2 PRs created
-- README includes Overview
-- Nice Markdown decoration
-- Local installation details in README
-
-## Bonus Task: Additional Web Application
-
-**2.5 Points:**
-
-1. Create `app_*` Folder:
-   - Create a folder named `app_*` in the main project directory, replacing `*` with a programming language of your choice (other than Python).
-   - Inside the `app_*` folder, create a file named `*.md`.
-
-2. Develop Your Own Web App:
-   - Create a web application using the programming language you chose.
-   - Decide what your web application will display or do, and use your creativity.
-
-3. Follow Main Task Steps:
-   - Implement your bonus web application following the same suggestions and steps as the main Python web application task.
-
-### Guidelines
-
-- Use proper Markdown formatting and structure for the documentation files. We will use [online one](https://dlaa.me/markdownlint/) to check your `.md` files.
-- Organize the files within the lab folder using appropriate naming conventions.
-- Create a PR from your fork to the master branch of this repository and from your fork's branch to your fork's master branch with your completed lab assignment.
-
-> Note: Apply best practices, coding standards, and testing to your Python web application. Explore creativity in your bonus web application, and document your process using Markdown.
diff --git a/lab10.md b/lab10.md
deleted file mode 100644
index c472086168..0000000000
--- a/lab10.md
+++ /dev/null
@@ -1,91 +0,0 @@
-# Lab 10: Introduction to Helm
-
-## Overview
-
-In this lab, you will become familiar with Helm, set up a local development environment, and generate manifests for your application.
-
-## Task 1: Helm Setup and Chart Creation
-
-**6 Points:**
-
-1. Learn About Helm:
-   - Begin by exploring the architecture and concepts of Helm:
-     - [Helm Architecture](https://helm.sh/docs/topics/architecture/)
-     - [Understanding Helm Charts](https://helm.sh/docs/topics/charts/)
-
-2. Install Helm:
-   - Install Helm using the instructions provided:
-     - [Helm Installation](https://helm.sh/docs/intro/install/)
-     - [Chart Repository Initialization](https://helm.sh/docs/intro/quickstart/#initialize-a-helm-chart-repository)
-
-3. Create Your Own Helm Chart:
-   - Generate a Helm chart for your application.
-     - Inside the `k8s` folder, create a Helm chart template by using the command `helm create your-app`.
-     - Replace the default repository and tag inside the `values.yaml` file with your repository name.
-     - Modify the `containerPort` setting in the `deployment.yml` file.
-     - If you encounter issues with `livenessProbe` and `readinessProbe`, you can comment them out.
-
-   > For troubleshooting, you can use the `minikube dashboard` command.
-
-4. Install Your Helm Chart:
-   - Install your custom Helm chart and ensure that all services are healthy. Verify this by checking the `Workloads` page in the Minikube dashboard.
-
-5. Access Your Application:
-   - Confirm that your application is accessible by running the `minikube service your_service_name` command.
-
-6. Create a HELM.md File:
-   - Construct a `HELM.md` file and provide the output of the `kubectl get pods,svc` command within it.
-
-## Task 2: Helm Chart Hooks
-
-**4 Points:**
-
-1. Learn About Chart Hooks:
-   - Familiarize yourself with [Helm Chart Hooks](https://helm.sh/docs/topics/charts_hooks/).
-
-2. Implement Helm Chart Hooks:
-   - Develop pre-install and post-install pods within your Helm chart, without adding any complex logic (e.g., use "sleep 20"). You can refer to [Example 1 in the guide](https://www.golinuxcloud.com/kubernetes-helm-hooks-examples/).
-
-3. Troubleshoot Hooks:
-   - Execute the following commands to troubleshoot your hooks:
-     1. `helm lint <your_chart_name>`
-     2. `helm install --dry-run helm-hooks <your_chart_name>`
-     3. `kubectl get po`
-
-4. Provide Output:
-   - Execute the following commands and include their output in your report:
-     1. `kubectl get po`
-     2. `kubectl describe po <preinstall_hook_name>`
-     3. `kubectl describe po <postinstall_hook_name>`
-
-5. Hook Delete Policy:
-   - Implement a hook delete policy to remove the hook once it has executed successfully.
-
-**List of Requirements:**
-
-- Helm Chart with Hooks implemented, including the hook delete policy.
-- Output of the `kubectl get pods,svc` command in `HELM.md`.
-- Output of all commands from the step 4 of Task 2 in `HELM.md`.
-
-## Bonus Task: Helm Library Chart
-
-**To Earn 2.5 Additional Points:**
-
-1. Helm Chart for Extra App:
-   - Prepare a Helm chart for an additional application.
-
-2. Helm Library Charts:
-   - Get acquainted with [Helm Library Charts](https://helm.sh/docs/topics/library_charts/).
-
-3. Create a Library Chart:
-   - Develop a simple library chart that includes a "labels" template. You can follow the steps outlined in [the Using Library Charts guide](https://austindewey.com/2020/08/17/how-to-reduce-helm-chart-boilerplate-with-library-charts/). Use this library chart for both of your applications.
-
-### Guidelines
-
-- Ensure your documentation is clear and well-structured.
-- Include all the necessary components.
-- Follow appropriate file and folder naming conventions.
-- Create and participate in PRs for the peer review process.
-- Create pull requests (PRs) as needed: from your fork to the main branch of this repository, and from your fork's branch to your fork's master branch.
-
-> Note: Detailed documentation is crucial to ensure that your Helm deployment and hooks function as expected. Engage with the bonus tasks to further enhance your understanding and application deployment skills.
diff --git a/lab11.md b/lab11.md
deleted file mode 100644
index 4994bb1a80..0000000000
--- a/lab11.md
+++ /dev/null
@@ -1,85 +0,0 @@
-# Lab 11: Kubernetes Secrets and Hashicorp Vault
-
-## Overview
-
-In this lab, you will learn how to manage sensitive data, such as passwords, tokens, or keys, within Kubernetes. Additionally, you will configure CPU and memory limits for your application.
-
-## Task 1: Kubernetes Secrets and Resource Management
-
-**6 Points:**
-
-1. Create a Secret Using `kubectl`:
-   - Learn about Kubernetes Secrets and create a secret using the `kubectl` command:
-     - [Kubernetes Secrets](https://kubernetes.io/docs/concepts/configuration/secret/)
-     - [Managing Secrets with kubectl](https://kubernetes.io/docs/tasks/configmap-secret/managing-secret-using-kubectl/#decoding-secret)
-
-2. Verify and Decode Your Secret:
-   - Confirm and decode the secret, then create an `11.md` file within the `k8s` folder. Provide the output of the necessary commands inside this file.
-
-3. Manage Secrets with Helm:
-   - Use Helm to manage your secrets.
-   - Create a `secrets.yaml` file in the `templates` folder.
-   - Define a `secret` object within this YAML file.
-   - Add an `env` field to your `Deployment`. The path to update is: `spec.template.spec.containers.env`.
-
-     > Refer to this [Helm Secrets Video](https://www.youtube.com/watch?v=hRSlKRvYe1A) for guidance.
-
-   - Update your Helm deployment as instructed in the video.
-   - Retrieve the list of pods using the command `kubectl get po`. Use the name of the pod as proof of your success within the report.
-   - Verify your secret inside the pod, for example: `kubectl exec demo-5f898f5f4c-2gpnd -- printenv | grep MY_PASS`. Share this output in `11.md`.
-
-## Task 2: Vault Secret Management System
-
-**4 Points:**
-
-1. Install Vault Using Helm Chart:
-   - Install Vault using a Helm chart. Follow the steps provided in this guide:
-     - [Vault Installation Guide](https://developer.hashicorp.com/vault/tutorials/kubernetes/kubernetes-sidecar#install-the-vault-helm-chart)
-
-2. Follow the Tutorial with Your Helm Chart:
-   - Adapt the tutorial to work with your Helm chart, including the following steps:
-     - [Set a Secret in Vault](https://developer.hashicorp.com/vault/tutorials/kubernetes/kubernetes-sidecar#set-a-secret-in-vault)
-     - [Configure Kubernetes Authentication](https://developer.hashicorp.com/vault/tutorials/kubernetes/kubernetes-sidecar#configure-kubernetes-authentication)
-     - Be cautious with the service account. If you used `helm create ...`, it will be created automatically. In the guide, they create it manually.
-       - [Manually Define a Kubernetes Service Account](https://developer.hashicorp.com/vault/tutorials/kubernetes/kubernetes-sidecar#define-a-kubernetes-service-account)
-
-3. Implement Vault Secrets in Your Helm Chart:
-   - Use the steps from the guide as an example for your Helm chart:
-     - [Update values.yaml](https://developer.hashicorp.com/vault/tutorials/kubernetes/kubernetes-sidecar#launch-an-application)
-     - [Add Labels](https://developer.hashicorp.com/vault/tutorials/kubernetes/kubernetes-sidecar#inject-secrets-into-the-pod)
-   - Test to ensure your credentials are injected successfully. Use the `kubectl exec -it <your_app> -- bash` command to access the container. Verify the injected secrets using `cat /path/to/your/secret` and `df -h`. Share the output in the `11.md` report.
-   - Apply a template as described in the guide. Test the updates as you did in the previous step and provide the outputs in `11.md`.
-
-**List of Requirements:**
-
-- Proof of work with a secret in `11.md` for the Task 1 - steps 2 and 3.
-- `secrets.yaml` file.
-- Resource requests and limits for CPU and memory.
-- Vault configuration implemented, with proofs in `11.md`.
-
-## Bonus Task: Resource Management and Environment Variables
-
-**2.5 Points:**
-
-1. Read About Resource Management:
-   - Familiarize yourself with resource management in Kubernetes:
-     - [Resource Management](https://kubernetes.io/docs/concepts/configuration/manage-resources-containers/)
-
-2. Set Up Requests and Limits for CPU and Memory for Both Helm Charts:
-   - Configure resource requests and limits for CPU and memory for your application.
-   - Test to ensure these configurations work correctly.
-
-3. Add Environment Variables for Your Containers for Both Helm Charts:
-   - Read about Kubernetes environment variables:
-     - [Kubernetes Environment Variables](https://kubernetes.io/docs/tasks/inject-data-application/define-environment-variable-container/)
-   - Update your Helm chart with several environment variables using named templates. Move these variables to the `_helpers.tpl` file:
-     - [Helm Named Templates](https://helm.sh/docs/chart_template_guide/named_templates/)
-
-### Guidelines
-
-- Ensure that your documentation is clear and organized.
-- Include all the necessary components.
-- Follow appropriate file and folder naming conventions.
-- Create pull requests (PRs) as needed: from your fork to the main branch of this repository, and from your fork's branch to your fork's master branch.
-
-> Note: Thorough documentation is essential to demonstrate your success in managing secrets and resource allocation in Kubernetes. Explore the bonus tasks to enhance your skills further.
diff --git a/lab12.md b/lab12.md
deleted file mode 100644
index efb72a29ec..0000000000
--- a/lab12.md
+++ /dev/null
@@ -1,68 +0,0 @@
-# Lab 12: Kubernetes ConfigMaps
-
-## Overview
-
-In this lab, you'll delve into Kubernetes ConfigMaps, focusing on managing non-confidential data and upgrading your application for persistence. ConfigMaps provide a way to decouple configuration artifacts from image content, allowing you to manage configuration data separately from the application.
-
-## Task 1: Upgrade Application for Persistence
-
-**6 Points:**
-
-1. Upgrade Your Application:
-   - Modify your application to:
-     - Implement a counter logic in your application to keep track of the number of times it's accessed.
-     - Save the counter number in the `visits` file.
-     - Introduce a new endpoint `/visits` to display the recorded visits.
-   - Test the changes:
-     - Update your `docker-compose.yml` to include a new volume with your `visits` file.
-     - Verify that the enhancements work as expected; you must see the updated number in the `visits` file on the host machine.
-     - Update the `README.md` for your application.
-
-## Task 2: ConfigMap Implementation
-
-**4 Points:**
-
-1. Understand ConfigMaps:
-   - Read about ConfigMaps in Kubernetes:
-     - [ConfigMaps](https://kubernetes.io/docs/concepts/configuration/configmap/)
-
-2. Mount a Config File:
-   - Create a `files` folder with a `config.json` file.
-   - Populate `config.json` with data in JSON format.
-   - Use Helm to mount `config.json`:
-     - Create a `configMap` manifest, extracting data from `config.json` using `.Files.Get`.
-     - Update `deployment.yaml` with `Volumes` and `VolumeMounts`.
-       - [Example](https://carlos.mendible.com/2019/02/10/kubernetes-mount-file-pod-with-configmap/)
-     - Install the updated Helm chart and verify success:
-       - Retrieve the list of pods: `kubectl get po`.
-       - Use the pod name as proof of successful deployment.
-       - Check the ConfigMap inside the pod, e.g., `kubectl exec demo-758cc4d7c4-cxnrn -- cat /config.json`.
-
-3. Documentation:
-   - Create `12.md` in the `k8s` folder and include the output of relevant commands.
-
-**List of Requirements:**
-
-- `config.json` in the `files` folder.
-- `configMap` retrieving data from `config.json` using `.Files.Get`.
-- `Volume`s and `VolumeMount`s in `deployment.yaml`.
-- `12.md` documenting the results of commands.
-
-## Bonus Task: ConfigMap via Environment Variables
-
-**2.5 Points:**
-
-1. Upgrade Bonus App:
-   - Implement persistence logic in your bonus app.
-
-2. ConfigMap via Environment Variables:
-   - Utilize ConfigMap via environment variables in a running container using the `envFrom` property.
-   - Provide proof with the output of the `env` command inside your container.
-
-### Guidelines
-
-- Maintain clear and organized documentation.
-- Use appropriate naming conventions for files and folders.
-- For your repository PR, ensure it's from the `lab12` branch to the main branch.
-
-> Note: Clear documentation is crucial to demonstrate successful data persistence and ConfigMap utilization in Kubernetes. Explore the bonus tasks to further enhance your skills.
diff --git a/lab13.md b/lab13.md
deleted file mode 100644
index e6f6c919f8..0000000000
--- a/lab13.md
+++ /dev/null
@@ -1,212 +0,0 @@
-# Lab 13: ArgoCD for GitOps Deployment
-
-## Overview
-
-In this lab, you will implement ArgoCD to automate Kubernetes application deployments using GitOps principles. You’ll install ArgoCD via Helm, configure it to manage your Python app, and simulate production-like workflows.
-
-## Task 1: Deploy and Configure ArgoCD
-
-**6 Points:**
-
-1. Install ArgoCD via Helm
-   - Add the ArgoCD Helm repository:
-
-     ```bash
-     helm repo add argo https://argoproj.github.io/argo-helm
-     ```
-
-     [ArgoCD Helm Chart Docs](https://github.com/argoproj/argo-helm)
-
-   - Install ArgoCD:
-
-     ```bash
-     helm install argo argo/argo-cd --namespace argocd --create-namespace
-     ```
-
-     [ArgoCD Installation Guide](https://argo-cd.readthedocs.io/en/stable/getting_started/)
-
-   - Verify installation:
-
-     ```bash
-     kubectl wait --for=condition=ready pod -l app.kubernetes.io/name=argocd-server -n argocd --timeout=90s
-     ```
-
-2. Install ArgoCD CLI
-   - Install the ArgoCD CLI tool (required for command-line interactions):
-
-     ```bash
-     # For macOS (Homebrew):
-     brew install argocd
-
-     # For Debian/Ubuntu:
-     sudo apt-get install -y argocd
-
-     # For other OS/architectures:
-     curl -sSL -o argocd https://github.com/argoproj/argo-cd/releases/latest/download/argocd-linux-amd64
-     chmod +x argocd
-     sudo mv argocd /usr/local/bin/
-     ```
-
-     [ArgoCD CLI Docs](https://argo-cd.readthedocs.io/en/stable/cli_installation/)
-
-   - Verify CLI installation:
-
-     ```bash
-     argocd version
-     ```
-
-3. Access the ArgoCD UI
-   - Forward the ArgoCD server port:
-
-     ```bash
-     kubectl port-forward svc/argocd-server -n argocd 8080:443 &
-     ```
-
-   - Log in using the initial admin password:
-
-     ```bash
-     # Retrieve the password:
-     kubectl -n argocd get secret argocd-initial-admin-secret -o jsonpath="{.data.password}" | base64 --decode
-
-     # Log in via CLI:
-     argocd login localhost:8080 --insecure
-     argocd account login
-     ```
-
-     [ArgoCD Authentication Docs](https://argo-cd.readthedocs.io/en/stable/user-guide/accessing/)
-
-4. Configure Python App Sync
-   - Create an ArgoCD folder:
-     Add an `ArgoCD` folder in your `k8s` directory for ArgoCD manifests.
-
-   - Define the ArgoCD Application:
-     Create `argocd-python-app.yaml` in the `ArgoCD` folder:
-
-     ```yaml
-     apiVersion: argoproj.io/v1alpha1
-     kind: Application
-     metadata:
-       name: python-app
-       namespace: argocd
-     spec:
-       project: default
-       source:
-         repoURL: https://github.com/<your-repo>/S25-core-course-labs.git
-         targetRevision: lab13
-         path: <k8s/app-python>
-         helm:
-           valueFiles:
-             - values.yaml
-       destination:
-         server: https://kubernetes.default.svc
-         namespace: default
-       syncPolicy:
-         automated: {}
-     ```
-
-     [ArgoCD Application Manifest Docs](https://argo-cd.readthedocs.io/en/stable/operator-manual/declarative_setup/)
-
-   - Apply the configuration:
-
-     ```bash
-     kubectl apply -f ArgoCD/argocd-python-app.yaml
-     ```
-
-   - Verify sync:
-
-     ```bash
-     argocd app sync python-app
-     argocd app status python-app
-     ```
-
-5. Test Sync Workflow
-   - Modify `values.yaml` (e.g., update `replicaCount`).
-   - Commit and push changes to the target branch from the config.
-   - Observe ArgoCD auto-sync the update:
-
-     ```bash
-     argocd app status python-app
-     ```
-
-## Task 2: Multi-Environment Deployment & Auto-Sync
-
-**4 Points:**
-
-1. Set Up Multi-Environment Configurations
-   - Extend your Python app’s Helm chart to support `dev` and `prod` environments.
-   - Create environment-specific values files (`values-dev.yaml`, `values-prod.yaml`).
-
-2. Create Namespaces
-
-   ```bash
-   kubectl create namespace dev
-   kubectl create namespace prod
-   ```
-
-3. Deploy Multi-Environment via ArgoCD
-   - Define two ArgoCD applications with auto-sync:
-     `argocd-python-dev.yaml` and `argocd-python-prod.yaml` (as before).
-
-4. Enable Auto-Sync
-   - Test auto-sync by updating `values-prod.yaml` and pushing to Git.
-
-5. Self-Heal Testing
-   - Test 1: Manual Override of Replica Count
-     1. Modify the deployment’s replica count manually:
-
-        ```bash
-        kubectl patch deployment python-app-prod -n prod --patch '{"spec":{"replicas": 3}}'
-        ```
-
-     2. Observe ArgoCD auto-revert the change (due to `syncPolicy.automated`):
-
-        ```bash
-        argocd app sync python-app-prod
-        argocd app status python-app-prod
-        ```
-
-   - Test 2: Delete a Pod (Replica)
-     1. Delete a pod in the `prod` namespace:
-
-        ```bash
-        kubectl delete pod -n prod -l <app.kubernetes.io/name=python-app>
-        ```
-
-     2. Verify Kubernetes recreates the pod to match the deployment’s `replicaCount`:
-
-        ```bash
-        kubectl get pods -n prod -w
-        ```
-
-     3. Confirm ArgoCD shows no drift (since pod deletions don’t affect the desired state):
-
-        ```bash
-        argocd app diff python-app-prod
-        ```
-
-6. Documentation
-   - In `13.md`, include:
-     - Output of `kubectl get pods -n prod` before and after pod deletion.
-     - Screenshots of ArgoCD UI showing sync status and the dashboard after both tests.
-     - Explanation of how ArgoCD handles configuration drift vs. runtime events.
-
-## Bonus Task: Sync Your Bonus App with ArgoCD
-
-**2.5 Points:**
-
-1. Configure ArgoCD for Bonus App
-   - Create an `argocd-<bonus>-app.yaml` similar to Task 1, pointing to your bonus app’s helm chart folder.
-   - Sync and validate deployment with:
-
-     ```bash
-     kubectl get pods -n <namespace>
-     ```
-
-### Guidelines
-
-- Follow the [ArgoCD docs](https://argo-cd.readthedocs.io/) for advanced configurations.
-- Use consistent naming conventions (e.g., `lab13` branch for Git commits).
-- Document all steps in `13.md` (include diffs, outputs, and UI screenshots).
-- For your repository PR, ensure it's from the `lab13` branch to the main branch.
-
-> **Note**: This lab emphasizes GitOps workflows, environment isolation, and automation. Mastery of ArgoCD will streamline your CI/CD pipelines in real-world scenarios.
diff --git a/lab14.md b/lab14.md
deleted file mode 100644
index d1d6ba51cd..0000000000
--- a/lab14.md
+++ /dev/null
@@ -1,106 +0,0 @@
-# Lab 14: Kubernetes StatefulSet
-
-## Overview
-
-In this lab, you'll explore Kubernetes StatefulSets, focusing on managing stateful applications with guarantees about the ordering and uniqueness of a set of Pods.
-
-## Task 1: Implement StatefulSet in Helm Chart
-
-**6 Points:**
-
-1. Understand StatefulSets:
-   - Read about StatefulSet objects:
-     - [Concept](https://kubernetes.io/docs/concepts/workloads/controllers/statefulset/)
-     - [Tutorial](https://kubernetes.io/docs/tutorials/stateful-application/basic-stateful-set/)
-
-2. Update Helm Chart:
-   - Rename `deployment.yml` to `statefulset.yml`.
-   - Create a manifest for StatefulSet following the tutorial.
-   - Test with command: `helm install --dry-run --debug name_of_your_chart path_to_your_chart`.
-   - Fix any issues and deploy it.
-   - Apply best practices by moving values to variables in `values.yml` meaningfully.
-
-## Task 2: StatefulSet Exploration and Optimization
-
-**4 Points:**
-
-1. Research and Documentation:
-   - Create `14.md` report.
-   - Include the output of `kubectl get po,sts,svc,pvc` commands.
-   - Use `minikube service name_of_your_statefulset` command to access your app.
-   - Access the root path of your app from different tabs and modes in your browser.
-   - Check the content of your file in each pod, e.g., `kubectl exec pod/demo-0 -- cat visits`, and provide the output for all replicas.
-   - Describe and explain differences in the report.
-
-2. Persistent Storage Validation
-   - Delete a pod:
-
-     ```bash
-     kubectl delete pod app-stateful-0
-     ```
-
-   - Verify that the PVC and data persist:
-
-     ```bash
-     kubectl get pvc
-     kubectl exec app-stateful-0 -- cat /data/visits
-     ```
-
-3. Headless Service Access
-   - Access pods via DNS:
-
-     ```bash
-     kubectl exec app-stateful-0 -- nslookup app-stateful-1.app-stateful
-     ```
-
-   - Document DNS resolution in `14.md`.
-
-4. Monitoring & Alerts
-   - Add liveness/readiness probes to your StatefulSet.
-   - Describe in `14.md`:
-     - How probes ensure pod health.
-     - Why they’re critical for stateful apps.
-
-5. Ordering Guarantee and Parallel Operations:
-   - Explain why ordering guarantees are unnecessary for your app.
-   - Implement a way to instruct the StatefulSet controller to launch or terminate all Pods in parallel.
-
-**List of Requirements:**
-
-- Outputs of commands in `14.md`.
-- Results of the "number of visits" command for each pod, with an explanation in `14.md`.
-- Answers to questions in point 2 of `14.md`.
-- Implementation of parallel launch and terminate.
-
-## Bonus Task: Update Strategies
-
-**2.5 Points:**
-
-1. Apply StatefulSet to Bonus App
-   - Convert your bonus app’s Helm chart to use a StatefulSet.
-
-2. Explore Update Strategies
-   - Implement Rolling Updates:
-
-     ```yaml
-     spec:
-       updateStrategy:
-         type: RollingUpdate
-         rollingUpdate:
-           partition: 1
-     ```
-
-   - Test Canaries:
-     Update a subset of pods first.
-
-   - Document in `14.md`:
-     - Explain `OnDelete`, `RollingUpdate`, and their use cases.
-     - Compare with Deployment update strategies.
-
-### Guidelines
-
-- Maintain clear and organized documentation.
-- Use appropriate naming conventions for files and folders.
-- For your repository PR, ensure it's from the `lab14` branch to the main branch.
-
-> Note: Understanding StatefulSets and their optimization is crucial for managing stateful applications in Kubernetes. Explore the bonus tasks to further enhance your skills.
diff --git a/lab15.md b/lab15.md
deleted file mode 100644
index 887587145d..0000000000
--- a/lab15.md
+++ /dev/null
@@ -1,78 +0,0 @@
-# Lab 15: Kubernetes Monitoring and Init Containers
-
-## Overview
-
-In this lab, you will explore Kubernetes cluster monitoring using Prometheus with the Kube Prometheus Stack. Additionally, you'll delve into the concept of Init Containers in Kubernetes.
-
-## Task 1: Kubernetes Cluster Monitoring with Prometheus
-
-**6 Points:**
-
-1. This lab was tested on a specific version of components:
-    - Minikube v1.33.0
-    - Minikube kubectl v1.28.3
-    - kube-prometheus-stack-57.2.0    v0.72.0
-    - the minikube start command - `minikube start --driver=docker --container-runtime=containerd`
-
-2. Read about `Kube Prometheus Stack`:
-    - [Helm chart with installation guide](https://github.com/prometheus-community/helm-charts/tree/main/charts/kube-prometheus-stack)
-    - [Explanation of components](https://github.com/prometheus-operator/kube-prometheus#kubeprometheus)
-
-3. Describe Components:
-    - Create `15.md` and detail the components of the Kube Prometheus Stack, explaining their roles and functions. Avoid direct copy-pasting; provide a personal understanding.
-
-4. Install Helm Charts:
-    - Install the Kube Prometheus Stack to your Kubernetes cluster.
-    - Install your app's Helm chart.
-    - Provide the output of the `kubectl get po,sts,svc,pvc,cm` command in the report and explain each part.
-
-5. Utilize Grafana Dashboards:
-    - Access Grafana using `minikube service monitoring-grafana`.
-    - Explore existing dashboards to find information about your cluster:
-        1. Check CPU and Memory consumption of your StatefulSet.
-        2. Identify Pods with higher and lower CPU usage in the default namespace.
-        3. Monitor node memory usage in percentage and megabytes.
-        4. Count the number of pods and containers managed by the Kubelet service.
-        5. Evaluate network usage of Pods in the default namespace.
-        6. Determine the number of active alerts; also check the Web UI with `minikube service monitoring-kube-prometheus-alertmanager`.
-    - Provide answers to all these points in the report.
-
-## Task 2: Init Containers
-
-**4 Points:**
-
-1. Read about `Init Containers`:
-    - [Concept](https://kubernetes.io/docs/concepts/workloads/pods/init-containers/)
-    - [Tutorial](https://kubernetes.io/docs/tasks/configure-pod-container/configure-pod-initialization/#create-a-pod-that-has-an-init-container)
-
-2. Implement Init Container:
-    - Create a new Volume.
-    - Implement an Init container to download any file using `wget` (you can use a site from the example).
-    - Provide proof of success, e.g., `kubectl exec pod/demo-0 -- cat /test.html`.
-
-**List of Requirements:**
-
-- Detailed explanation of monitoring stack components in `15.md`.
-- Output and explanation of `kubectl get po,sts,svc,pvc,cm`.
-- Answers to all 6 questions from point 5 in `15.md`.
-- Implementation of Init Container.
-- Proof of Init Container downloading a file.
-
-## Bonus Task: App Metrics & Multiple Init Containers
-
-**2.5 Points:**
-
-1. App Metrics:
-    - Fetch metrics from your app and provide proof.
-
-2. Init Container Queue:
-    - Create a queue of three Init containers, with any logic like adding new lines to the same file.
-    - Provide proof using the `cat` tool.
-
-### Guidelines
-
-- Ensure clear and organized documentation.
-- Use appropriate naming conventions for files and folders.
-- For your repository PR, ensure it's from the `lab15` branch to the main branch.
-
-> Note: Demonstrate successful implementation and understanding of Kubernetes monitoring and Init Containers. Take your time to explore the bonus tasks for additional learning opportunities.
diff --git a/lab16.md b/lab16.md
deleted file mode 100644
index 37912fc50b..0000000000
--- a/lab16.md
+++ /dev/null
@@ -1,75 +0,0 @@
-# Lab 16: IPFS and Fleek
-
-In this lab, you will explore essential DevOps tools and set up a project on the Fleek service. Follow the tasks below to complete the lab assignment.
-
-## Task 1: Set Up an IPFS Gateway Using Docker
-
-Objective: Understand and implement an IPFS gateway using Docker, upload a file, and verify it via an IPFS cluster.
-
-1. Set Up IPFS Gateway:
-   - Install Docker on your machine if it's not already installed.
-     - [Docker Installation Guide](https://docs.docker.com/get-docker/)
-
-   - Pull the IPFS Docker image and run an IPFS container:
-
-     ```sh
-     docker pull ipfs/go-ipfs
-     docker run -d --name ipfs_host -v /path/to/folder/with/file:/export -v ipfs_data:/data/ipfs -p 8080:8080 -p 4001:4001 -p 5001:5001 ipfs/go-ipfs
-     ```
-
-   - Verify the IPFS container is running:
-
-     ```sh
-     docker ps
-     ```
-
-2. Upload a File to IPFS:
-   - Open a browser and access the IPFS web UI:
-
-     ```sh
-     http://127.0.0.1:5001/webui/
-     ```
-
-   - Explore the web UI and wait for 5 minutes to sync up with the network.
-   - Upload any file via the web UI.
-   - Use the obtained hash to access the file via any public IPFS gateway. Here are a few options:
-     - [IPFS.io Gateway](https://ipfs.io/ipfs/)
-     - [Cloudflare IPFS Gateway](https://cloudflare-ipfs.com/ipfs/)
-     - [Infura IPFS Gateway](https://ipfs.infura.io/ipfs/)
-
-   - Append your file hash to any of the gateway URLs to verify your file is accessible. Note that it may fail due to network overload, so don't worry if you can't reach it.
-
-3. Documentation:
-   - Create a `submission2.md` file.
-   - Share information about connected peers and bandwidth in your report.
-   - Provide the hash and the URLs used to verify the file on the IPFS gateways.
-
-## Task 2: Set Up Project on Fleek.xyz
-
-Objective: Set up a project on the Fleek service and share the IPFS link.
-
-1. Research:
-   - Understand what IPFS is and its purpose.
-   - Explore Fleek's features.
-
-2. Set Up:
-   - Sign up for a Fleek account if you haven't already.
-   - Use your fork of the Labs repository as your project source. Optionally, set up your own website (notify us in advance).
-   - Configure the project settings on Fleek.
-   - Deploy the Labs repository to Fleek, ensuring it is uploaded to IPFS.
-
-3. Documentation:
-   - Share the IPFS link and domain of the deployed project in the `submission2.md` file.
-
-## Additional Resources
-
-- [IPFS Documentation](https://docs.ipfs.io/)
-- [Fleek Documentation](https://docs.fleek.xyz/)
-
-### Guidelines
-
-- Use proper Markdown formatting for documentation files.
-- Organize files with appropriate naming conventions.
-- Create a Pull Request to the main branch of the repository with your completed lab assignment.
-
-> Note: Actively explore and document your findings to gain hands-on experience with IPFS and Fleek.
diff --git a/lab16/index.html b/lab16/index.html
deleted file mode 100644
index acce39eee3..0000000000
--- a/lab16/index.html
+++ /dev/null
@@ -1,303 +0,0 @@
-<!DOCTYPE html>
-<html lang="en">
-<head>
-    <meta charset="UTF-8">
-    <meta name="viewport" content="width=device-width, initial-scale=1.0">
-    <title>DevOps Engineering Expert Track</title>
-    <meta name="description" content="Learn modern DevOps practices through 16 hands-on labs. Master Kubernetes, Terraform, CI/CD, Monitoring, and more.">
-    <style>
-        :root {
-            --primary: #1a1a1a;
-            --secondary: #00a896;
-            --accent: #004b66;
-            --highlight: #a30050;
-            --text: #e0e0e0;
-        }
-
-        * {
-            box-sizing: border-box;
-            margin: 0;
-            padding: 0;
-            font-family: 'Fira Code', monospace;
-        }
-
-        body {
-            background: var(--primary);
-            color: var(--text);
-            line-height: 1.6;
-        }
-
-        .container {
-            width: 90%;
-            margin: 0 auto;
-            padding: 2rem 0;
-        }
-
-        header {
-            background: var(--accent);
-            padding: 1rem 0;
-            position: sticky;
-            top: 0;
-            z-index: 1000;
-        }
-
-        nav ul {
-            display: flex;
-            justify-content: center;
-            list-style: none;
-            gap: 2rem;
-        }
-
-        nav a {
-            display: block;
-            color: var(--text);
-            padding: 1rem 2rem;
-            text-decoration: none;
-            transition: 0.3s;
-        }
-
-        nav a:hover {
-            background: var(--secondary);
-            border-radius: 4px;
-        }
-
-        .hero {
-            text-align: center;
-            padding: 5rem 0;
-            background: linear-gradient(45deg, var(--secondary), var(--accent));
-            background-size: 400% 400%;
-            animation: gradient 15s ease infinite;
-        }
-
-        @keyframes gradient {
-            0% { background-position: 0% 50%; }
-            50% { background-position: 100% 50%; }
-            100% { background-position: 0% 50%; }
-        }
-
-        .hero h1 {
-            font-size: 4.5rem;
-            color: white;
-            margin-bottom: 1rem;
-        }
-
-        .hero p {
-            font-size: 1.5rem;
-            margin-bottom: 2rem;
-            color: rgba(255, 255, 255, 0.8);
-        }
-
-        .hero-button {
-            background: var(--highlight);
-            color: white;
-            padding: 14px 40px;
-            border-radius: 30px;
-            font-size: 1.2rem;
-            text-decoration: none;
-            transition: transform 0.3s;
-        }
-
-        .hero-button:hover {
-            transform: translateY(-5px);
-        }
-
-        .topic-grid {
-            display: grid;
-            grid-template-columns: repeat(auto-fit, minmax(250px, 1fr));
-            gap: 2rem;
-            margin: 3rem 0;
-        }
-
-        .topic-card {
-            background: var(--accent);
-            padding: 2rem;
-            border-radius: 20px;
-            text-align: center;
-            transition: transform 0.3s;
-        }
-
-        .topic-card:hover {
-            transform: translateY(-7px);
-        }
-
-        .topic-card i {
-            font-size: 3.5rem;
-            color: var(--secondary);
-            margin-bottom: 1rem;
-        }
-
-        .syllabus {
-            background: var(--primary);
-            padding: 4rem 0;
-        }
-
-        .syllabus ol {
-            list-style-type: decimal;
-            padding-left: 2rem;
-            line-height: 1.8;
-        }
-
-        .syllabus li {
-            margin: 1rem 0;
-        }
-
-        .syllabus li span {
-            font-weight: bold;
-            color: var(--secondary);
-        }
-
-        .roadmap {
-            background: var(--primary);
-            padding: 4rem 0;
-        }
-
-        .roadmap-step {
-            background: var(--accent);
-            padding: 1.5rem;
-            border-radius: 15px;
-            margin: 1rem 0;
-            color: white;
-        }
-
-        .roadmap-step::before {
-            content: "☕";
-            margin-right: 1rem;
-            color: var(--secondary);
-        }
-
-        .pricing-table {
-            display: grid;
-            grid-template-columns: repeat(auto-fit, minmax(300px, 1fr));
-            gap: 2rem;
-            margin: 3rem 0;
-        }
-
-        .pricing-card {
-            background: var(--accent);
-            padding: 2rem;
-            border-radius: 20px;
-            transition: transform 0.3s;
-        }
-
-        .pricing-card:hover {
-            transform: translateY(-5px);
-        }
-
-        .pricing-card h3 {
-            color: var(--secondary);
-            margin-bottom: 1rem;
-        }
-
-        .footer {
-            background: var(--accent);
-            padding: 2rem 0;
-            text-align: center;
-        }
-
-        a {
-            color: var(--secondary);
-            text-decoration: underline;
-            transition: color 0.3s;
-        }
-
-        a:hover {
-            color: var(--highlight);
-        }
-    </style>
-</head>
-<body>
-    <header>
-        <div class="container">
-            <nav>
-                <ul>
-                    <li><a href="#why-us">Why Choose Us?</a></li>
-                    <li><a href="#syllabus">Lab Syllabus</a></li>
-                    <li><a href="#roadmap">Learning Path</a></li>
-                </ul>
-            </nav>
-        </div>
-    </header>
-
-    <section class="hero">
-        <div class="container">
-            <h1>Master Modern DevOps Practices</h1>
-            <p>16 hands-on labs covering Kubernetes, Terraform, CI/CD, and more</p>
-            <a href="https://github.com/inno-devops-labs/S25-core-course-labs" class="hero-button">Start Free Trial →</a>
-        </div>
-    </section>
-
-    <section id="why-us" class="container">
-        <h2>Why This Course?</h2>
-        <div class="why-us-grid">
-            <div>
-                <i class="fas fa-graduation-cap"></i>
-                <h3>16 Advanced Labs</h3>
-                <p>Build production-ready systems from scratch</p>
-            </div>
-            <div>
-                <i class="fas fa-code-branch"></i>
-                <h3>Industry-Standard Tools</h3>
-                <p>Terraform, ArgoCD, Prometheus, Vault, and more</p>
-            </div>
-            <div>
-                <i class="fas fa-user-check"></i>
-                <h3>Job-Ready Skills</h3>
-                <p>Learn tools used by top tech companies</p>
-            </div>
-        </div>
-    </section>
-
-    <section id="syllabus" class="syllabus">
-        <div class="container">
-            <h2>Lab Syllabus (2025 Edition)</h2>
-            <ol>
-                <li><span>Lab 1:</span> Web Application Development</li>
-                <li><span>Lab 2:</span> Containerization</li>
-                <li><span>Lab 3:</span> Continuous Integration</li>
-                <li><span>Lab 4:</span> Infrastructure as Code & Terraform</li>
-                <li><span>Lab 5:</span> Configuration Management</li>
-                <li><span>Lab 6:</span> Ansible Automation</li>
-                <li><span>Lab 7:</span> Observability, Logging, Loki Stack</li>
-                <li><span>Lab 8:</span> Monitoring & Prometheus</li>
-                <li><span>Lab 9:</span> Kubernetes & Declarative Manifests</li>
-                <li><span>Lab 10:</span> Helm Charts & Library Charts</li>
-                <li><span>Lab 11:</span> Kubernetes Secrets Management (Vault, ConfigMaps)</li>
-                <li><span>Lab 12:</span> Kubernetes ConfigMaps & Environment Variables</li>
-                <li><span>Lab 13:</span> GitOps with ArgoCD</li>
-                <li><span>Lab 14:</span> StatefulSet Optimization</li>
-                <li><span>Lab 15:</span> Kubernetes Monitoring & Init Containers</li>
-                <li><span>Lab 16:</span> IPFS & Fleek Decentralization</li>
-            </ol>
-        </div>
-    </section>
-
-    <section id="roadmap" class="roadmap container">
-        <h2>Learning Progression</h2>
-        <div class="roadmap-step">
-            <p><strong>Phase 1:</strong> Foundations (Labs 1-6)</p>
-            <p>Web Dev → Containers → CI/CD → IaC → Ansible</p>
-        </div>
-        <div class="roadmap-step">
-            <p><strong>Phase 2:</strong> Observability (Labs 7-8)</p>
-            <p>Logging → Monitoring → Loki/Prometheus</p>
-        </div>
-        <div class="roadmap-step">
-            <p><strong>Phase 3:</strong> Kubernetes Mastery (Labs 9-12)</p>
-            <p>Deployments → Helm → Secrets → ConfigMaps</p>
-        </div>
-        <div class="roadmap-step">
-            <p><strong>Phase 4:</strong> Expert Track (Labs 13-16)</p>
-            <p>GitOps → StatefulSets → IPFS → Final Project</p>
-        </div>
-    </section>
-
-    <footer class="footer">
-        <div class="container">
-            <p>© 2025 DevOps Engineering Institute</p>
-            <p>Questions? <a href="mailto:creed@soramitsu.co.jp">Email Us</a> | <a href="https://github.com/inno-devops-labs/S25-core-course-labs">GitHub Repo</a></p>
-        </div>
-    </footer>
-
-    <script src="https://kit.fontawesome.com/your-fontawesome-kit.js" crossorigin="anonymous"></script>
-</body>
-</html>
\ No newline at end of file
diff --git a/lab2.md b/lab2.md
deleted file mode 100644
index ff71bc227d..0000000000
--- a/lab2.md
+++ /dev/null
@@ -1,85 +0,0 @@
-# Lab 2: Containerization - Docker
-
-## Overview
-
-In this lab assignment, you will learn to containerize applications using Docker, while focusing on best practices. Additionally, you will explore Docker multi-stage builds. Follow the tasks below to complete the lab assignment.
-
-## Task 1: Dockerize Your Application
-
-**6 Points:**
-
-1. Create a `Dockerfile`:
-   - Inside the `app_python` folder, craft a `Dockerfile` for your application.
-   - Research and implement Docker best practices. Utilize a Dockerfile linter for quality assurance.
-
-2. Build and Test Docker Image:
-   - Build a Docker image using your Dockerfile.
-   - Thoroughly test the image to ensure it functions correctly.
-
-3. Push Image to Docker Hub:
-   - If you lack a public Docker Hub account, create one.
-   - Push your Docker image to your public Docker Hub account.
-
-4. Run and Verify Docker Image:
-   - Retrieve the Docker image from your Docker Hub account.
-   - Execute the image and validate its functionality.
-
-## Task 2: Docker Best Practices
-
-**4 Points:**
-
-1. Enhance your docker image by implementing [Docker Best Practices](https://docs.docker.com/build/building/best-practices/).
-   - No root user inside, or you will get no points at all.
-
-2. Write `DOCKER.md`:
-   - Inside the `app_python` folder, create a `DOCKER.md` file.
-   - Elaborate on the best practices you employed within your Dockerfile.
-   - Implementing and listing numerous Docker best practices will earn you more points.
-
-3. Enhance the README.md:
-   - Update the `README.md` file in the `app_python` folder.
-   - Include a dedicated `Docker` section, explaining your containerized application and providing clear instructions for execution.
-     - How to build?
-     - How to pull?
-     - How to run?
-
-### List of Requirements
-
-- Rootless container.
-- Use COPY, but only specific files.
-- Layer sanity.
-- Use `.dockerignore`.
-- Use a precise version of your base image and language, for example `python:3-alpine3.15`.
-
-## Bonus Task: Multi-Stage Builds Exploration
-
-**2.5 Points:**
-
-1. Dockerize Previous App:
-   - Craft a `Dockerfile` for the application from the prior lab.
-   - Place this Dockerfile within the corresponding `app_*` folder.
-
-2. Follow Main Task Guidelines:
-   - Apply the same steps and suggestions as in the primary Dockerization task.
-
-3. Study Docker Multi-Stage Builds:
-   - Familiarize yourself with Docker multi-stage builds.
-   - Consider implementing multi-stage builds, only if they enhance your project's structure and efficiency.
-
-4. Study Distroless Images:
-   - Explore how to use Distroless images by reviewing the official documentation: [GoogleContainerTools/distroless](https://github.com/GoogleContainerTools/distroless).
-   - Create new `distroless.Dockerfile` files for your Python app and your second app.
-   - Use the `nonroot` tag for both images to ensure they run with non-root privileges.
-   - Verify that the applications work correctly with the Distroless images.
-   - Compare the sizes of your previous Docker images with the new Distroless-based images.
-   - In the `DOCKER.md` file, describe the differences between the Distroless images and your previous images. Explain why these differences exist (e.g., smaller size, reduced attack surface, etc.).
-   - Include a screenshot of your final results (e.g., image sizes).
-   - Add a new section to the `README.md` file titled "Distroless Image Version".
-
-### Guidelines
-
-- Utilize appropriate Markdown formatting and structure for all documentation.
-- Organize files within the lab folder with suitable naming conventions.
-- Create pull requests (PRs) as needed: from your fork to the main branch of this repository, and from your fork's branch to your fork's master branch.
-
-> Note: Utilize Docker to containerize your application, adhering to best practices. Explore Docker multi-stage builds for a deeper understanding, and document your process using Markdown.
diff --git a/lab3.md b/lab3.md
deleted file mode 100644
index 2f4899750a..0000000000
--- a/lab3.md
+++ /dev/null
@@ -1,53 +0,0 @@
-# Lab 3: Continuous Integration Lab
-
-## Overview
-
-In this lab assignment, you will delve into continuous integration (CI) practices by focusing on code testing, setting up GitHub Actions CI, and optimizing workflows. Additionally, you will have the opportunity to explore bonus tasks to enhance your CI knowledge. Follow the tasks below to complete the lab assignment.
-
-## Task 1: Code Testing and GitHub Actions CI
-
-**6 Points:**
-
-1. Code Testing:
-   - Begin by researching and implementing best practices for code testing.
-   - Write comprehensive unit tests for your application.
-   - In the `PYTHON.md` file, describe the unit tests you've created and the best practices you applied.
-   - Enhance the `README.md` file by adding a "Unit Tests" section.
-
-2. Set Up GitHub Actions CI:
-   - Create a CI workflow using GitHub Actions to build and test your Python project. Refer to the [official GitHub Actions documentation](https://docs.github.com/en/actions/automating-builds-and-tests/building-and-testing-python) for guidance.
-   - Ensure your CI workflow includes at least three essential steps: Dependencies, Linter, and Tests.
-   - Integrate Docker-related steps into your CI workflow, with at least two steps: Login, and Build & Push. You can refer to the [Docker GitHub Actions documentation](https://docs.docker.com/ci-cd/github-actions/) for assistance.
-   - Update the `README.md` file to provide information about your CI workflow.
-
-## Task 2: CI Workflow Improvements
-
-**4 Points:**
-
-1. Workflow Enhancements:
-   - Add a workflow status badge to your repository for visibility.
-   - Dive into best practices for CI workflows and apply them to optimize your existing workflow.
-   - Utilize build cache to enhance workflow efficiency.
-   - Create a `CI.md` file and document the best practices you've implemented.
-
-2. Implement Snyk Vulnerability Checks:
-   - Integrate Snyk into your CI workflow to identify and address vulnerabilities in your projects. You can refer to the [Python example](https://github.com/snyk/actions/tree/master/python-3.8) for guidance. If you face any issues installing dependencies, check [another option](https://docs.snyk.io/integrations/snyk-ci-cd-integrations/github-actions-integration#use-your-own-development-environment).
-
-## Bonus Task
-
-**2.5 Points:**
-
-1. Follow the Main Task Steps:
-   - Apply the same steps as in the primary CI task to set up CI workflows for an extra application. You can find useful examples in the [GitHub Actions starter workflows](https://github.com/actions/starter-workflows/tree/main/ci).
-
-2. CI Workflow Improvements:
-   1. Python App CI: Configure the CI workflow to run only when changes occur in the `app_python` folder.
-   2. Extra Language App CI: Configure the CI workflow to run only when changes occur in the `app_<language>` folder.
-
-### Guidelines
-
-- Use proper Markdown formatting and structure for all documentation files.
-- Organize files within the lab folder with suitable naming conventions.
-- Create pull requests (PRs) as needed: from your fork to the main branch of this repository, and from your fork's branch to your fork's master branch.
-
-> Note: Implement CI best practices, optimize your workflows, and explore bonus tasks to deepen your understanding of continuous integration.
diff --git a/lab4.md b/lab4.md
deleted file mode 100644
index e88b5e63e5..0000000000
--- a/lab4.md
+++ /dev/null
@@ -1,84 +0,0 @@
-# Lab 4: Infrastructure as Code Lab
-
-## Overview
-
-In this lab assignment, you will explore Infrastructure as Code (IaC) using Terraform. You'll build Docker and AWS infrastructures and dive into managing GitHub repositories through Terraform. Additionally, there are bonus tasks to enhance your Terraform skills. Follow the tasks below to complete the lab assignment.
-
-## Task 1: Introduction to Terraform
-
-**6 Points:**
-
-0. You will need a VPN tool for this lab
-
-1. Get Familiar with Terraform:
-   - Begin by familiarizing yourself with Terraform by reading the [introduction](https://www.terraform.io/intro/index.html) and exploring [best practices](https://www.terraform.io/docs/cloud/guides/recommended-practices/index.html).
-
-2. Set Up Terraform Workspace:
-   - Create a `terraform` folder to organize your Terraform workspaces.
-   - Inside the `terraform` folder, create a file named `TF.md`.
-
-3. Docker Infrastructure Using Terraform:
-   - Follow the [Docker tutorial](https://learn.hashicorp.com/collections/terraform/docker-get-started) for building a Docker infrastructure with Terraform.
-   - Perform the following tasks as instructed in the tutorial:
-      - Install Terraform.
-      - Build the Infrastructure.
-      - Provide the output of the following commands in the `TF.md` file:
-
-        ```sh
-            terraform state show
-            terraform state list
-        ```
-
-      - Document a part of the log with the applied changes.
-      - Utilize input variables to rename your Docker container.
-      - Finish the tutorial and provide the output of the `terraform output` command in the `TF.md` file.
-
-4. Yandex Cloud Infrastructure Using Terraform:
-   - Create an account on [Yandex Cloud](https://cloud.yandex.com/).
-   - Check for available free-tier options and select a free VM instance suitable for this lab.
-   - Follow the [Yandex Quickstart Guide](https://yandex.cloud/en-ru/docs/tutorials/infrastructure-management/terraform-quickstart#linux_1) to set up and configure Terraform for managing Yandex Cloud resources.
-   - Document the entire process, including setup steps, configurations, and any challenges encountered, in the `TF.md` file.
-
-5. [Optional] AWS Infrastructure Using Terraform:
-   - Follow the [AWS tutorial](https://learn.hashicorp.com/tutorials/terraform/aws-build?in=terraform/aws-get-started) alongside the instructions from the previous step.
-
-## Task 2: Terraform for GitHub
-
-**4 Points:**
-
-1. GitHub Infrastructure Using Terraform:
-   - Utilize the [GitHub provider for Terraform](https://registry.terraform.io/providers/integrations/github/latest/docs).
-   - Create a directory inside the `terraform` folder specifically for managing your GitHub project infrastructure.
-   - Build GitHub infrastructure following a reference like [this example](https://dev.to/pwd9000/manage-and-maintain-github-with-terraform-2k86). Prepare `.tf` files that include:
-      - Repository name
-      - Repository description
-      - Visibility settings
-      - Default branch
-      - Branch protection rule for the default branch
-   - Avoid placing your token as a variable in the code; instead, use an environment variable.
-
-2. Import Existing Repository:
-   - Use the `terraform import` command to import your current GitHub repository into your Terraform configuration. No need to create a new one. Example: `terraform import "github_repository.core-course-labs" "core-course-labs"`.
-
-3. Apply Terraform Changes:
-   - Apply changes from your Terraform configuration to your GitHub repository.
-
-4. Document Best Practices:
-   - Provide Terraform-related best practices that you applied in the `TF.md` file.
-
-## Bonus Task: Adding Teams
-
-**2.5 Points:**
-
-1. GitHub Teams Using Terraform:
-   - You need to create a new organization.
-   - Extend your Terraform configuration to add several teams to your GitHub repository, each with different levels of access.
-   - Apply the changes and ensure they take effect in your GitHub repository.
-
-### Guidelines
-
-- Use proper Markdown formatting and structure for documentation files.
-- Organize files within the lab folder with suitable naming conventions.
-- Create pull requests (PRs) as needed: from your fork to the main branch of this repository, and from your fork's branch to your fork's master branch.
-
-> Note: Dive into Terraform to manage infrastructures efficiently. Explore the AWS and Docker tutorials, and don't forget to document your process and best practices in the `TF.md` file.
diff --git a/lab5.md b/lab5.md
deleted file mode 100644
index bead18ceea..0000000000
--- a/lab5.md
+++ /dev/null
@@ -1,141 +0,0 @@
-# Lab 5: Ansible and Docker Deployment
-
-## Overview
-
-In this lab, you will get acquainted with Ansible, a powerful configuration management and automation tool. Your objective is to use Ansible to deploy Docker on a newly created cloud VM. This knowledge will be essential for your application deployment in the next lab.
-
-## Task 1: Initial Setup
-
-**6 Points:**
-
-1. Repository Structure:
-   - Organize your repository following the recommended structure below:
-
-     ```sh
-     .
-     |-- README.md
-     |-- ansible
-     |   |-- inventory
-     |   |   `-- default_aws_ec2.yml
-     |   |-- playbooks
-     |   |   `-- dev
-     |   |       `-- main.yaml
-     |   |-- roles
-     |   |   |-- docker
-     |   |   |   |-- defaults
-     |   |   |   |   `-- main.yml
-     |   |   |   |-- handlers
-     |   |   |   |   `-- main.yml
-     |   |   |   |-- tasks
-     |   |   |   |   |-- install_compose.yml
-     |   |   |   |   |-- install_docker.yml
-     |   |   |   |   `-- main.yml
-     |   |   |   `-- README.md
-     |   |   `-- web_app
-     |   |       |-- defaults
-     |   |       |   `-- main.yml
-     |   |       |-- handlers
-     |   |       |   `-- main.yml
-     |   |       |-- meta
-     |   |       |   `-- main.yml
-     |   |       |-- tasks
-     |   |       |   `-- main.yml
-     |   |       `-- templates
-     |   |           `-- docker-compose.yml.j2
-     |   `-- ansible.cfg
-     |-- app_go
-     |-- app_python
-     `-- terraform
-     ```
-
-2. Installation and Introduction:
-   - Install Ansible and familiarize yourself with its basics. You can follow the [Ansible installation guide](https://docs.ansible.com/ansible/latest/installation_guide/intro_installation.html).
-
-3. Use an Existing Ansible Role for Docker:
-   - Utilize an existing Ansible role for Docker from `ansible-galaxy` as a template. You can explore [this Docker role](https://github.com/geerlingguy/ansible-role-docker) as an example.
-
-4. Create a Playbook and Testing:
-   - Develop an Ansible playbook for deploying Docker.
-   - Test your playbook to ensure it works as expected.
-
-## Task 2: Custom Docker Role
-
-**4 Points:**
-
-1. Create Your Custom Docker Role:
-   - Develop a custom Ansible role for Docker with the following tasks:
-     1. Install Docker and Docker Compose.
-     2. Update your playbook to utilize this custom role. [Tricks and Tips](https://docs.ansible.com/ansible/latest/user_guide/playbooks_best_practices.html).
-     3. Test your playbook with the custom role to ensure successful deployment.
-     4. Make sure the role has a task to configure Docker to start on boot (`systemctl enable docker`).
-     5. Include a task to add the current user to the `docker` group to avoid using `sudo` for Docker commands.
-
-2. Documentation:
-   - Develop an `ANSIBLE.md` file in the `ansible` folder to document your Ansible-related work.
-   - Create a `README.md` file in the `ansible/roles/docker` folder.
-   - Use a Markdown template to describe your Docker role, its requirements and usage.
-   - Example `README.md` template for the Docker role:
-
-   ```markdown
-      # Docker Role
-
-      This role installs and configures Docker and Docker Compose.
-
-      ## Requirements
-
-      - Ansible 2.9+
-      - Ubuntu 22.04
-
-      ## Role Variables
-
-      - `docker_version`: The version of Docker to install (default: `latest`).
-      - `docker_compose_version`: The version of Docker Compose to install (default: `1.29.2`).
-
-      ## Example Playbook
-
-      ```yaml
-      - hosts: all
-        roles:
-          - role: docker
-   ```
-
-3. Deployment Output:
-   - Execute your playbook to deploy the Docker role.
-   - Provide the last 50 lines of the output from your deployment command in the `ANSIBLE.md` file.
-   - Use the `--check` flag with `ansible-playbook` to perform a dry run and verify changes before applying them.
-
-   Example command:
-
-   ```sh
-    ansible-playbook <path_to_your_playbook> --diff
-   ```
-
-4. **Inventory Details:**
-   - Execute the following command `ansible-inventory -i <name_of_your_inventory_file>.yaml --list` and provide its output in the `ANSIBLE.md` file.
-   - Validate the inventory file using `ansible-inventory -i <name_of_your_inventory_file>.yaml --graph` to visualize the inventory structure.
-   - Ensure you have documented the inventory information.
-
-## Bonus Task: Dynamic Inventory
-
-**2.5 Points:**
-
-1. Set up Dynamic Inventory:
-   - Implement dynamic inventory for your cloud environment, if available.
-   - You may explore ready-made solutions for dynamic inventories:
-
-     - [AWS Example](https://docs.ansible.com/ansible/latest/collections/amazon/aws/aws_ec2_inventory.html)
-     - [Yandex Cloud (Note: Not tested)](https://github.com/rodion-goritskov/yacloud_compute)
-
-   Implementing dynamic inventory can enhance your automation capabilities.
-
-2. Secure Docker Configuration:
-   - Add a task to configure Docker security settings, such as disabling root access.
-   - Use the `copy` module and modify the `daemon.json` file.
-
-### Guidelines
-
-- Use proper Markdown formatting and structure for documentation files.
-- Organize files within the lab folder with suitable naming conventions.
-- Create pull requests (PRs) as needed: from your fork to the main branch of this repository, and from your fork's branch to your fork's master branch.
-
-> Note: Ensure that your repository is well-structured, follow Ansible best practices, and provide clear documentation for a successful submission.
diff --git a/lab6.md b/lab6.md
deleted file mode 100644
index cc8249390d..0000000000
--- a/lab6.md
+++ /dev/null
@@ -1,139 +0,0 @@
-# Lab 6: Ansible and Application Deployment
-
-## Overview
-
-In this lab, you will utilize Ansible to set up a Continuous Deployment (CD) process for your application.
-
-## Task 1: Application Deployment
-
-**6 Points:**
-
-1. Create an Ansible Role:
-   - Develop an Ansible role specifically for deploying your application's Docker image, it can be done manually or via `ansible-galaxy init roles/web_app`. Call it `web_app`.
-   - Define variables in `roles/web_app/defaults/main.yml`.
-   - Add tasks to `roles/web_app/tasks/main.yml` to pull the Docker image and start the container.
-
-   > Managing just a container is bad practice, you can omit it and move to the Task 2 directly.
-
-2. Update the Playbook:
-   - Modify your Ansible playbook to integrate the new role you've created for Docker image deployment.
-
-3. Deployment Output:
-   - Execute your playbook to deploy the role.
-   - Provide the last 50 lines of the output from your deployment command in the `ANSIBLE.md` file.
-
-## Task 2: Ansible Best Practices
-
-**4 Points:**
-
-1. Group Tasks with Blocks:
-   - Organize related tasks within your playbooks using Ansible blocks.
-   - Implement logical blocks. For example:
-
-   ```yaml
-   - name: Setup Docker Environment
-      block:
-      - name: Install Docker
-         apt:
-            name: docker.io
-            state: present
-
-      - name: Start Docker Service
-         service:
-            name: docker
-            state: started
-            enabled: yes
-      tags:
-      - setup
-   ```
-
-2. Role Dependency:
-   - Set the role dependency for your `web_app` role to include the `docker` role.
-   - Specify dependencies in `roles/web_app/meta/main.yml`.
-
-3. Apply Tags:
-   - Implement Ansible tags to group tasks logically and enable selective execution. For example:
-
-     ```yaml
-     - name: Pull Docker image
-       docker_image:
-         name: "{{ docker_image }}"
-         source: pull
-       tags:
-         - docker
-     ```
-
-   - Run specific tags. For example:
-
-     ```bash
-     ansible-playbook site.yml --tags docker
-     ```
-
-4. Wipe Logic:
-   - Create a wipe logic in `roles/web_app/tasks/0-wipe.yml`. This should include removing your Docker container and all related files.
-   - Ensure that this wipe process can be enabled or disabled by using a variable, for example, `web_app_full_wipe=true`.
-
-5. Separate Tag for Wipe:
-   - Utilize a distinct tag for the **Wipe** section of your Ansible playbook. This allows you to run the wipe tasks independently from the main tasks.
-
-6. Docker Compose File:
-   - Write a Jinja2 template (`roles/web_app/templates/docker-compose.yml.j2`). For example:
-
-     ```yaml
-     version: '3'
-     services:
-       app:
-         image: "{{ docker_image }}"
-         ports:
-           - "{{ app_port }}:80"
-     ```
-
-   - Deliver the template using the `template` module in `roles/web_app/tasks/main.yml`.
-   - Suggested structure:
-
-   ```sh
-   .
-   |-- defaults
-   |   `-- main.yml
-   |-- meta
-   |   `-- main.yml
-   |-- tasks
-   |   |-- 0-wipe.yml
-   |   `-- main.yml
-   `-- templates
-      `-- docker-compose.yml.j2
-   ```
-
-7. Create `README.md`:
-   - Create a `README.md` file in the `ansible/roles/web_app` folder.
-   - Use a suggested Docker Markdown template from the previous lab to describe your role, its requirements and usage.
-
-## Bonus Task: CD Improvement
-
-**2.5 Points:**
-
-1. Create an Extra Playbook:
-   - Develop an additional Ansible playbook specifically for your bonus application.
-   - You can reuse the existing Ansible role you created for your primary application or create a new one.
-   - Suggested structure:
-
-   ```sh
-   .
-   `--ansible
-       `-- playbooks
-           `-- dev
-               |-- app_python
-               |   `-- main.yaml
-               `-- app_go
-                   `-- main.yaml
-   ```
-
-### Guidelines
-
-- Use proper Markdown formatting and structure for documentation files.
-- Organize files within the lab folder with suitable naming conventions.
-- Create pull requests (PRs) as needed: from your fork to the main branch of this repository, and from your fork's branch to your fork's master branch.
-- Follow the suggested structure for your Ansible roles, tasks, and templates.
-- Utilize Ansible best practices such as grouping tasks with blocks, applying tags, and separating roles logically.
-
-> Note: Apply diligence to your Ansible implementation, follow best practices, and clearly document your work to achieve the best results in this lab assignment.
diff --git a/lab7.md b/lab7.md
deleted file mode 100644
index 48e65eb202..0000000000
--- a/lab7.md
+++ /dev/null
@@ -1,59 +0,0 @@
-# Lab 7: Monitoring and Logging
-
-## Overview
-
-In this lab, you will become familiar with a logging stack that includes Promtail, Loki, and Grafana. Your goal is to create a Docker Compose configuration and configuration files to set up this logging stack.
-
-## Task 1: Logging Stack Setup
-
-**6 Points:**
-
-1. Study the Logging Stack:
-   - Begin by researching the components of the logging stack:
-     - [Grafana Webinar: Loki Getting Started](https://grafana.com/go/webinar/loki-getting-started/)
-     - [Loki Overview](https://grafana.com/docs/loki/latest/overview/)
-     - [Loki GitHub Repository](https://github.com/grafana/loki)
-
-2. Create a Monitoring Folder:
-   - Start by creating a new folder named `monitoring` in your project directory.
-
-3. Docker Compose Configuration:
-   - Inside the `monitoring` folder, prepare a `docker-compose.yml` file that defines the entire logging stack along with your application.
-   - To assist you in this task, refer to these resources for sample Docker Compose configurations:
-     - [Example Docker Compose Configuration from Loki Repository](https://github.com/grafana/loki/blob/main/production/docker-compose.yaml)
-     - [Promtail Configuration Example](https://github.com/black-rosary/loki-nginx/blob/master/promtail/promtail.yml) (Adapt it as needed)
-
-4. Testing:
-   - Verify that the configured logging stack and your application work as expected.
-
-## Task 2: Documentation and Reporting
-
-**4 Points:**
-
-1. Logging Stack Report:
-   - Create a new file named `LOGGING.md` to document how the logging stack you've set up functions.
-   - Provide detailed explanations of each component's role within the stack.
-
-2. Screenshots:
-   - Capture screenshots that demonstrate the successful operation of your logging stack.
-   - Include these screenshots in your `LOGGING.md` report for reference.
-
-## Bonus Task: Additional Configuration
-
-**2.5 Points:**
-
-1. Integrating Your Extra App:
-   - Extend the `docker-compose.yml` configuration to include your additional application.
-
-2. Configure Stack for Comprehensive Logging:
-   - Modify the logging stack's configuration to collect logs from all containers defined in the `docker-compose.yml`.
-   - Include screenshots in your `LOGGING.md` report to demonstrate your success.
-
-### Guidelines
-
-- Ensure that your documentation in `LOGGING.md` is well-structured and comprehensible.
-- Follow proper naming conventions for files and folders.
-- Use code blocks and Markdown formatting where appropriate.
-- Create pull requests (PRs) as needed: from your fork to the main branch of this repository, and from your fork's branch to your fork's master branch.
-
-> Note: Thoroughly document your work, and ensure the logging stack functions correctly. Utilize the bonus points opportunity to enhance your understanding and the completeness of your setup.
diff --git a/lab8.md b/lab8.md
deleted file mode 100644
index 8eb0752ec7..0000000000
--- a/lab8.md
+++ /dev/null
@@ -1,71 +0,0 @@
-# Lab 8: Monitoring with Prometheus
-
-## Overview
-
-In this lab, you will become acquainted with Prometheus, set it up, and configure applications to collect metrics.
-
-## Task 1: Prometheus Setup
-
-**6 Points:**
-
-1. Learn About Prometheus:
-   - Begin by reading about Prometheus and its fundamental concepts:
-     - [Prometheus Overview](https://prometheus.io/docs/introduction/overview/)
-     - [Prometheus Naming Best Practices](https://prometheus.io/docs/practices/naming/)
-
-2. Integration with Docker Compose:
-   - Expand your existing `docker-compose.yml` file from the previous lab to include Prometheus.
-
-3. Prometheus Configuration:
-   - Configure Prometheus to collect metrics from both Loki and Prometheus containers.
-
-4. Verify Prometheus Targets:
-   - Access `http://localhost:9090/targets` to ensure that Prometheus is correctly scraping metrics.
-   - Capture screenshots that confirm the successful setup and place them in a file named `METRICS.md` within the monitoring folder.
-
-## Task 2: Dashboard and Configuration Enhancements
-
-**4 Points:**
-
-1. Grafana Dashboards:
-   - Set up dashboards in Grafana for both Loki and Prometheus.
-   - You can use examples as references:
-     - [Example Dashboard for Loki](https://grafana.com/grafana/dashboards/13407)
-     - [Example Dashboard for Prometheus](https://grafana.com/grafana/dashboards/3662)
-   - Capture screenshots displaying your successful dashboard configurations and include them in `METRICS.md`.
-
-2. Service Configuration Updates:
-   - Enhance the configuration of all services in the `docker-compose.yml` file:
-     - Add log rotation mechanisms.
-     - Specify memory limits for containers.
-   - Ensure these changes are documented within your `METRICS.md` file.
-
-3. Metrics Gathering:
-   - Extend Prometheus to gather metrics from all services defined in the `docker-compose.yml` file.
-
-## Bonus Task: Metrics and Health Checks
-
-**To Earn 2.5 Additional Points:**
-
-1. Application Metrics:
-   - Integrate metrics into your applications. You can refer to Python examples like:
-     - [Monitoring a Synchronous Python Web Application](https://dzone.com/articles/monitoring-your-synchronous-python-web-application)
-     - [Metrics Monitoring in Python](https://opensource.com/article/18/4/metrics-monitoring-and-python)
-
-2. Obtain Application Metrics:
-   - Configure your applications to export metrics.
-
-3. METRICS.md Update:
-   - Document your progress with the bonus tasks, including screenshots, in the `METRICS.md` file.
-
-4. Health Checks:
-   - Further enhance the `docker-compose.yml` file's service configurations by adding health checks for the containers.
-
-### Guidelines
-
-- Maintain a well-structured and comprehensible `METRICS.md` document.
-- Adhere to file and folder naming conventions.
-- Utilize code blocks and Markdown formatting where appropriate.
-- Create pull requests (PRs) as needed: from your fork to the main branch of this repository, and from your fork's branch to your fork's master branch.
-
-> Note: Ensure thorough documentation of your work, and guarantee that Prometheus correctly collects metrics. Take advantage of the bonus tasks to deepen your understanding and enhance the completeness of your setup.
diff --git a/lab9.md b/lab9.md
deleted file mode 100644
index 5493f042a6..0000000000
--- a/lab9.md
+++ /dev/null
@@ -1,76 +0,0 @@
-# Lab 9: Introduction to Kubernetes
-
-## Overview
-
-In this lab, you will explore Kubernetes, set up a local development environment, and create manifests for your application.
-
-## Task 1: Kubernetes Setup and Basic Deployment
-
-**6 Points:**
-
-1. Learn About Kubernetes:
-   - Begin by studying the fundamentals of Kubernetes:
-     - [What is Kubernetes](https://kubernetes.io/docs/concepts/overview/what-is-kubernetes/)
-     - [Kubernetes Components](https://kubernetes.io/docs/concepts/overview/components/)
-
-2. Install Kubernetes Tools:
-   - Install `kubectl` and `minikube`, essential tools for managing Kubernetes.
-     - [Kubernetes Tools](https://kubernetes.io/docs/tasks/tools/)
-
-3. Deploy Your Application:
-   - Deploy your application within the Minikube cluster using the `kubectl create` command. Create a `Deployment` resource for your app.
-     - [Example of Creating a Deployment](https://kubernetes.io/docs/tutorials/hello-minikube/#create-a-deployment)
-     - [Deployment Overview](https://kubernetes.io/docs/tutorials/kubernetes-basics/deploy-app/deploy-intro/)
-
-4. Access Your Application:
-   - Make your application accessible from outside the Kubernetes virtual network. Achieve this by creating a `Service` resource.
-     - [Example of Creating a Service](https://kubernetes.io/docs/tutorials/hello-minikube/#create-a-service)
-     - [Service Overview](https://kubernetes.io/docs/tutorials/kubernetes-basics/expose/expose-intro/)
-
-5. Create a Kubernetes Folder:
-   - Establish a `k8s` folder within your repository.
-   - Create a `README.md` report within this folder and include the output of the `kubectl get pods,svc` command.
-
-6. Cleanup:
-   - Remove the `Deployment` and `Service` resources that you created, maintaining a tidy Kubernetes environment.
-
-## Task 2: Declarative Kubernetes Manifests
-
-**4 Points:**
-
-1. Manifest Files for Your Application:
-   - As a more efficient and structured approach, employ configuration files to deploy your application.
-   - Create a `deployment.yml` manifest file that describes your app's deployment, specifying at least 3 replicas.
-     - [Kubernetes Deployment](https://kubernetes.io/docs/concepts/workloads/controllers/deployment/)
-     - [Declarative Management of Kubernetes Objects Using Configuration Files](https://kubernetes.io/docs/tasks/manage-kubernetes-objects/declarative-config/)
-
-2. Service Manifest:
-   - Develop a `service.yml` manifest file for your application.
-
-3. Manifest Files in `k8s` Folder:
-   - Store these manifest files in the `k8s` folder of your repository.
-   - Additionally, provide the output of the `kubectl get pods,svc` command in the `README.md` report.
-   - Include the output of the `minikube service --all` command and the result from your browser, with a screenshot demonstrating that the IP matches the output of `minikube service --all`.
-
-## Bonus Task: Additional Configuration and Ingress
-
-**To Earn 2.5 Additional Points:**
-
-1. Manifests for Extra App:
-   - Create `deployment` and `service` manifests for an additional application.
-
-2. Ingress Manifests:
-   - Construct [Ingress manifests](https://kubernetes.io/docs/tasks/access-application-cluster/ingress-minikube/) for your applications.
-
-3. Application Availability Check:
-   - Utilize `curl` or a similar tool to verify the availability of your applications. Include the output in the report.
-
-**Guidelines:**
-
-- Maintain a clear and well-structured `README.md` document.
-- Ensure that all required components are included.
-- Adhere to file and folder naming conventions.
-- Create and participate in PRs to facilitate the peer review process.
-- Create pull requests (PRs) as needed: from your fork to the main branch of this repository, and from your fork's branch to your fork's master branch.
-
-> Note: Detailed documentation is crucial to ensure that your Kubernetes deployment is fully functional and accessible. Engage with the bonus tasks to further enhance your understanding and application deployment skills.
diff --git a/labs/docs/LAB08.md b/labs/docs/LAB08.md
new file mode 100644
index 0000000000..4b47e9ea29
--- /dev/null
+++ b/labs/docs/LAB08.md
@@ -0,0 +1,259 @@
+# Lab 8 — Metrics & Monitoring with Prometheus
+
+## Architecture
+Key components:
+- `testiks-app`: exposes Prometheus metrics at `GET /metrics`
+- `Prometheus`: scrapes metrics (pull model) and stores time-series in TSDB
+- `Grafana`: visualizes Prometheus metrics with dashboards (PromQL)
+- `Loki`: remains in the stack for logs, complementing metrics
+
+
+### Diagram:
+
+```mermaid
+flowchart LR
+  P[Prometheus :9090] --> |scrape| A[py app :5000]
+  G[Grafana :3000] --> |query| P
+  G --> |query| D[Dashboards with metrics]
+  P --> |scrape| L[Loki :3100]
+  PT[Promtail :9080] --> |push| L
+  DC[Docker containers] --> |logs| PT
+```
+
+Data flow:
+- Py app exposes metrics at `/metrics` using the Prometheus client library
+- Prometheus scrapes all targets (app, itself, Loki, Grafana)
+- Grafana queries Prometheus via PromQL to render dashboard panels
+- Loki receives logs from Promtail, while Prometheus scrapes Loki's own metrics
+- Grafana combines both data sources for full observability (logs + metrics)
+
+### Why these metrics
+- Counter (`http_requests_total`): Useful for calculating request rates and error rates over time windows
+- Histogram (`http_request_duration_seconds`): Provides bucketed latency distribution, enabling percentile calculations (p50, p95, p99)
+- Gauge (`http_requests_in_progress`): Can go up and down: shows current load on the service
+- Business metrics (`devops_info_endpoint_calls`): Track which endpoints are most popular beyond raw HTTP metrics
+
+The `/metrics` endpoint itself is excluded from tracking to avoid feedback loops
+
+## Application Instrumentation
+### Metrics
+We track the standard RED metrics with low-cardinality labels like `method`, normalized `endpoint`, and `status_code`:
+
+- **Counter** `http_requests_total{method,endpoint,status_code}`  
+  Counts all HTTP requests. Useful for monitoring request rates and errors.
+- **Histogram** `http_request_duration_seconds_bucket{method,endpoint,...}`  
+  Measures latency distribution. We use this to calculate p95 and create heatmaps.
+- **Gauge** `http_requests_in_progress`  
+  Shows the number of ongoing HTTP requests at any moment.
+
+App-specific Metrics:
+- **Counter** `devops_info_endpoint_calls{endpoint}`  
+  Tracks usage for specific endpoints like `"/"` and `"/health"`
+- **Histogram** `devops_info_system_collection_seconds`  
+  Measures the time spent collecting system info within a request
+
+**Label Design Note**: Endpoint labels are normalized using Flask route rules (for example `"/health"`). We deliberately avoid using user IDs or raw paths to prevent high label cardinality.
+
+![all working](./screenshots/metrics.png)
+
+### Code Location
+- Metrics are implemented in: `./ansible/app_python/app.py`:
+```python
+http_requests_total = Counter(
+    'http_requests_total',
+    'Total HTTP requests',
+    ['method', 'endpoint', 'status']
+)
+
+http_request_duration_seconds = Histogram(
+    'http_request_duration_seconds',
+    'HTTP request duration',
+    ['method', 'endpoint']
+)
+
+http_requests_in_progress = Gauge(
+    'http_requests_in_progress',
+    'HTTP requests currently being processed'
+)
+
+```
+
+### Local Testing
+```bash
+cd app_python
+pip install -r requirements.txt
+python3 app.py
+curl -s http://localhost:5000/metrics | head -n 40
+```
+
+## Prometheus Configuration
+### Docker Compose Setup
+
+The monitoring stack is defined in `monitoring/docker-compose.yml`.
+
+Key settings:
+- Prometheus image: prom/prometheus:v3.9.0
+- Scrape interval: 15s
+- Retention:
+    - `--storage.tsdb.retention.time=15d`
+    - `--storage.tsdb.retention.size=10GB`
+
+Persistent volume: `prometheus-data:/prometheus`
+
+Connected to the same logging network as Loki and Grafana (from Lab 7)
+
+### Scrape Targets:
+
+Prometheus configuration is in `monitoring/prometheus/prometheus.yml`. Jobs include:
+- prometheus: localhost:9090
+- app: app-python:5000 (path: `/metrics`)
+- loki: loki:3100 (path: `/metrics`)
+- grafana: grafana:3000 (path: `/metrics`)
+
+![alt text](./screenshots/allgreen.png)
+
+## Grafana Dashboard Walkthrough
+
+### Request Rate (time series)
+Shows throughput per endpoint (RED metric “Rate”):
+
+`sum by (endpoint) (rate(http_requests_total[5m]))`
+
+![alt text](./screenshots/endpoints.png)
+
+### Error Rate (5xx) (time series)
+Tracks server errors:
+
+`sum(rate(http_requests_total{status_code=~"5.."}[5m]))`
+
+![alt text](./screenshots/500.png)
+
+### Latency Heatmap (heatmap)
+Visualizes latency distribution:
+
+`sum by (le) (rate(http_request_duration_seconds_bucket[5m]))`
+
+![alt text](./screenshots/latency.png)
+
+### Active Requests (stat/time series)
+Displays ongoing requests:
+
+`http_requests_in_progress`
+
+![alt text](./screenshots/progress.png)
+
+### Status Code Distribution (pie chart)
+Breakdown of 2xx/4xx/5xx responses:
+
+`sum by (status_code) (rate(http_requests_total[5m]))`
+
+![alt text](./screenshots/allreq.png)
+
+
+### Uptime (app target) (stat)
+Shows app availability:
+
+`up{job="app"}`
+
+![alt text](./screenshots/up.png)
+
+### CPU usage rate
+Shows app CPU consumption:
+
+`rate(process_cpu_seconds_total{job="app"}[5m]) * 100`
+
+![CPU usage rate](./screenshots/image.png)
+
+## Production Setup
+
+### Health checks
+
+| Service      | Check                                           | Interval | Retries |
+|-------------|-------------------------------------------------|----------|---------|
+| Prometheus  | `wget http://localhost:9090/-/healthy`         | 10s      | 5       |
+| Loki        | `wget http://localhost:3100/ready`             | 10s      | 5       |
+| Grafana     | `curl http://localhost:3000/api/health`        | 10s      | 5       |
+| app-python  | `urllib.request.urlopen('http://localhost:5000/health')` | 10s      | 5       |
+
+---
+
+### Resource limits
+
+| Service      | CPU Limit | Memory Limit | CPU Reserved | Memory Reserved |
+|-------------|-----------|--------------|--------------|----------------|
+| Prometheus  | 1.0       | 1 GB         | 0.25         | 256 MB         |
+| Loki        | 1.0       | 1 GB         | 0.25         | 256 MB         |
+| Grafana     | 0.5       | 512 MB       | 0.25         | 256 MB         |
+| app-python  | 0.5       | 256 MB       | 0.1          | 64 MB          |
+| Promtail    | 0.5       | 512 MB       | 0.1          | 128 MB         |
+
+---
+
+### Retention policies
+
+- **Prometheus**: 15 days / 10 GB (whichever limit is reached first)  
+- **Loki**: 168 hours (7 days), configured via `limits_config.retention_period`
+
+---
+
+### Persistent volumes
+
+| Volume           | Service     | Mount Point          | Purpose                          |
+|-----------------|------------|--------------------|----------------------------------|
+| `prometheus-data` | Prometheus | `/prometheus`      | TSDB storage                     |
+| `loki-data`      | Loki       | `/loki`            | Log chunks and index             |
+| `grafana-data`   | Grafana    | `/var/lib/grafana` | Dashboards, users, settings      |
+
+> Data survives `docker compose down` + `docker compose up -d`.
+
+---
+
+## Testing Results
+
+### Verification steps
+
+```bash
+cd monitoring
+echo 'GRAFANA_ADMIN_PASSWORD=testpass' > .env
+docker compose up -d
+
+docker compose ps
+
+curl http://localhost:9090/api/v1/targets | jq '.data.activeTargets[].health'
+curl http://localhost:8000/metrics
+
+curl -u admin:testpass http://localhost:3000/api/datasources
+
+# Test persistence
+docker compose down
+docker compose up -d
+# Dashboards and data should persist
+```
+
+Persistence evidence:
+
+![Persistence evidence](./screenshots/image-1.png)
+
+## Metrics vs Logs — When to Use Each
+
+| Aspect         | Metrics (Prometheus)                     | Logs (Loki)                       |
+|----------------|----------------------------------------|----------------------------------|
+| Purpose        | Numeric measurements over time         | Event records with context       |
+| Use when       | "How many?", "How fast?", "How much?" | "What happened?", "Why did it fail?" |
+| Alerting       | Ideal — threshold-based alerts on rates | Possible but less efficient      |
+| Storage        | Compact (numeric time series)          | Verbose (full text)              |
+| Query          | PromQL — aggregations, rates, percentiles | LogQL — filter, parse, aggregate |
+| Example        | "Error rate > 5% in last 5 min"       | "Show me the stack trace for request X" |
+| Cardinality    | Keep low (avoid high-cardinality labels) | Naturally high (each log is unique) |
+
+**Best practice:** Use metrics for detection (something is wrong), logs for investigation (why it’s wrong)
+
+
+## Challenges & Solutions
+
+| Challenge                              | Solution                                                                 |
+|----------------------------------------|-------------------------------------------------------------------------|
+| Metrics endpoint creating feedback loops | Excluded `/metrics` path from request tracking in `before_request` / `after_request` hooks |
+| Grafana data source UID mismatch        | Used provisioning YAML to auto-configure Prometheus and Loki data sources |
+| Prometheus container health check       | Used `wget` instead of `curl` since the `prom/prometheus` image is BusyBox-based and ships no `curl` |
+| Dashboard persistence across restarts   | Used Grafana provisioning with JSON files mounted as volumes            |
\ No newline at end of file
diff --git a/labs/docs/screenshots/500.png b/labs/docs/screenshots/500.png
new file mode 100644
index 0000000000..3aff243056
Binary files /dev/null and b/labs/docs/screenshots/500.png differ
diff --git a/labs/docs/screenshots/allgreen.png b/labs/docs/screenshots/allgreen.png
new file mode 100644
index 0000000000..61ae8110c2
Binary files /dev/null and b/labs/docs/screenshots/allgreen.png differ
diff --git a/labs/docs/screenshots/allreq.png b/labs/docs/screenshots/allreq.png
new file mode 100644
index 0000000000..743d770919
Binary files /dev/null and b/labs/docs/screenshots/allreq.png differ
diff --git a/labs/docs/screenshots/endpoints.png b/labs/docs/screenshots/endpoints.png
new file mode 100644
index 0000000000..4cc70766b4
Binary files /dev/null and b/labs/docs/screenshots/endpoints.png differ
diff --git a/labs/docs/screenshots/image-1.png b/labs/docs/screenshots/image-1.png
new file mode 100644
index 0000000000..9f1781d97c
Binary files /dev/null and b/labs/docs/screenshots/image-1.png differ
diff --git a/labs/docs/screenshots/image.png b/labs/docs/screenshots/image.png
new file mode 100644
index 0000000000..241124d6d6
Binary files /dev/null and b/labs/docs/screenshots/image.png differ
diff --git a/labs/docs/screenshots/latency.png b/labs/docs/screenshots/latency.png
new file mode 100644
index 0000000000..29690493bf
Binary files /dev/null and b/labs/docs/screenshots/latency.png differ
diff --git a/labs/docs/screenshots/metrics.png b/labs/docs/screenshots/metrics.png
new file mode 100644
index 0000000000..0b988a8377
Binary files /dev/null and b/labs/docs/screenshots/metrics.png differ
diff --git a/labs/docs/screenshots/progress.png b/labs/docs/screenshots/progress.png
new file mode 100644
index 0000000000..384de84ea2
Binary files /dev/null and b/labs/docs/screenshots/progress.png differ
diff --git a/labs/docs/screenshots/up.png b/labs/docs/screenshots/up.png
new file mode 100644
index 0000000000..92535b5601
Binary files /dev/null and b/labs/docs/screenshots/up.png differ
diff --git a/labs/lab01.md b/labs/lab01.md
new file mode 100644
index 0000000000..18c9ff6c43
--- /dev/null
+++ b/labs/lab01.md
@@ -0,0 +1,693 @@
+# Lab 1 — DevOps Info Service: Web Application Development
+
+![difficulty](https://img.shields.io/badge/difficulty-beginner-success)
+![topic](https://img.shields.io/badge/topic-Web%20Development-blue)
+![points](https://img.shields.io/badge/points-10%2B2.5-orange)
+![languages](https://img.shields.io/badge/languages-Python%20|%20Go-informational)
+
+> Build a DevOps info service that reports system information and health status. This service will evolve throughout the course into a comprehensive monitoring tool.
+
+## Overview
+
+Create a **DevOps Info Service** - a web application providing detailed information about itself and its runtime environment. This foundation will grow throughout the course as you add containerization, CI/CD, monitoring, and persistence.
+
+**What You'll Learn:**
+- Web framework selection and implementation
+- System introspection and API design
+- Python best practices and documentation
+- Foundation for future DevOps tooling
+
+**Tech Stack:** Python 3.11+ | Flask 3.1 or FastAPI 0.115
+
+---
+
+## Tasks
+
+### Task 1 — Python Web Application (6 pts)
+
+Build a production-ready Python web service with comprehensive system information.
+
+#### 1.1 Project Structure
+
+Create this structure:
+
+```
+app_python/
+├── app.py                    # Main application
+├── requirements.txt          # Dependencies
+├── .gitignore               # Git ignore
+├── README.md                # App documentation
+├── tests/                   # Unit tests (Lab 3)
+│   └── __init__.py
+└── docs/                    # Lab documentation
+    ├── LAB01.md            # Your lab submission
+    └── screenshots/        # Proof of work
+        ├── 01-main-endpoint.png
+        ├── 02-health-check.png
+        └── 03-formatted-output.png
+```
+
+#### 1.2 Choose Web Framework
+
+Select and justify your choice:
+- **Flask** - Lightweight, easy to learn
+- **FastAPI** - Modern, async, auto-documentation
+- **Django** - Full-featured, includes ORM
+
+Document your decision in `app_python/docs/LAB01.md`.
+
+#### 1.3 Implement Main Endpoint: `GET /`
+
+Return comprehensive service and system information:
+
+```json
+{
+  "service": {
+    "name": "devops-info-service",
+    "version": "1.0.0",
+    "description": "DevOps course info service",
+    "framework": "Flask"
+  },
+  "system": {
+    "hostname": "my-laptop",
+    "platform": "Linux",
+    "platform_version": "Ubuntu 24.04",
+    "architecture": "x86_64",
+    "cpu_count": 8,
+    "python_version": "3.13.1"
+  },
+  "runtime": {
+    "uptime_seconds": 3600,
+    "uptime_human": "1 hour, 0 minutes",
+    "current_time": "2026-01-07T14:30:00.000Z",
+    "timezone": "UTC"
+  },
+  "request": {
+    "client_ip": "127.0.0.1",
+    "user_agent": "curl/7.81.0",
+    "method": "GET",
+    "path": "/"
+  },
+  "endpoints": [
+    {"path": "/", "method": "GET", "description": "Service information"},
+    {"path": "/health", "method": "GET", "description": "Health check"}
+  ]
+}
+```
+
+<details>
+<summary>💡 Implementation Hints</summary>
+
+**Get System Information:**
+```python
+import platform
+import socket
+from datetime import datetime
+
+hostname = socket.gethostname()
+platform_name = platform.system()
+architecture = platform.machine()
+python_version = platform.python_version()
+```
+
+**Calculate Uptime:**
+```python
+start_time = datetime.now()
+
+def get_uptime():
+    delta = datetime.now() - start_time
+    seconds = int(delta.total_seconds())
+    hours = seconds // 3600
+    minutes = (seconds % 3600) // 60
+    return {
+        'seconds': seconds,
+        'human': f"{hours} hours, {minutes} minutes"
+    }
+```
+
+**Request Information:**
+```python
+# Flask
+request.remote_addr  # Client IP
+request.headers.get('User-Agent')  # User agent
+request.method  # HTTP method
+request.path  # Request path
+
+# FastAPI
+request.client.host
+request.headers.get('user-agent')
+request.method
+request.url.path
+```
+
+</details>
+
+#### 1.4 Implement Health Check: `GET /health`
+
+Simple health endpoint for monitoring:
+
+```json
+{
+  "status": "healthy",
+  "timestamp": "2024-01-15T14:30:00.000Z",
+  "uptime_seconds": 3600
+}
+```
+
+Return HTTP 200 for healthy status. This will be used for Kubernetes probes in Lab 9.
+
+<details>
+<summary>💡 Implementation Hints</summary>
+
+```python
+# Flask
+@app.route('/health')
+def health():
+    return jsonify({
+        'status': 'healthy',
+        'timestamp': datetime.now(timezone.utc).isoformat(),
+        'uptime_seconds': get_uptime()['seconds']
+    })
+
+# FastAPI
+@app.get("/health")
+def health():
+    return {
+        'status': 'healthy',
+        'timestamp': datetime.now(timezone.utc).isoformat(),
+        'uptime_seconds': get_uptime()['seconds']
+    }
+```
+
+</details>
+
+#### 1.5 Configuration
+
+Make your app configurable via environment variables:
+
+```python
+import os
+
+HOST = os.getenv('HOST', '0.0.0.0')
+PORT = int(os.getenv('PORT', 5000))
+DEBUG = os.getenv('DEBUG', 'False').lower() == 'true'
+```
+
+**Test:**
+```bash
+python app.py                    # Default: 0.0.0.0:5000
+PORT=8080 python app.py          # Custom port
+HOST=127.0.0.1 PORT=3000 python app.py
+```
+
+---
+
+### Task 2 — Documentation & Best Practices (4 pts)
+
+#### 2.1 Application README (`app_python/README.md`)
+
+Create user-facing documentation:
+
+**Required Sections:**
+1. **Overview** - What the service does
+2. **Prerequisites** - Python version, dependencies
+3. **Installation**
+   ```bash
+   python -m venv venv
+   source venv/bin/activate
+   pip install -r requirements.txt
+   ```
+4. **Running the Application**
+   ```bash
+   python app.py
+   # Or with custom config
+   PORT=8080 python app.py
+   ```
+5. **API Endpoints**
+   - `GET /` - Service and system information
+   - `GET /health` - Health check
+6. **Configuration** - Environment variables table
+
+#### 2.2 Best Practices
+
+Implement these in your code:
+
+**1. Clean Code Organization**
+- Clear function names
+- Proper imports grouping
+- Comments only where needed
+- Follow PEP 8
+
+<details>
+<summary>💡 Example Structure</summary>
+
+```python
+"""
+DevOps Info Service
+Main application module
+"""
+import os
+import socket
+import platform
+from datetime import datetime, timezone
+from flask import Flask, jsonify, request
+
+app = Flask(__name__)
+
+# Configuration
+HOST = os.getenv('HOST', '0.0.0.0')
+PORT = int(os.getenv('PORT', 5000))
+
+# Application start time
+START_TIME = datetime.now(timezone.utc)
+
+def get_system_info():
+    """Collect system information."""
+    return {
+        'hostname': socket.gethostname(),
+        'platform': platform.system(),
+        'architecture': platform.machine(),
+        'python_version': platform.python_version()
+    }
+
+@app.route('/')
+def index():
+    """Main endpoint - service and system information."""
+    # Implementation
+```
+
+</details>
+
+**2. Error Handling**
+
+<details>
+<summary>💡 Implementation</summary>
+
+```python
+@app.errorhandler(404)
+def not_found(error):
+    return jsonify({
+        'error': 'Not Found',
+        'message': 'Endpoint does not exist'
+    }), 404
+
+@app.errorhandler(500)
+def internal_error(error):
+    return jsonify({
+        'error': 'Internal Server Error',
+        'message': 'An unexpected error occurred'
+    }), 500
+```
+
+</details>
+
+**3. Logging**
+
+<details>
+<summary>💡 Implementation</summary>
+
+```python
+import logging
+
+logging.basicConfig(
+    level=logging.INFO,
+    format='%(asctime)s - %(name)s - %(levelname)s - %(message)s'
+)
+logger = logging.getLogger(__name__)
+
+logger.info('Application starting...')
+logger.debug(f'Request: {request.method} {request.path}')
+```
+
+</details>
+
+**4. Dependencies (`requirements.txt`)**
+
+```txt
+# Web Framework
+Flask==3.1.0
+# or
+fastapi==0.115.0
+uvicorn[standard]==0.32.0  # Includes performance extras
+```
+
+Pin exact versions for reproducibility.
+
+**5. Git Ignore (`.gitignore`)**
+
+```gitignore
+# Python
+__pycache__/
+*.py[cod]
+venv/
+*.log
+
+# IDE
+.vscode/
+.idea/
+
+# OS
+.DS_Store
+```
+
+#### 2.3 Lab Submission (`app_python/docs/LAB01.md`)
+
+Document your implementation:
+
+**Required Sections:**
+1. **Framework Selection**
+   - Your choice and why
+   - Comparison table with alternatives
+2. **Best Practices Applied**
+   - List practices with code examples
+   - Explain importance of each
+3. **API Documentation**
+   - Request/response examples
+   - Testing commands
+4. **Testing Evidence**
+   - Screenshots showing endpoints work
+   - Terminal output
+5. **Challenges & Solutions**
+   - Problems encountered
+   - How you solved them
+
+**Required Screenshots:**
+- Main endpoint showing complete JSON
+- Health check response
+- Formatted/pretty-printed output
+
+#### 2.4 GitHub Community Engagement
+
+**Objective:** Explore GitHub's social features that support collaboration and discovery.
+
+**Actions Required:**
+1. **Star** the course repository
+2. **Star** the [simple-container-com/api](https://github.com/simple-container-com/api) project — a promising open-source tool for container management
+3. **Follow** your professor and TAs on GitHub:
+   - Professor: [@Cre-eD](https://github.com/Cre-eD)
+   - TA: [@marat-biriushev](https://github.com/marat-biriushev)
+   - TA: [@pierrepicaud](https://github.com/pierrepicaud)
+4. **Follow** at least 3 classmates from the course
+
+**Document in LAB01.md:**
+
+Add a "GitHub Community" section (after Challenges & Solutions) with 1-2 sentences explaining:
+- Why starring repositories matters in open source
+- How following developers helps in team projects and professional growth
+
+<details>
+<summary>💡 GitHub Social Features</summary>
+
+**Why Stars Matter:**
+
+**Discovery & Bookmarking:**
+- Stars help you bookmark interesting projects for later reference
+- Star count indicates project popularity and community trust
+- Starred repos appear in your GitHub profile, showing your interests
+
+**Open Source Signal:**
+- Stars encourage maintainers (shows appreciation)
+- High star count attracts more contributors
+- Helps projects gain visibility in GitHub search and recommendations
+
+**Professional Context:**
+- Shows you follow best practices and quality projects
+- Indicates awareness of industry tools and trends
+
+**Why Following Matters:**
+
+**Networking:**
+- See what other developers are working on
+- Discover new projects through their activity
+- Build professional connections beyond the classroom
+
+**Learning:**
+- Learn from others' code and commits
+- See how experienced developers solve problems
+- Get inspiration for your own projects
+
+**Collaboration:**
+- Stay updated on classmates' work
+- Easier to find team members for future projects
+- Build a supportive learning community
+
+**Career Growth:**
+- Follow thought leaders in your technology stack
+- See trending projects in real-time
+- Build visibility in the developer community
+
+**GitHub Best Practices:**
+- Star repos you find useful (not spam)
+- Follow developers whose work interests you
+- Engage meaningfully with the community
+- Your GitHub activity shows employers your interests and involvement
+
+</details>
+
+---
+
+## Bonus Task — Compiled Language (2.5 pts)
+
+Implement the same service in a compiled language to prepare for multi-stage Docker builds (Lab 2).
+
+**Choose One:**
+- **Go** (Recommended) - Small binaries, fast compilation
+- **Rust** - Memory safety, modern features
+- **Java/Spring Boot** - Enterprise standard
+- **C#/ASP.NET Core** - Cross-platform .NET
+
+**Structure:**
+
+```
+app_go/  (or app_rust, app_java, etc.)
+├── main.go
+├── go.mod
+├── README.md
+└── docs/
+    ├── LAB01.md              # Implementation details
+    ├── GO.md                 # Language justification
+    └── screenshots/
+```
+
+**Requirements:**
+- Same two endpoints: `/` and `/health`
+- Same JSON structure
+- Document build process
+- Compare the compiled binary's size with the Python version's footprint
+
+<details>
+<summary>💡 Go Example Skeleton</summary>
+
+```go
+package main
+
+import (
+    "encoding/json"
+    "net/http"
+    "os"
+    "runtime"
+    "time"
+)
+
+type ServiceInfo struct {
+    Service  Service  `json:"service"`
+    System   System   `json:"system"`
+    Runtime  Runtime  `json:"runtime"`
+    Request  Request  `json:"request"`
+}
+
+var startTime = time.Now()
+
+func mainHandler(w http.ResponseWriter, r *http.Request) {
+    info := ServiceInfo{
+        Service: Service{
+            Name:    "devops-info-service",
+            Version: "1.0.0",
+        },
+        System: System{
+            Platform:     runtime.GOOS,
+            Architecture: runtime.GOARCH,
+            CPUCount:     runtime.NumCPU(),
+        },
+        // ... implement rest
+    }
+
+    w.Header().Set("Content-Type", "application/json")
+    json.NewEncoder(w).Encode(info)
+}
+
+func main() {
+    http.HandleFunc("/", mainHandler)
+    http.HandleFunc("/health", healthHandler)
+
+    port := os.Getenv("PORT")
+    if port == "" {
+        port = "8080"
+    }
+
+    http.ListenAndServe(":"+port, nil)
+}
+```
+
+</details>
+
+---
+
+## How to Submit
+
+1. **Create Branch:**
+   ```bash
+   git checkout -b lab01
+   ```
+
+2. **Commit Work:**
+   ```bash
+   git add app_python/
+   git commit -m "feat: implement lab01 devops info service"
+   git push -u origin lab01
+   ```
+
+3. **Create Pull Requests:**
+   - **PR #1:** `your-fork:lab01` → `course-repo:master`
+   - **PR #2:** `your-fork:lab01` → `your-fork:master`
+
+4. **Verify:**
+   - All files present
+   - Screenshots included
+   - Documentation complete
+
+---
+
+## Acceptance Criteria
+
+### Main Tasks (10 points)
+
+**Application Functionality (3 pts):**
+- [ ] Service runs without errors
+- [ ] `GET /` returns all required fields:
+  - [ ] Service metadata (name, version, description, framework)
+  - [ ] System info (hostname, platform, architecture, CPU, Python version)
+  - [ ] Runtime info (uptime, current time, timezone)
+  - [ ] Request info (client IP, user agent, method, path)
+  - [ ] Endpoints list
+- [ ] `GET /health` returns status and uptime
+- [ ] Configurable via environment variables (PORT, HOST)
+
+**Code Quality (2 pts):**
+- [ ] Clean code structure
+- [ ] PEP 8 compliant
+- [ ] Error handling implemented
+- [ ] Logging configured
+
+**Documentation (3 pts):**
+- [ ] `app_python/README.md` complete with all sections
+- [ ] `app_python/docs/LAB01.md` includes:
+  - [ ] Framework justification
+  - [ ] Best practices documentation
+  - [ ] API examples
+  - [ ] Testing evidence
+  - [ ] Challenges solved
+  - [ ] GitHub Community section (why stars/follows matter)
+- [ ] All 3 required screenshots present
+- [ ] Course repository starred
+- [ ] simple-container-com/api repository starred
+- [ ] Professor and TAs followed on GitHub
+- [ ] At least 3 classmates followed on GitHub
+
+**Configuration (2 pts):**
+- [ ] `requirements.txt` with pinned versions
+- [ ] `.gitignore` properly configured
+- [ ] Environment variables working
+
+### Bonus Task (2.5 points)
+
+- [ ] Compiled language app implements both endpoints
+- [ ] Same JSON structure as Python version
+- [ ] `app_<language>/README.md` with build/run instructions
+- [ ] `app_<language>/docs/GO.md` (or the equivalent file for your chosen language) with language justification
+- [ ] `app_<language>/docs/LAB01.md` with implementation details
+- [ ] Screenshots showing compilation and execution
+
+---
+
+## Rubric
+
+| Criteria | Points | Description |
+|----------|--------|-------------|
+| **Functionality** | 3 pts | Both endpoints work with complete, correct data |
+| **Code Quality** | 2 pts | Clean, organized, follows Python standards |
+| **Documentation** | 3 pts | Complete README and lab submission docs |
+| **Configuration** | 2 pts | Dependencies, environment vars, .gitignore |
+| **Bonus** | 2.5 pts | Compiled language implementation |
+| **Total** | 12.5 pts | 10 pts required + 2.5 pts bonus |
+
+**Grading Scale:**
+- **10/10:** Perfect implementation, excellent documentation
+- **8-9/10:** All works, good docs, minor improvements possible
+- **6-7/10:** Core functionality present, basic documentation
+- **<6/10:** Missing features or documentation, needs revision
+
+---
+
+## Resources
+
+<details>
+<summary>📚 Python Web Frameworks</summary>
+
+- [Flask 3.1 Documentation](https://flask.palletsprojects.com/en/latest/)
+- [Flask Quickstart](https://flask.palletsprojects.com/en/latest/quickstart/)
+- [FastAPI Documentation](https://fastapi.tiangolo.com/)
+- [FastAPI Tutorial](https://fastapi.tiangolo.com/tutorial/first-steps/)
+- [Django 5.1 Documentation](https://docs.djangoproject.com/en/5.1/)
+
+</details>
+
+<details>
+<summary>🐍 Python Best Practices</summary>
+
+- [PEP 8 Style Guide](https://pep8.org/)
+- [Python Logging Tutorial](https://docs.python.org/3/howto/logging.html)
+- [Python platform module](https://docs.python.org/3/library/platform.html)
+- [Python socket module](https://docs.python.org/3/library/socket.html)
+
+</details>
+
+<details>
+<summary>🔧 Compiled Languages (Bonus)</summary>
+
+- [Go Web Development](https://golang.org/doc/articles/wiki/)
+- [Go net/http Package](https://pkg.go.dev/net/http)
+- [Rust Web Frameworks](https://www.arewewebyet.org/)
+- [Spring Boot Quickstart](https://spring.io/quickstart)
+- [ASP.NET Core Tutorial](https://docs.microsoft.com/aspnet/core/)
+
+</details>
+
+<details>
+<summary>🛠️ Development Tools</summary>
+
+- [Postman](https://www.postman.com/) - API testing
+- [HTTPie](https://httpie.io/) - Command-line HTTP client
+- [curl](https://curl.se/) - Data transfer tool
+- [jq](https://stedolan.github.io/jq/) - JSON processor
+
+</details>
+
+---
+
+## Looking Ahead
+
+This service evolves throughout the course:
+
+- **Lab 2:** Containerize with Docker, multi-stage builds
+- **Lab 3:** Add unit tests and CI/CD pipeline
+- **Lab 8:** Add `/metrics` endpoint for Prometheus
+- **Lab 9:** Deploy to Kubernetes using `/health` probes
+- **Lab 12:** Add `/visits` endpoint with file persistence
+- **Lab 13:** Multi-environment deployment with GitOps
+
+---
+
+**Good luck!** 🚀
+
+> **Remember:** Keep it simple, write clean code, and document thoroughly. This foundation will carry through all 16 labs!
diff --git a/labs/lab02.md b/labs/lab02.md
new file mode 100644
index 0000000000..1c3e032f89
--- /dev/null
+++ b/labs/lab02.md
@@ -0,0 +1,366 @@
+# Lab 2 — Docker Containerization
+
+![difficulty](https://img.shields.io/badge/difficulty-beginner-success)
+![topic](https://img.shields.io/badge/topic-Containerization-blue)
+![points](https://img.shields.io/badge/points-10%2B2.5-orange)
+![tech](https://img.shields.io/badge/tech-Docker-informational)
+
+> Containerize your Python app from Lab 1 using Docker best practices and publish it to Docker Hub.
+
+## Overview
+
+Take your Lab 1 application and package it into a Docker container. Learn image optimization, security basics, and the Docker workflow used in production.
+
+**What You'll Learn:**
+- Writing production-ready Dockerfiles
+- Docker best practices and security
+- Image optimization techniques
+- Docker Hub workflow
+
+**Tech Stack:** Docker 25+ | Python 3.13-slim | Multi-stage builds
+
+---
+
+## Tasks
+
+### Task 1 — Create Dockerfile (4 pts)
+
+**Objective:** Write a Dockerfile that containerizes your Python app following best practices.
+
+Create `app_python/Dockerfile` with these requirements:
+
+**Must Have:**
+- Non-root user (mandatory)
+- Specific base image version (e.g., `python:3.13-slim` or `python:3.12-slim`)
+- Only copy necessary files
+- Proper layer ordering
+- `.dockerignore` file
+
+**Your app should work the same way in the container as it did locally.**
+
+<details>
+<summary>💡 Dockerfile Concepts & Resources</summary>
+
+**Key Dockerfile Instructions to Research:**
+- `FROM` - Choose your base image (look at python:3.13-slim, python:3.12-slim, python:3.13-alpine)
+- `RUN` - Execute commands (creating users, installing packages)
+- `WORKDIR` - Set working directory
+- `COPY` - Copy files into the image
+- `USER` - Switch to non-root user
+- `EXPOSE` - Document which port your app uses
+- `CMD` - Define how to start your application
+
+**Critical Concepts:**
+- **Layer Caching**: Why does the order of COPY commands matter?
+- **Non-root User**: How do you create and switch to a non-root user?
+- **Base Image Selection**: What's the difference between slim, alpine, and full images?
+- **Dependency Installation**: Why copy requirements.txt separately from application code?
+
+**Resources:**
+- [Dockerfile Reference](https://docs.docker.com/reference/dockerfile/)
+- [Best Practices Guide](https://docs.docker.com/build/building/best-practices/)
+- [Python Image Variants](https://hub.docker.com/_/python) - Use 3.13-slim or 3.12-slim
+
+**Think About:**
+- What happens if you copy all files before installing dependencies?
+- Why shouldn't you run as root?
+- How does layer caching speed up rebuilds?
+
+</details>
+
+<details>
+<summary>💡 .dockerignore Concepts</summary>
+
+**Purpose:** Prevent unnecessary files from being sent to the Docker daemon during the build (faster builds, smaller context).
+
+**What Should You Exclude?**
+Think about what doesn't need to be in your container:
+- Development artifacts (like Python's `__pycache__`, `*.pyc`)
+- Version control files (`.git` directory)
+- IDE configuration files
+- Virtual environments (`venv/`, `.venv/`)
+- Documentation that's not needed at runtime
+- Test files (if not running tests in container)
+
+**Key Question:** Why does excluding files from the build context matter for build speed?
+
+**Resources:**
+- [.dockerignore Documentation](https://docs.docker.com/reference/dockerfile/#dockerignore-file)
+- Look at your `.gitignore` for inspiration - many patterns overlap
+
+**Exercise:** Start minimal and add exclusions as needed, rather than copying a huge list you don't understand.
+
+</details>
+
+**Test Your Container:**
+
+You should be able to:
+1. Build your image using the `docker build` command
+2. Run a container from your image with proper port mapping
+3. Access your application endpoints from the host machine
+
+Verify that your application works the same way in the container as it did locally.
+
+---
+
+### Task 2 — Docker Hub (2 pts)
+
+**Objective:** Publish your image to Docker Hub.
+
+**Requirements:**
+1. Create a Docker Hub account (if you don't have one)
+2. Tag your image with your Docker Hub username
+3. Authenticate with Docker Hub
+4. Push your image to the registry
+5. Verify the image is publicly accessible
+
+**Documentation Required:**
+- Terminal output showing successful push
+- Docker Hub repository URL
+- Explanation of your tagging strategy
+
+<details>
+<summary>💡 Docker Hub Resources</summary>
+
+**Useful Commands:**
+- `docker tag` - Tag images for registry push
+- `docker login` - Authenticate with Docker Hub
+- `docker push` - Upload image to registry
+- `docker pull` - Download image from registry
+
+**Resources:**
+- [Docker Hub Quickstart](https://docs.docker.com/docker-hub/quickstart/)
+- [Docker Tag Reference](https://docs.docker.com/reference/cli/docker/image/tag/)
+- [Best Practices for Tagging](https://docs.docker.com/build/building/best-practices/#tagging)
+
+</details>
+
+---
+
+### Task 3 — Documentation (4 pts)
+
+**Objective:** Document your Docker implementation with focus on understanding and decisions.
+
+#### 3.1 Update `app_python/README.md`
+
+Add a **Docker** section explaining how to use your containerized application. Include command patterns (not exact commands) for:
+- Building the image locally
+- Running a container
+- Pulling from Docker Hub
+
+#### 3.2 Create `app_python/docs/LAB02.md`
+
+Document your implementation with these sections:
+
+**Required Sections:**
+
+1. **Docker Best Practices Applied**
+   - List each practice you implemented (non-root user, layer caching, .dockerignore, etc.)
+   - Explain WHY each matters (not just what it does)
+   - Include relevant Dockerfile snippets with explanations
+
+2. **Image Information & Decisions**
+   - Base image chosen and justification (why this specific version?)
+   - Final image size and your assessment
+   - Layer structure explanation
+   - Optimization choices you made
+
+3. **Build & Run Process**
+   - Complete terminal output from your build process
+   - Terminal output showing container running
+   - Terminal output from testing endpoints (curl/httpie)
+   - Docker Hub repository URL
+
+4. **Technical Analysis**
+   - Why does your Dockerfile work the way it does?
+   - What would happen if you changed the layer order?
+   - What security considerations did you implement?
+   - How does .dockerignore improve your build?
+
+5. **Challenges & Solutions**
+   - Issues encountered during implementation
+   - How you debugged and resolved them
+   - What you learned from the process
+
+---
+
+## Bonus Task — Multi-Stage Build (2.5 pts)
+
+**Objective:** Containerize your compiled language app (from Lab 1 bonus) using multi-stage builds.
+
+**Why Multi-Stage?** Separate build environment from runtime → smaller final image.
+
+**Example Flow:**
+1. **Stage 1 (Builder):** Compile the app (large image with compilers)
+2. **Stage 2 (Runtime):** Copy only the binary (small image, no build tools)
+
+<details>
+<summary>💡 Multi-Stage Build Concepts</summary>
+
+**The Problem:** Compiled language images include the entire compiler/SDK in the final image (huge!).
+
+**The Solution:** Use multiple `FROM` statements:
+- **Stage 1 (Builder)**: Use full SDK image, compile your application
+- **Stage 2 (Runtime)**: Use minimal base image, copy only the compiled binary
+
+**Key Concepts to Research:**
+- How to name build stages (`AS builder`)
+- How to copy files from previous stages (`COPY --from=builder`)
+- Choosing runtime base images (alpine, distroless, scratch)
+- Static vs dynamic compilation (affects what base image you can use)
+
+**Questions to Explore:**
+- What's the size difference between your builder and final image?
+- Why can't you just use the builder image as your final image?
+- What security benefits come from smaller images?
+- Can you use `FROM scratch`? Why or why not?
+
+**Resources:**
+- [Multi-Stage Builds Documentation](https://docs.docker.com/build/building/multi-stage/)
+- [Distroless Base Images](https://github.com/GoogleContainerTools/distroless)
+- Language-specific: Search "Go static binary Docker" or "Rust alpine Docker"
+
+**Challenge:** Try to get your final image under 20MB.
+
+</details>
+
+**Requirements:**
+- Multi-stage Dockerfile in `app_go/` (or your chosen language)
+- Working containerized application
+- Documentation in `app_go/docs/LAB02.md` explaining:
+  - Your multi-stage build strategy
+  - Size comparison with analysis (builder vs final image)
+  - Why multi-stage builds matter for compiled languages
+  - Terminal output showing build process and image sizes
+  - Technical explanation of each stage's purpose
+
+**Bonus Points Given For:**
+- Significant size reduction achieved with clear metrics
+- Deep understanding of multi-stage build benefits
+- Analysis of security implications (smaller attack surface)
+- Explanation of trade-offs and decisions made
+
+---
+
+## How to Submit
+
+1. **Create Branch:** Create a new branch called `lab02`
+
+2. **Commit Work:**
+   - Add your changes (app_python/ directory with Dockerfile, .dockerignore, updated docs)
+   - Commit with a descriptive message following conventional commits format
+   - Push to your fork
+
+3. **Create Pull Requests:**
+   - **PR #1:** `your-fork:lab02` → `course-repo:master`
+   - **PR #2:** `your-fork:lab02` → `your-fork:master`
+
+---
+
+## Acceptance Criteria
+
+### Main Tasks (10 points)
+
+**Dockerfile (4 pts):**
+- [ ] Dockerfile exists in `app_python/`
+- [ ] Uses specific base image version
+- [ ] Runs as non-root user (USER directive)
+- [ ] Proper layer ordering (dependencies before code)
+- [ ] Only copies necessary files
+- [ ] `.dockerignore` file present
+- [ ] Image builds successfully
+- [ ] Container runs and app works
+
+**Docker Hub (2 pts):**
+- [ ] Image pushed to Docker Hub
+- [ ] Image is publicly accessible
+- [ ] Correct tagging used
+- [ ] Can pull and run from Docker Hub
+
+**Documentation (4 pts):**
+- [ ] `app_python/README.md` has Docker section with command patterns
+- [ ] `app_python/docs/LAB02.md` complete with:
+  - [ ] Best practices explained with WHY (not just what)
+  - [ ] Image information and justifications for choices
+  - [ ] Terminal output from build, run, and testing
+  - [ ] Technical analysis demonstrating understanding
+  - [ ] Challenges and solutions documented
+  - [ ] Docker Hub repository URL provided
+
+### Bonus Task (2.5 points)
+
+- [ ] Multi-stage Dockerfile for compiled language app
+- [ ] Working containerized application
+- [ ] Documentation in `app_<language>/docs/LAB02.md` with:
+  - [ ] Multi-stage strategy explained
+  - [ ] Terminal output showing image sizes (builder vs final)
+  - [ ] Analysis of size reduction and why it matters
+  - [ ] Technical explanation of each stage
+  - [ ] Security benefits discussed
+
+---
+
+## Rubric
+
+| Criteria | Points | Description |
+|----------|--------|-------------|
+| **Dockerfile** | 4 pts | Correct, secure, optimized |
+| **Docker Hub** | 2 pts | Successfully published |
+| **Documentation** | 4 pts | Complete and clear |
+| **Bonus** | 2.5 pts | Multi-stage implementation |
+| **Total** | 12.5 pts | 10 pts required + 2.5 pts bonus |
+
+**Grading:**
+- **10/10:** Perfect Dockerfile, deep understanding demonstrated, excellent analysis
+- **8-9/10:** Working container, good practices, solid understanding shown
+- **6-7/10:** Container works, basic security, surface-level explanations
+- **<6/10:** Missing requirements, runs as root, copy-paste without understanding
+
+---
+
+## Resources
+
+<details>
+<summary>📚 Docker Documentation</summary>
+
+- [Dockerfile Best Practices](https://docs.docker.com/build/building/best-practices/)
+- [Dockerfile Reference](https://docs.docker.com/reference/dockerfile/)
+- [Multi-Stage Builds](https://docs.docker.com/build/building/multi-stage/)
+- [.dockerignore](https://docs.docker.com/reference/dockerfile/#dockerignore-file)
+- [Docker Build Guide](https://docs.docker.com/build/guide/)
+
+</details>
+
+<details>
+<summary>🔒 Security Resources</summary>
+
+- [Docker Security Best Practices](https://docs.docker.com/build/building/best-practices/#security)
+- [Snyk Docker Security](https://snyk.io/learn/docker-security-scanning/)
+- [Why Non-Root Containers](https://docs.docker.com/build/building/best-practices/#user)
+- [Distroless Images](https://github.com/GoogleContainerTools/distroless) - Minimal base images
+
+</details>
+
+<details>
+<summary>🛠️ Tools</summary>
+
+- [Hadolint](https://github.com/hadolint/hadolint) - Dockerfile linter
+- [Dive](https://github.com/wagoodman/dive) - Explore image layers
+- [Docker Hub](https://hub.docker.com/) - Container registry
+
+</details>
+
+---
+
+## Looking Ahead
+
+- **Lab 3:** CI/CD will automatically build these Docker images
+- **Labs 7-8:** Deploy containers with docker-compose for logging/monitoring
+- **Lab 9:** Run these containers in Kubernetes
+- **Lab 13:** ArgoCD will deploy containerized apps automatically
+
+---
+
+**Good luck!** 🚀
+
+> **Remember:** Understanding beats copy-paste. Explain your decisions, not just your actions. Run as non-root or no points!
diff --git a/labs/lab03.md b/labs/lab03.md
new file mode 100644
index 0000000000..9824e934b3
--- /dev/null
+++ b/labs/lab03.md
@@ -0,0 +1,931 @@
+# Lab 3 — Continuous Integration (CI/CD)
+
+![difficulty](https://img.shields.io/badge/difficulty-beginner-success)
+![topic](https://img.shields.io/badge/topic-CI/CD-blue)
+![points](https://img.shields.io/badge/points-10%2B2.5-orange)
+![tech](https://img.shields.io/badge/tech-GitHub%20Actions-informational)
+
+> Automate your Python app testing and Docker builds with GitHub Actions CI/CD pipeline.
+
+## Overview
+
+Take your containerized app from Labs 1-2 and add automated testing and deployment. Learn how CI/CD catches bugs early, ensures code quality, and automates the Docker build/push workflow.
+
+**What You'll Learn:**
+- Writing effective unit tests
+- GitHub Actions workflow syntax
+- CI/CD best practices (caching, matrix builds, security scanning)
+- Automated Docker image publishing
+- Continuous integration for multiple applications
+
+**Tech Stack:** GitHub Actions | pytest 8+ | Python 3.11+ | Snyk | Docker
+
+**Connection to Previous Labs:**
+- **Lab 1:** Test the endpoints you created
+- **Lab 2:** Automate the Docker build/push workflow
+- **Lab 4+:** This CI pipeline will run for all future labs
+
+---
+
+## Tasks
+
+### Task 1 — Unit Testing (3 pts)
+
+**Objective:** Write comprehensive unit tests for your Python application to ensure reliability.
+
+**Requirements:**
+
+1. **Choose a Testing Framework**
+   - Research Python testing frameworks (pytest, unittest, etc.)
+   - Select one and justify your choice
+   - Install it in your `requirements.txt` or create `requirements-dev.txt`
+
+2. **Write Unit Tests**
+   - Create `app_python/tests/` directory
+   - Write tests for **all** your endpoints:
+     - `GET /` - Verify JSON structure and required fields
+     - `GET /health` - Verify health check response
+   - Test both successful responses and error cases
+   - Aim for meaningful test coverage (not just basic smoke tests)
+
+3. **Run Tests Locally**
+   - Verify all tests pass locally before CI setup
+   - Document how to run tests in your README
+
+<details>
+<summary>💡 Testing Framework Guidance</summary>
+
+**Popular Python Testing Frameworks:**
+
+**pytest (Recommended):**
+- Pros: Simple syntax, powerful fixtures, excellent plugin ecosystem
+- Cons: Additional dependency
+- Use case: Most modern Python projects
+
+**unittest:**
+- Pros: Built into Python (no extra dependencies)
+- Cons: More verbose, less modern features
+- Use case: Minimal dependency projects
+
+**Key Testing Concepts to Research:**
+- Test fixtures and setup/teardown
+- Mocking external dependencies
+- Testing HTTP endpoints (test client usage)
+- Test coverage measurement
+- Assertions and expected vs actual results
+
+**What Should You Test?**
+- Correct HTTP status codes (200, 404, 500)
+- Response data structure (JSON fields present)
+- Response data types (strings, integers, etc.)
+- Edge cases (invalid requests, missing data)
+- Error handling (what happens when things fail?)
+
+**Questions to Consider:**
+- How do you test a Flask/FastAPI app without starting the server?
+- Should you test that `hostname` returns your actual hostname, or just that the field exists?
+- How do you simulate different client IPs or user agents in tests?
+
+**Resources:**
+- [Pytest Documentation](https://docs.pytest.org/)
+- [Flask Testing](https://flask.palletsprojects.com/en/stable/testing/)
+- [FastAPI Testing](https://fastapi.tiangolo.com/tutorial/testing/)
+- [Python unittest](https://docs.python.org/3/library/unittest.html)
+
+**Anti-Patterns to Avoid:**
+- Testing framework functionality instead of your code
+- Tests that always pass regardless of implementation
+- Tests with no assertions
+- Tests that depend on external services
+
+</details>
+
+**What to Document:**
+- Your testing framework choice and why
+- Test structure explanation
+- How to run tests locally
+- Terminal output showing all tests passing
+
+---
+
+### Task 2 — GitHub Actions CI Workflow (4 pts)
+
+**Objective:** Create a GitHub Actions workflow that automatically tests your code and builds Docker images with proper versioning.
+
+**Requirements:**
+
+1. **Create Workflow File**
+   - Create `.github/workflows/python-ci.yml` in your repository
+   - Name your workflow descriptively
+
+2. **Implement Essential CI Steps**
+
+   Your workflow must include these logical stages:
+
+   **a) Code Quality & Testing:**
+   - Install dependencies
+   - Run a linter (pylint, flake8, black, ruff, etc.)
+   - Run your unit tests
+
+   **b) Docker Build & Push with Versioning:**
+   - Authenticate with Docker Hub
+   - Build your Docker image
+   - Tag with proper version strategy (see versioning section below)
+   - Push to Docker Hub with multiple tags
+
+3. **Versioning Strategy**
+
+   Choose **one** versioning approach and implement it:
+
+   **Option A: Semantic Versioning (SemVer)**
+   - Version format: `v1.2.3` (major.minor.patch)
+   - Use git tags for releases
+   - Tag images like: `username/app:1.2.3`, `username/app:1.2`, `username/app:latest`
+   - **When to use:** Traditional software releases with breaking changes
+
+   **Option B: Calendar Versioning (CalVer)**
+   - Version format: `2024.01.15` or `2024.01` (year.month.day or year.month)
+   - Based on release date
+   - Tag images like: `username/app:2024.01`, `username/app:latest`
+   - **When to use:** Time-based releases, continuous deployment
+
+   **Required:**
+   - Document which strategy you chose and why
+   - Implement it in your CI workflow
+   - Show at least 2 tags per image (e.g., version + latest)
+
+4. **Workflow Triggers**
+   - Configure when the workflow runs (push, pull request, etc.)
+   - Consider which branches should trigger builds
+
+5. **Testing the Workflow**
+   - Push your workflow file and verify it runs
+   - Fix any issues that arise
+   - Ensure all steps complete successfully
+   - Verify Docker Hub shows your version tags
+
+<details>
+<summary>💡 GitHub Actions Concepts</summary>
+
+**Core Concepts to Research:**
+
+**Workflow Anatomy:**
+- `name` - What is your workflow called?
+- `on` - When does it run? (push, pull_request, schedule, etc.)
+- `jobs` - What work needs to be done?
+- `steps` - Individual commands within a job
+- `runs-on` - What OS environment? (ubuntu-latest, etc.)
+
+**Key Questions:**
+- Should you run CI on every push, or only on pull requests?
+- What happens if tests fail? Should the workflow continue?
+- How do you access secrets (like Docker Hub credentials) securely?
+- Why might you want multiple jobs vs multiple steps in one job?
+
+**Python CI Steps Pattern:**
+```yaml
+# This is a pattern, not exact copy-paste code
+# Research the actual syntax and actions needed
+
+- Set up Python environment
+- Install dependencies
+- Run linter
+- Run tests
+```
+
+**Docker CI Steps Pattern:**
+```yaml
+# This is a pattern, not exact copy-paste code
+# Research the actual actions and their parameters
+
+- Log in to Docker Hub
+- Extract metadata for tags
+- Build and push Docker image
+```
+
+**Important Concepts:**
+- **Actions Marketplace:** Reusable actions (actions/checkout@v4, actions/setup-python@v5, docker/build-push-action@v6)
+- **Secrets:** How to store Docker Hub credentials securely
+- **Job Dependencies:** Can one job depend on another succeeding?
+- **Matrix Builds:** Testing multiple Python versions (optional but good to know)
+- **Caching:** Speed up workflows by caching dependencies (we'll add this in Task 3)
+
+**Resources:**
+- [GitHub Actions Documentation](https://docs.github.com/en/actions)
+- [Building and Testing Python](https://docs.github.com/en/actions/automating-builds-and-tests/building-and-testing-python)
+- [Publishing Docker Images](https://docs.docker.com/ci-cd/github-actions/)
+- [GitHub Actions Marketplace](https://github.com/marketplace?type=actions)
+- [Workflow Syntax](https://docs.github.com/en/actions/using-workflows/workflow-syntax-for-github-actions)
+
+**Security Best Practices:**
+- Never hardcode passwords or tokens in workflow files
+- Use GitHub Secrets for sensitive data
+- Understand when secrets are exposed to pull requests from forks
+- Use `secrets.GITHUB_TOKEN` for GitHub API access (auto-provided)
+
+**Docker Hub Authentication:**
+You'll need to create a Docker Hub access token and add it as a GitHub Secret. Research:
+- How to create Docker Hub access tokens
+- How to add secrets to your GitHub repository
+- How to reference secrets in workflow files (hint: `${{ secrets.NAME }}`)
+
+</details>
+
+<details>
+<summary>💡 Versioning Strategy Guidance</summary>
+
+**Semantic Versioning (SemVer):**
+
+**Format:** MAJOR.MINOR.PATCH (e.g., 1.2.3)
+- **MAJOR:** Breaking changes (incompatible API changes)
+- **MINOR:** New features (backward-compatible)
+- **PATCH:** Bug fixes (backward-compatible)
+
+**Implementation Approaches:**
+1. **Manual Git Tags:** Create git tags (v1.0.0) and reference in workflow
+2. **Automated from Commits:** Parse conventional commits to bump version
+3. **GitHub Releases:** Trigger on release creation
+
+**Docker Tagging Example:**
+- `username/app:1.2.3` (full version)
+- `username/app:1.2` (minor version, rolling)
+- `username/app:1` (major version, rolling)
+- `username/app:latest` (latest stable)
+
+**Pros:** Clear when breaking changes occur, industry standard for libraries<br>
+**Cons:** Requires discipline to follow rules correctly
+
+---
+
+**Calendar Versioning (CalVer):**
+
+**Common Formats:**
+- `YYYY.MM.DD` (e.g., 2024.01.15) - Daily releases
+- `YYYY.MM.MICRO` (e.g., 2024.01.0) - Monthly with patch number
+- `YYYY.0M` (e.g., 2024.01) - Monthly releases
+
+**Implementation Approaches:**
+1. **Date-based:** Generate from current date in workflow
+2. **Git SHA:** Combine with short commit SHA (2024.01-a1b2c3d)
+3. **Build Number:** Use GitHub run number (2024.01.42)
+
+**Docker Tagging Example:**
+- `username/app:2024.01` (month version)
+- `username/app:2024.01.123` (with build number)
+- `username/app:latest` (latest build)
+
+**Pros:** No ambiguity, good for continuous deployment, easier to remember<br>
+**Cons:** Doesn't indicate breaking changes
+
+---
+
+**How to Implement in CI:**
+
+**Using docker/metadata-action:**
+```yaml
+# Pattern - research actual syntax
+- name: Docker metadata
+  uses: docker/metadata-action
+  with:
+    # Define your tagging strategy here
+    # Can reference git tags, dates, commit SHAs
+```
+
+**Manual Tagging:**
+```yaml
+# Pattern - research actual syntax
+- name: Generate version
+  run: echo "VERSION=$(date +%Y.%m.%d)" >> $GITHUB_ENV
+
+- name: Build and push
+  # Use ${{ env.VERSION }} in tags
+```
+
+**Questions to Consider:**
+- How often will you release? (Daily? Per feature? Monthly?)
+- Do users need to know about breaking changes explicitly?
+- Are you building a library (use SemVer) or a service (CalVer works)?
+- How will you track what's in each version?
+
+**Resources:**
+- [Semantic Versioning](https://semver.org/)
+- [Calendar Versioning](https://calver.org/)
+- [Docker Metadata Action](https://github.com/docker/metadata-action)
+- [Conventional Commits](https://www.conventionalcommits.org/) (for automated SemVer)
+
+</details>
+
+<details>
+<summary>💡 Debugging GitHub Actions</summary>
+
+**Common Issues & How to Debug:**
+
+**Workflow Won't Trigger:**
+- Check your `on:` configuration
+- Verify you pushed to the correct branch
+- Look at Actions tab for filtering options
+
+**Steps Failing:**
+- Click into the failed step to see full logs
+- Check for typos in action names or parameters
+- Verify secrets are configured correctly
+- Test commands locally first
+
+**Docker Build Fails:**
+- Ensure Dockerfile is in the correct location
+- Check context path in build step
+- Verify base image exists and is accessible
+- Test Docker build locally first
+
+**Authentication Issues:**
+- Verify secret names match exactly (case-sensitive)
+- Check that Docker Hub token has write permissions
+- Ensure you're using `docker/login-action` correctly
+
+**Debugging Techniques:**
+- Add `run: echo "Debug message"` steps to understand workflow state
+- Use `run: env` to see available environment variables
+- Check Actions tab for detailed logs
+- Enable debug logging (set the `ACTIONS_STEP_DEBUG` secret to `true` for verbose step logs; `ACTIONS_RUNNER_DEBUG` = `true` adds runner diagnostic logs)
+
+</details>
+
+**What to Document:**
+- Your workflow trigger strategy and reasoning
+- Why you chose specific actions from the marketplace
+- Your Docker tagging strategy (latest? version tags? commit SHA?)
+- Link to successful workflow run in GitHub Actions tab
+- Terminal output or screenshot of green checkmark
+
+---
+
+### Task 3 — CI Best Practices & Security (3 pts)
+
+**Objective:** Optimize your CI workflow and add security scanning.
+
+**Requirements:**
+
+1. **Add Status Badge**
+   - Add a GitHub Actions status badge to your `app_python/README.md`
+   - The badge should show the current workflow status (passing/failing)
+
+2. **Implement Dependency Caching**
+   - Add caching for Python dependencies to speed up workflow
+   - Measure and document the speed improvement
+
+3. **Add Security Scanning with Snyk**
+   - Integrate Snyk vulnerability scanning into your workflow
+   - Configure it to check for vulnerabilities in your dependencies
+   - Document any vulnerabilities found and how you addressed them
+
+4. **Apply CI Best Practices**
+   - Research and implement at least 3 additional CI best practices
+   - Document which practices you applied and why they matter
+
+<details>
+<summary>💡 CI Best Practices Guidance</summary>
+
+**Dependency Caching:**
+
+Caching speeds up workflows by reusing previously downloaded dependencies.
+
+**Key Concepts:**
+- What should be cached? (pip packages, Docker layers, etc.)
+- What's the cache key? (based on requirements.txt hash)
+- When does cache become invalid?
+- How much time does caching save?
+
+**Actions to Research:**
+- `actions/cache` for general caching
+- `actions/setup-python` has built-in cache support
+
+**Questions to Explore:**
+- Where are Python packages stored that should be cached?
+- How do you measure cache hit vs cache miss?
+- What happens if requirements.txt changes?
+
+**Status Badges:**
+
+Show workflow status directly in your README.
+
+**Format Pattern:**
+```markdown
+![Workflow Name](https://github.com/username/repo/actions/workflows/workflow-file.yml/badge.svg)
+```
+
+Research how to:
+- Get the correct badge URL for your workflow
+- Make badges clickable (link to Actions tab)
+- Display specific branch status
+
+**CI Best Practices to Consider:**
+
+Research and choose at least 3 to implement:
+
+1. **Fail Fast:** Stop workflow on first failure
+2. **Matrix Builds:** Test multiple Python versions (3.12, 3.13)
+3. **Job Dependencies:** Don't push Docker if tests fail
+4. **Conditional Steps:** Only push on main branch
+5. **Pull Request Checks:** Require passing CI before merge
+6. **Workflow Concurrency:** Cancel outdated workflow runs
+7. **Docker Layer Caching:** Cache Docker build layers
+8. **Environment Variables:** Use env for repeated values
+9. **Secrets Scanning:** Prevent committing secrets
+10. **YAML Validation:** Lint your workflow files
+
+**Resources:**
+- [GitHub Actions Usage Limits](https://docs.github.com/en/actions/learn-github-actions/usage-limits-billing-and-administration#usage-limits)
+- [Caching Dependencies](https://docs.github.com/en/actions/using-workflows/caching-dependencies-to-speed-up-workflows)
+- [Security Hardening](https://docs.github.com/en/actions/security-guides/security-hardening-for-github-actions)
+
+</details>
+
+<details>
+<summary>💡 Snyk Integration Guidance</summary>
+
+**What is Snyk?**
+
+Snyk is a security tool that scans your dependencies for known vulnerabilities.
+
+**Key Concepts:**
+- Vulnerability databases (CVEs)
+- Severity levels (low, medium, high, critical)
+- Automated dependency updates
+- Security advisories
+
+**Integration Options:**
+
+1. **Snyk GitHub Action:**
+   - Use `snyk/actions` from GitHub Marketplace
+   - Requires Snyk API token (free tier available)
+   - Can fail builds on vulnerabilities
+
+2. **Snyk CLI in Workflow:**
+   - Install Snyk CLI in workflow
+   - Run `snyk test` command
+   - More flexible but requires setup
+
+**Setup Steps:**
+1. Create free Snyk account
+2. Get API token from Snyk dashboard
+3. Add token as GitHub Secret
+4. Add Snyk step to workflow
+5. Configure severity threshold (what level fails the build?)
+
+**Questions to Explore:**
+- Should every vulnerability fail your build?
+- What if vulnerabilities have no fix available?
+- How do you handle false positives?
+- When should you break the build vs just warn?
+
+**Resources:**
+- [Snyk GitHub Actions](https://github.com/snyk/actions)
+- [Snyk Python Example](https://github.com/snyk/actions/tree/master/python)
+- [Snyk Documentation](https://docs.snyk.io/integrations/ci-cd-integrations/github-actions-integration)
+
+**Common Issues:**
+- Dependencies not installed before Snyk runs
+- API token not configured correctly
+- Overly strict severity settings breaking builds
+- Virtual environment confusion
+
+**What to Document:**
+- Your severity threshold decision and reasoning
+- Any vulnerabilities found and your response
+- Whether you fail builds on vulnerabilities or just warn
+
+</details>
+
+**What to Document:**
+- Status badge in README (visible proof it works)
+- Caching implementation and speed improvement metrics
+- CI best practices you applied with explanations
+- Snyk integration results and vulnerability handling
+- Terminal output showing improved workflow performance
+
+---
+
+## Bonus Task — Multi-App CI with Path Filters + Test Coverage (2.5 pts)
+
+**Objective:** Set up CI for your compiled language app with intelligent path-based triggers AND add test coverage tracking.
+
+**Part 1: Multi-App CI (1.5 pts)**
+
+1. **Create Second CI Workflow**
+   - Create `.github/workflows/<language>-ci.yml` for your Go/Rust/Java app
+   - Implement similar CI steps (lint, test, build Docker image)
+   - Use language-specific actions and best practices
+   - Apply versioning strategy (SemVer or CalVer) consistently
+
+2. **Implement Path-Based Triggers**
+   - Python workflow should only run when `app_python/` files change
+   - Compiled language workflow should only run when `app_<language>/` files change
+   - Neither should run when only docs or other files change
+
+3. **Optimize for Multiple Apps**
+   - Ensure both workflows can run in parallel
+   - Consider using workflow templates (DRY principle)
+   - Document the benefits of path-based triggers
+
+**Part 2: Test Coverage Badge (1 pt)**
+
+4. **Add Coverage Tracking**
+   - Install coverage tool (`pytest-cov` for Python, coverage tool for your other language)
+   - Generate coverage reports in CI workflow
+   - Integrate with codecov.io or coveralls.io (free for public repos)
+   - Add coverage badge to README showing percentage
+
+5. **Coverage Goals**
+   - Document your current coverage percentage
+   - Identify what's not covered and why
+   - Set a coverage threshold in CI (e.g., fail if below 70%)
+
+<details>
+<summary>💡 Path Filters & Multi-App CI</summary>
+
+**Why Path Filters?**
+
+In a monorepo with multiple apps, you don't want to run Python CI when only Go code changes.
+
+**Path Filter Syntax:**
+```yaml
+on:
+  push:
+    paths:
+      - 'app_python/**'
+      - '.github/workflows/python-ci.yml'
+```
+
+**Key Concepts:**
+- Glob patterns for path matching
+- When to include workflow file itself
+- Exclude patterns (paths-ignore)
+- How to test path filters
+
+**Questions to Explore:**
+- Should changes to README.md trigger CI?
+- Should changes to the root .gitignore trigger CI?
+- What about changes to both apps in one commit?
+- How do you test that path filters work correctly?
+
+**Multi-Language CI Patterns:**
+
+**For Go:**
+- actions/setup-go
+- golangci-lint for linting
+- go test for testing
+- Multi-stage Docker builds (from Lab 2 bonus)
+
+**For Rust:**
+- dtolnay/rust-toolchain (the older actions-rs/toolchain is archived and unmaintained)
+- cargo clippy for linting
+- cargo test for testing
+- cargo-audit for security
+
+**For Java:**
+- actions/setup-java
+- Maven or Gradle for build
+- Checkstyle or SpotBugs for linting
+- JUnit tests
+
+**Workflow Reusability:**
+
+Consider:
+- Reusable workflows (call one workflow from another)
+- Composite actions (bundle steps together)
+- Workflow templates (DRY for similar workflows)
+
+**Resources:**
+- [Path Filters](https://docs.github.com/en/actions/using-workflows/workflow-syntax-for-github-actions#onpushpull_requestpaths)
+- [Reusable Workflows](https://docs.github.com/en/actions/using-workflows/reusing-workflows)
+- [Starter Workflows](https://github.com/actions/starter-workflows/tree/main/ci)
+
+</details>
+
+<details>
+<summary>💡 Test Coverage Tracking</summary>
+
+**What is Test Coverage?**
+
+Coverage measures what percentage of your code is executed by your tests. High coverage = more code is tested.
+
+**Why Coverage Matters:**
+- Identifies untested code paths
+- Prevents regressions (changes breaking untested code)
+- Increases confidence in refactoring
+- Industry standard quality metric
+
+**Coverage Tools by Language:**
+
+**Python (pytest-cov):**
+```bash
+# Install
+pip install pytest-cov
+
+# Run with coverage
+pytest --cov=app_python --cov-report=xml --cov-report=term
+
+# Generates coverage.xml for upload
+```
+
+**Go (built-in):**
+```bash
+go test -coverprofile=coverage.out ./...
+go tool cover -html=coverage.out
+```
+
+**Rust (tarpaulin):**
+```bash
+cargo install cargo-tarpaulin
+cargo tarpaulin --out Xml
+```
+
+**Java (JaCoCo with Maven/Gradle):**
+```bash
+mvn test jacoco:report
+# or
+gradle test jacocoTestReport
+```
+
+**Integration Services:**
+
+**Codecov (Recommended):**
+- Free for public repos
+- Beautiful visualizations
+- PR comments with coverage diff
+- Setup: Sign in with GitHub, add repo, upload coverage report
+
+**Coveralls:**
+- Alternative to Codecov
+- Similar features
+- Different UI
+
+**Coverage in CI Workflow:**
+```yaml
+# Pattern for Python (research actual syntax)
+- name: Run tests with coverage
+  run: pytest --cov=. --cov-report=xml
+
+- name: Upload to Codecov
+  uses: codecov/codecov-action@v4
+  with:
+    file: ./coverage.xml
+    token: ${{ secrets.CODECOV_TOKEN }}
+```
+
+**Coverage Badge:**
+```markdown
+![Coverage](https://codecov.io/gh/username/repo/branch/main/graph/badge.svg)
+```
+
+**Setting Coverage Thresholds:**
+
+You can fail CI if coverage drops below a threshold:
+
+```ini
+# In pytest.ini (setup.cfg uses [tool:pytest]; pyproject.toml uses [tool.pytest.ini_options] with TOML syntax)
+[pytest]
+addopts = --cov=. --cov-fail-under=70
+```
+
+**Questions to Consider:**
+- What's a reasonable coverage target? (70%? 80%? 90%?)
+- Should you aim for 100% coverage? (Usually no - diminishing returns)
+- What code is OK to leave untested? (Error handlers, config, main)
+- How do you test hard-to-reach code paths?
+
+**Best Practices:**
+- Don't chase 100% coverage blindly
+- Focus on testing critical business logic
+- Integration points should have high coverage
+- Simple getters/setters can be skipped
+- Measure coverage trends, not just absolute numbers
+
+**Resources:**
+- [Codecov Documentation](https://docs.codecov.com/)
+- [pytest-cov Documentation](https://pytest-cov.readthedocs.io/)
+- [Go Coverage](https://go.dev/blog/cover)
+- [Cargo Tarpaulin](https://github.com/xd009642/tarpaulin)
+- [JaCoCo](https://www.jacoco.org/)
+
+</details>
+
+**What to Document:**
+- Second workflow implementation with language-specific best practices
+- Path filter configuration and testing proof
+- Benefits analysis: Why path filters matter in monorepos
+- Example showing workflows running independently
+- Terminal output or Actions tab showing selective triggering
+- **Coverage integration:** Screenshot/link to codecov/coveralls dashboard
+- **Coverage analysis:** Current percentage, what's covered/not covered, your threshold
+
+---
+
+## How to Submit
+
+1. **Create Branch:**
+   - Create a new branch called `lab03`
+   - Develop your CI workflows on this branch
+
+2. **Commit Work:**
+   - Add workflow files (`.github/workflows/`)
+   - Add test files (`app_python/tests/`)
+   - Add documentation (`app_python/docs/LAB03.md`)
+   - Commit with descriptive message following conventional commits
+
+3. **Verify CI Works:**
+   - Push to your fork and verify workflows run
+   - Check that all jobs pass
+   - Review workflow logs for any issues
+
+4. **Create Pull Requests:**
+   - **PR #1:** `your-fork:lab03` → `course-repo:master`
+   - **PR #2:** `your-fork:lab03` → `your-fork:master`
+   - CI should run automatically on your PRs
+
+---
+
+## Acceptance Criteria
+
+### Main Tasks (10 points)
+
+**Unit Testing (3 pts):**
+- [ ] Testing framework chosen with justification
+- [ ] Tests exist in `app_python/tests/` directory
+- [ ] All endpoints have test coverage
+- [ ] Tests pass locally (terminal output provided)
+- [ ] README updated with testing instructions
+
+**GitHub Actions CI (4 pts):**
+- [ ] Workflow file exists at `.github/workflows/python-ci.yml`
+- [ ] Workflow includes: dependency installation, linting, testing
+- [ ] Workflow includes: Docker Hub login, build, and push
+- [ ] Versioning strategy chosen (SemVer or CalVer) and implemented
+- [ ] Docker images tagged with at least 2 tags (e.g., version + latest)
+- [ ] Workflow triggers configured appropriately
+- [ ] All workflow steps pass successfully
+- [ ] Docker Hub shows versioned images
+- [ ] Link to successful workflow run provided
+
+**CI Best Practices (3 pts):**
+- [ ] Status badge added to README and working
+- [ ] Dependency caching implemented with performance metrics
+- [ ] Snyk security scanning integrated
+- [ ] At least 3 CI best practices applied
+- [ ] Documentation complete (see Documentation Requirements section)
+
+### Bonus Task (2.5 points)
+
+**Part 1: Multi-App CI (1.5 pts)**
+- [ ] Second workflow created for compiled language app (`.github/workflows/<language>-ci.yml`)
+- [ ] Language-specific linting and testing implemented
+- [ ] Versioning strategy applied to second app
+- [ ] Path filters configured for both workflows
+- [ ] Path filters tested and proven to work (workflows run selectively)
+- [ ] Both workflows can run in parallel
+- [ ] Documentation explains benefits and shows selective triggering
+
+**Part 2: Test Coverage (1 pt)**
+- [ ] Coverage tool integrated (`pytest-cov` or equivalent)
+- [ ] Coverage reports generated in CI workflow
+- [ ] Codecov or Coveralls integration complete
+- [ ] Coverage badge added to README
+- [ ] Coverage threshold set in CI (optional but recommended)
+- [ ] Documentation includes coverage analysis (percentage, what's covered/not)
+
+---
+
+## Documentation Requirements
+
+Create `app_python/docs/LAB03.md` with these sections:
+
+### 1. Overview
+- Testing framework used and why you chose it
+- What endpoints/functionality your tests cover
+- CI workflow trigger configuration (when does it run?)
+- Versioning strategy chosen (SemVer or CalVer) and rationale
+
+### 2. Workflow Evidence
+```
+Provide links/terminal output for:
+- ✅ Successful workflow run (GitHub Actions link)
+- ✅ Tests passing locally (terminal output)
+- ✅ Docker image on Docker Hub (link to your image)
+- ✅ Status badge working in README
+```
+
+### 3. Best Practices Implemented
+Quick list with one-sentence explanations:
+- **Practice 1:** Why it helps
+- **Practice 2:** Why it helps
+- **Practice 3:** Why it helps
+- **Caching:** Time saved (before vs after)
+- **Snyk:** Any vulnerabilities found? Your action taken
+
+### 4. Key Decisions
+Answer these briefly (2-3 sentences each):
+- **Versioning Strategy:** SemVer or CalVer? Why did you choose it for your app?
+- **Docker Tags:** What tags does your CI create? (e.g., latest, version number, etc.)
+- **Workflow Triggers:** Why did you choose those triggers?
+- **Test Coverage:** What's tested vs not tested?
+
+### 5. Challenges (Optional)
+- Any issues you encountered and how you fixed them
+- Keep it brief - bullet points are fine
+
+---
+
+## Rubric
+
+| Criteria | Points | Description |
+|----------|--------|-------------|
+| **Unit Testing** | 3 pts | Comprehensive tests, good coverage |
+| **CI Workflow** | 4 pts | Complete, functional, automated |
+| **Best Practices** | 3 pts | Optimized, secure, well-documented |
+| **Bonus** | 2.5 pts | Multi-app CI with path filters + test coverage |
+| **Total** | 12.5 pts | 10 pts required + 2.5 pts bonus |
+
+**Grading:**
+- **10/10:** All tasks complete, CI works flawlessly, clear documentation, meaningful tests
+- **8-9/10:** CI works, good test coverage, best practices applied, solid documentation
+- **6-7/10:** CI functional, basic tests, some best practices, minimal documentation
+- **<6/10:** CI broken or missing steps, poor tests, incomplete work
+
+**Quick Checklist for Full Points:**
+- ✅ Tests actually test your endpoints (not just imports)
+- ✅ CI workflow runs and passes
+- ✅ Docker image builds and pushes successfully
+- ✅ Status badge, caching, and Snyk in place, plus at least 3 additional best practices applied
+- ✅ Documentation complete but concise (no essay needed!)
+- ✅ Links/evidence provided (workflow runs, Docker Hub, etc.)
+
+**Documentation Should Take:** 15-30 minutes to write, 5 minutes to review
+
+---
+
+## Resources
+
+<details>
+<summary>📚 GitHub Actions Documentation</summary>
+
+- [GitHub Actions Quickstart](https://docs.github.com/en/actions/quickstart)
+- [Workflow Syntax](https://docs.github.com/en/actions/using-workflows/workflow-syntax-for-github-actions)
+- [Building and Testing Python](https://docs.github.com/en/actions/automating-builds-and-tests/building-and-testing-python)
+- [Publishing Docker Images](https://docs.docker.com/ci-cd/github-actions/)
+- [GitHub Actions Marketplace](https://github.com/marketplace?type=actions)
+
+</details>
+
+<details>
+<summary>🧪 Testing Resources</summary>
+
+- [Pytest Documentation](https://docs.pytest.org/)
+- [Flask Testing Guide](https://flask.palletsprojects.com/en/stable/testing/)
+- [FastAPI Testing Guide](https://fastapi.tiangolo.com/tutorial/testing/)
+- [Python Testing Best Practices](https://realpython.com/python-testing/)
+
+</details>
+
+<details>
+<summary>🔒 Security & Quality</summary>
+
+- [Snyk GitHub Actions](https://github.com/snyk/actions)
+- [Snyk Python Integration](https://docs.snyk.io/integrations/ci-cd-integrations/github-actions-integration)
+- [GitHub Security Best Practices](https://docs.github.com/en/actions/security-guides/security-hardening-for-github-actions)
+- [Dependency Scanning](https://docs.github.com/en/code-security/supply-chain-security)
+
+</details>
+
+<details>
+<summary>⚡ Performance & Optimization</summary>
+
+- [Caching Dependencies](https://docs.github.com/en/actions/using-workflows/caching-dependencies-to-speed-up-workflows)
+- [Docker Build Cache](https://docs.docker.com/build/cache/)
+- [Workflow Optimization](https://docs.github.com/en/actions/learn-github-actions/usage-limits-billing-and-administration)
+
+</details>
+
+<details>
+<summary>🛠️ CI/CD Tools</summary>
+
+- [act](https://github.com/nektos/act) - Run GitHub Actions locally
+- [actionlint](https://github.com/rhysd/actionlint) - Lint workflow files
+- [GitHub CLI](https://cli.github.com/) - Manage workflows from terminal
+
+</details>
+
+---
+
+## Looking Ahead
+
+- **Lab 4-6:** CI will validate your Terraform and Ansible code
+- **Lab 7-8:** CI will run integration tests with logging/metrics
+- **Lab 9-10:** CI will validate Kubernetes manifests and Helm charts
+- **Lab 13:** ArgoCD will deploy what CI builds (GitOps!)
+- **All Future Labs:** This pipeline is your safety net for changes
+
+---
+
+**Good luck!** 🚀
+
+> **Remember:** CI isn't about having green checkmarks—it's about catching problems before they reach production. Focus on meaningful tests and understanding why each practice matters. Think like a DevOps engineer: automate everything, fail fast, and learn from failures.
diff --git a/labs/lab04.md b/labs/lab04.md
new file mode 100644
index 0000000000..36efa60723
--- /dev/null
+++ b/labs/lab04.md
@@ -0,0 +1,1509 @@
+# Lab 4 — Infrastructure as Code (Terraform & Pulumi)
+
+![difficulty](https://img.shields.io/badge/difficulty-beginner-success)
+![topic](https://img.shields.io/badge/topic-Infrastructure%20as%20Code-blue)
+![points](https://img.shields.io/badge/points-10%2B2.5-orange)
+![tech](https://img.shields.io/badge/tech-Terraform%20%7C%20Pulumi-informational)
+
+> Provision cloud infrastructure using code with Terraform and Pulumi, comparing both approaches.
+
+## Overview
+
+Learn Infrastructure as Code (IaC) by creating virtual machines in the cloud using two popular tools: Terraform (declarative, HCL) and Pulumi (imperative, real programming languages).
+
+**What You'll Learn:**
+- Terraform fundamentals and HCL syntax
+- Pulumi fundamentals and infrastructure with code
+- Cloud provider APIs and resources
+- Infrastructure lifecycle management
+- IaC best practices and validation
+- Comparing IaC tools and approaches
+
+**Connection to Other Labs:**
+- **Lab 2:** Created Docker images - now we'll provision infrastructure to run them
+- **Lab 3:** CI/CD for applications - now we'll add CI/CD for infrastructure
+- **Lab 5:** Ansible will provision software on these VMs (you'll need a VM ready!)
+
+**Tech Stack:** Terraform 1.9+ | Pulumi 3.x | Yandex Cloud / AWS
+
+**Why Two Tools?**
+By using both Terraform and Pulumi for the same task, you'll understand:
+- Different IaC philosophies (declarative vs imperative)
+- Tool trade-offs and use cases
+- How to evaluate IaC tools for your needs
+
+**Important for Lab 5:**
+The VM you create in this lab will be used in **Lab 5 (Ansible)** for configuration management. You have two options:
+- **Option A (Recommended):** Keep your cloud VM running until you complete Lab 5
+- **Option B:** Use a local VM (see Local VM Alternative section below)
+
+If you choose to destroy your cloud VM after Lab 4, you can easily recreate it later using your Terraform/Pulumi code!
+
+---
+
+## Important: Cloud Provider Selection
+
+### Recommended for Russia: Yandex Cloud
+
+Yandex Cloud offers a free tier and is accessible in Russia:
+- 1 VM with 20% vCPU, 1 GB RAM (free tier)
+- 10 GB SSD storage
+- No credit card required initially
+
+### Alternative Cloud Providers
+
+If Yandex Cloud is unavailable, choose any of these:
+
+**VK Cloud (Russia):**
+- Russian cloud provider
+- Free trial with bonus credits
+- Good documentation in Russian
+
+**AWS (Amazon Web Services):**
+- 750 hours/month free tier (t2.micro)
+- Most popular globally
+- Extensive documentation
+
+**GCP (Google Cloud Platform):**
+- $300 free credits for 90 days
+- Always-free tier for e2-micro
+- Modern interface
+
+**Azure (Microsoft):**
+- $200 free credits for 30 days
+- Free tier for B1s instances
+- Good Windows support
+
+**DigitalOcean:**
+- Simple pricing and interface
+- $200 free credits with GitHub Student Pack
+- Beginner-friendly
+
+### Cost Management 🚨
+
+**IMPORTANT - Read This:**
+- ✅ **Use smallest/free tier instances only**
+- ✅ **Run `terraform destroy` when done testing**
+- ✅ **Consider keeping VM for Lab 5 to avoid recreation**
+- ✅ **Set billing alerts if available**
+- ✅ **If not using for Lab 5, delete resources after lab completion**
+- ❌ **Never commit cloud credentials to Git**
+
+---
+
+## Local VM Alternative
+
+If you cannot or prefer not to use cloud providers, you can use a local VM instead. This VM will need to meet specific requirements for Lab 5 (Ansible).
+
+### Option 1: VirtualBox/VMware VM
+
+**Requirements:**
+- Ubuntu 24.04 LTS (recommended) or Ubuntu 22.04 LTS
+- 1 GB RAM minimum (2 GB recommended)
+- 10 GB disk space
+- Network adapter in Bridged mode (or NAT with port forwarding)
+- SSH server installed and configured
+- Your SSH public key added to `~/.ssh/authorized_keys`
+- Static or predictable IP address
+
+**Setup Steps:**
+```bash
+# Install SSH server (if not installed)
+sudo apt update
+sudo apt install openssh-server
+
+# Add your SSH public key
+mkdir -p ~/.ssh
+echo "your-public-key-here" >> ~/.ssh/authorized_keys
+chmod 700 ~/.ssh
+chmod 600 ~/.ssh/authorized_keys
+
+# Verify SSH access from your host machine
+ssh username@vm-ip-address
+```
+
+### Option 2: Vagrant VM
+
+**Requirements:**
+- Vagrant installed on your machine
+- VirtualBox (or another Vagrant provider)
+
+**Basic Vagrantfile:**
+```ruby
+Vagrant.configure("2") do |config|
+  config.vm.box = "ubuntu/noble64"  # Ubuntu 24.04 LTS
+  # Or use "ubuntu/jammy64" for Ubuntu 22.04 LTS
+  config.vm.network "private_network", ip: "192.168.56.10"
+  config.vm.provider "virtualbox" do |vb|
+    vb.memory = "2048"
+  end
+end
+```
+
+### Option 3: WSL2 (Windows Subsystem for Linux)
+
+**Note:** WSL2 can work but has networking limitations. A VM in bridged mode is preferred.
+
+**If using local VM:**
+- You can skip Terraform/Pulumi cloud provider setup
+- Document your local VM setup instead
+- For Task 1, show VM creation (manual or Vagrant)
+- For Task 2, you can skip Pulumi (or use Pulumi to manage Vagrant)
+- Focus on understanding IaC concepts with cloud provider research
+
+**Recommended Approach:**
+Even with a local VM, complete the Terraform/Pulumi tasks with a cloud provider to gain real IaC experience. You can destroy the cloud VM after Lab 4 and use your local VM for Lab 5.
+
+---
+
+## Tasks
+
+### Task 1 — Terraform VM Creation (4 pts)
+
+**Objective:** Create a virtual machine using Terraform on your chosen cloud provider.
+
+**Requirements:**
+
+1. **Setup Terraform**
+   - Install Terraform CLI
+   - Choose and configure your cloud provider
+   - Set up authentication (access keys, service accounts, etc.)
+   - Initialize Terraform
+
+2. **Define Infrastructure**
+
+   Create a `terraform/` directory with the following resources:
+
+   **Minimum Required Resources:**
+   - **VM/Compute Instance** (smallest free tier size)
+   - **Network/VPC** (if required by provider)
+   - **Security Group/Firewall Rules:**
+     - Allow SSH (port 22) from your IP
+     - Allow HTTP (port 80)
+     - Allow custom port 5000 (for future app deployment)
+   - **Public IP Address** (to access VM remotely)
+
+3. **Configuration Best Practices**
+   - Use variables for configurable values (region, instance type, etc.)
+   - Use outputs to display important information (public IP, etc.)
+   - Add appropriate tags/labels for resource identification
+   - Use `.gitignore` for sensitive files
+
+4. **Apply Infrastructure**
+   - Run `terraform plan` to preview changes
+   - Review the plan carefully
+   - Apply infrastructure
+   - Verify VM is accessible via SSH
+   - Document the public IP and connection method
+
+5. **State Management**
+   - Keep state file local (for now)
+   - Understand what the state file contains
+   - **Never commit `terraform.tfstate` to Git**
+
+<details>
+<summary>💡 Terraform Fundamentals</summary>
+
+**What is Terraform?**
+
+Terraform is a declarative IaC tool that lets you define infrastructure in configuration files (HCL - HashiCorp Configuration Language).
+
+**Key Concepts:**
+
+**Providers:**
+- Plugins that interact with cloud APIs
+- Each cloud has its own provider (yandex, aws, google, azurerm)
+- Configure authentication and region
+
+**Resources:**
+- Infrastructure components (VMs, networks, firewalls)
+- Format: `resource "type" "name" { ... }`
+- Each resource has required and optional arguments
+
+**Data Sources:**
+- Query existing infrastructure
+- Example: Find latest Ubuntu image ID
+- Format: `data "type" "name" { ... }`
+
+**Variables:**
+- Make configurations reusable
+- Define in `variables.tf`
+- Set values in `terraform.tfvars` (gitignored!)
+- Reference: `var.variable_name`
+
+**Outputs:**
+- Display important values after apply
+- Example: VM public IP
+- Define in `outputs.tf`
+
+**State File:**
+- Tracks real infrastructure
+- Maps config to reality
+- **Never commit to Git** (contains sensitive data)
+- Add to `.gitignore`
+
+**Typical Workflow:**
+```bash
+terraform init      # Initialize provider plugins
+terraform fmt       # Format code
+terraform validate  # Check syntax
+terraform plan      # Preview changes
+terraform apply     # Create/update infrastructure
+terraform destroy   # Delete all infrastructure
+```
+
+**Resources:**
+- [Terraform Documentation](https://developer.hashicorp.com/terraform/docs)
+- [Terraform Registry](https://registry.terraform.io/) - Provider docs
+- [HCL Syntax](https://developer.hashicorp.com/terraform/language/syntax)
+
+</details>
+
+<details>
+<summary>☁️ Yandex Cloud Terraform Guide</summary>
+
+**Yandex Cloud Setup:**
+
+**Authentication:**
+- Create service account in Yandex Cloud Console
+- Generate authorized key (JSON)
+- Set key file path or use environment variables
+
+**Provider Configuration Pattern:**
+```hcl
+terraform {
+  required_providers {
+    yandex = {
+      source = "yandex-cloud/yandex"
+    }
+  }
+}
+
+provider "yandex" {
+  # Configuration here (zone, folder_id, etc.)
+}
+```
+
+**Key Resources:**
+- `yandex_compute_instance` - Virtual machine
+- `yandex_vpc_network` - Virtual private cloud
+- `yandex_vpc_subnet` - Subnet within VPC
+- `yandex_vpc_security_group` - Firewall rules
+
+**Free Tier Instance:**
+- Platform: standard-v2
+- Cores: 2 (core_fraction = 20%)
+- Memory: 1 GB
+- Boot disk: 10 GB HDD
+
+**SSH Access:**
+- Add SSH public key to `metadata`
+- Use `ssh-keys` metadata field
+- Connect: `ssh <username>@<public_ip>`
+
+**Resources:**
+- [Yandex Cloud Terraform Provider](https://registry.terraform.io/providers/yandex-cloud/yandex/latest/docs)
+- [Getting Started Guide](https://cloud.yandex.com/en/docs/tutorials/infrastructure-management/terraform-quickstart)
+- [Compute Instance Example](https://registry.terraform.io/providers/yandex-cloud/yandex/latest/docs/resources/compute_instance)
+
+</details>
+
+<details>
+<summary>☁️ AWS Terraform Guide</summary>
+
+**AWS Setup:**
+
+**Authentication:**
+- Create IAM user with EC2 permissions
+- Generate access key ID and secret access key
+- Configure AWS CLI or use environment variables
+- Never hardcode credentials
+
+**Provider Configuration Pattern:**
+```hcl
+terraform {
+  required_providers {
+    aws = {
+      source = "hashicorp/aws"
+    }
+  }
+}
+
+provider "aws" {
+  region = var.region  # e.g., "us-east-1"
+}
+```
+
+**Key Resources:**
+- `aws_instance` - EC2 instance
+- `aws_vpc` - Virtual Private Cloud
+- `aws_subnet` - Subnet within VPC
+- `aws_security_group` - Firewall rules
+- `aws_key_pair` - SSH key
+
+**Free Tier Instance:**
+- Instance type: t2.micro
+- AMI: Amazon Linux 2 or Ubuntu (find with data source)
+- 750 hours/month free for 12 months
+- 30 GB storage included
+
+**Data Source for AMI:**
+Use `aws_ami` data source to find latest Ubuntu image dynamically
+
+**Resources:**
+- [AWS Provider Documentation](https://registry.terraform.io/providers/hashicorp/aws/latest/docs)
+- [EC2 Instance Resource](https://registry.terraform.io/providers/hashicorp/aws/latest/docs/resources/instance)
+- [AWS Free Tier](https://aws.amazon.com/free/)
+
+</details>
+
+<details>
+<summary>☁️ GCP Terraform Guide</summary>
+
+**GCP Setup:**
+
+**Authentication:**
+- Create service account in Google Cloud Console
+- Download JSON key file
+- Set `GOOGLE_APPLICATION_CREDENTIALS` environment variable
+- Enable Compute Engine API
+
+**Provider Configuration Pattern:**
+```hcl
+terraform {
+  required_providers {
+    google = {
+      source = "hashicorp/google"
+    }
+  }
+}
+
+provider "google" {
+  project = var.project_id
+  region  = var.region
+}
+```
+
+**Key Resources:**
+- `google_compute_instance` - VM instance
+- `google_compute_network` - VPC network
+- `google_compute_subnetwork` - Subnet
+- `google_compute_firewall` - Firewall rules
+
+**Free Tier Instance:**
+- Machine type: e2-micro
+- Zone: us-central1-a (or other free tier zone)
+- Always free (within limits)
+- Boot disk: 30 GB standard persistent disk
+
+**Resources:**
+- [Google Provider Documentation](https://registry.terraform.io/providers/hashicorp/google/latest/docs)
+- [Compute Instance Resource](https://registry.terraform.io/providers/hashicorp/google/latest/docs/resources/compute_instance)
+- [GCP Free Tier](https://cloud.google.com/free)
+
+</details>
+
+<details>
+<summary>☁️ Other Cloud Providers</summary>
+
+**Azure:**
+- Provider: `azurerm`
+- Resource: `azurerm_linux_virtual_machine`
+- Free tier: B1s instance
+- [Azure Provider Docs](https://registry.terraform.io/providers/hashicorp/azurerm/latest/docs)
+
+**VK Cloud:**
+- Based on OpenStack
+- Provider: OpenStack provider
+- [VK Cloud Documentation](https://mcs.mail.ru/help/)
+
+**DigitalOcean:**
+- Provider: `digitalocean`
+- Resource: `digitalocean_droplet`
+- Simple and beginner-friendly
+- [DigitalOcean Provider Docs](https://registry.terraform.io/providers/digitalocean/digitalocean/latest/docs)
+
+**Questions to Explore:**
+- What's the smallest instance size for your provider?
+- How do you find the right OS image ID?
+- What authentication method does your provider use?
+- How do you add SSH keys to instances?
+
+</details>
+
+<details>
+<summary>🔒 Security Best Practices</summary>
+
+**Credentials Management:**
+
+**❌ NEVER DO THIS:**
+```hcl
+provider "aws" {
+  access_key = "AKIAIOSFODNN7EXAMPLE"  # NEVER!
+  secret_key = "wJalrXUtnFEMI/K7MDENG/bPxRfiCYEXAMPLEKEY"  # NEVER!
+}
+```
+
+**✅ DO THIS INSTEAD:**
+
+**Option 1: Environment Variables**
+```bash
+export AWS_ACCESS_KEY_ID="your-key"
+export AWS_SECRET_ACCESS_KEY="your-secret"
+# Provider will auto-detect
+```
+
+**Option 2: Credentials File**
+```ini
+# ~/.aws/credentials (for AWS)
+[default]
+aws_access_key_id = your-key
+aws_secret_access_key = your-secret
+```
+
+**Option 3: terraform.tfvars (gitignored)**
+```hcl
+# terraform.tfvars (add to .gitignore!)
+access_key = "your-key"
+secret_key = "your-secret"
+```
+
+**Files to Add to .gitignore:**
+```
+# Terraform
+*.tfstate
+*.tfstate.*
+.terraform/
+terraform.tfvars
+*.tfvars
+# NOTE: do not ignore .terraform.lock.hcl — commit it so provider versions stay pinned
+
+# Cloud credentials
+*.pem
+*.key
+# Service account keys (.gitignore comments must be on their own line)
+*.json
+credentials
+```
+
+**SSH Key Management:**
+- Generate SSH key pair locally
+- Add public key to cloud provider
+- Keep private key secure (never commit)
+- Use `chmod 600` on private key file
+
+**Security Group Rules:**
+- Restrict SSH to your IP only (not 0.0.0.0/0)
+- Only open ports you need
+- Document why each port is open
+
+</details>
+
+<details>
+<summary>📁 Terraform Project Structure</summary>
+
+**Recommended Structure:**
+
+```
+terraform/
+├── .gitignore           # Ignore state, credentials
+├── main.tf              # Main resources
+├── variables.tf         # Input variables
+├── outputs.tf           # Output values
+├── terraform.tfvars     # Variable values (gitignored!)
+└── README.md            # Setup instructions
+```
+
+**What Goes in Each File:**
+
+**main.tf:**
+- Provider configuration
+- Resource definitions
+- Data sources
+
+**variables.tf:**
+- Variable declarations
+- Descriptions
+- Default values (non-sensitive only)
+
+**outputs.tf:**
+- Important values to display
+- VM IP addresses
+- Connection strings
+
+**terraform.tfvars:**
+- Actual variable values
+- Secrets and credentials
+- **MUST be in .gitignore**
+
+**Alternative: Single File**
+For small projects, you can put everything in `main.tf`, but multi-file is more maintainable.
+
+</details>
+
+**What to Document:**
+- Cloud provider chosen and why
+- Terraform version used
+- Resources created (VM size, region, etc.)
+- Public IP address of created VM
+- SSH connection command
+- Terminal output from `terraform plan` and `terraform apply`
+- Proof of SSH access to VM
+
+---
+
+### Task 2 — Pulumi VM Creation (4 pts)
+
+**Objective:** Destroy the Terraform VM and recreate the same infrastructure using Pulumi.
+
+**Requirements:**
+
+1. **Cleanup Terraform Infrastructure**
+   - Run `terraform destroy` to delete all resources
+   - Verify all resources are deleted in cloud console
+   - Document the cleanup process
+
+2. **Setup Pulumi**
+   - Install Pulumi CLI
+   - Choose a programming language (Python recommended, or TypeScript, Go, C#, Java)
+   - Initialize a new Pulumi project
+   - Configure cloud provider
+
+3. **Recreate Same Infrastructure**
+
+   Create a `pulumi/` directory with equivalent resources:
+
+   **Same Resources as Task 1:**
+   - VM/Compute Instance (same size)
+   - Network/VPC
+   - Security Group/Firewall (same rules)
+   - Public IP Address
+
+   **Goal:** Functionally identical infrastructure, different tool
+
+4. **Apply Infrastructure**
+   - Run `pulumi preview` to see planned changes
+   - Apply infrastructure with `pulumi up`
+   - Verify VM is accessible via SSH
+   - Document the public IP
+
+5. **Compare Experience**
+   - What was easier/harder than Terraform?
+   - How does the code differ?
+   - Which approach do you prefer and why?
+
+<details>
+<summary>💡 Pulumi Fundamentals</summary>
+
+**What is Pulumi?**
+
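+Pulumi is an IaC tool that lets you write infrastructure using real programming languages (Python, TypeScript, Go, etc.). The code you write is imperative, but Pulumi still builds a desired-state model from it and reconciles the cloud to match, much like Terraform does.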
+
+**Key Differences from Terraform:**
+
+| Aspect | Terraform | Pulumi |
+|--------|-----------|--------|
+| **Language** | HCL (declarative) | Python, JS, Go, etc. (imperative) |
+| **State** | Local or remote state file | Pulumi Cloud (free tier) or self-hosted |
+| **Logic** | Limited (count, for_each) | Full programming language |
+| **Testing** | External tools | Native unit tests |
+| **Secrets** | Plain in state | Encrypted by default |
+
+**Key Concepts:**
+
+**Resources:**
+- Similar to Terraform, but defined in code
+- Example (Python): `vm = compute.Instance("my-vm", ...)`
+
+**Stacks:**
+- Like Terraform workspaces
+- Separate environments (dev, staging, prod)
+- Each has its own config and state
+
+**Outputs:**
+- Return values from your program
+- Example: `pulumi.export("ip", vm.public_ip)`
+
+**Config:**
+- Per-stack configuration
+- Set with: `pulumi config set key value`
+- Access in code: `config.get("key")`
+
+**Typical Workflow:**
+```bash
+pulumi new <template>   # Create new project
+pulumi config set ...   # Configure settings
+pulumi preview          # Preview changes (like terraform plan)
+pulumi up               # Create/update infrastructure
+pulumi destroy          # Delete all infrastructure
+pulumi stack output     # View outputs
+```
+
+**Advantages of Pulumi:**
+- Use familiar programming languages
+- Full language features (loops, functions, classes)
+- Better IDE support (autocomplete, type checking)
+- Native testing capabilities
+- Secrets encrypted by default
+
+**Disadvantages of Pulumi:**
+- Smaller community than Terraform
+- More complex for simple tasks
+- Requires programming knowledge
+- Pulumi Cloud dependency (or self-hosted backend)
+
+**Resources:**
+- [Pulumi Documentation](https://www.pulumi.com/docs/)
+- [Pulumi Registry](https://www.pulumi.com/registry/) - Provider docs
+- [Python Examples](https://www.pulumi.com/docs/languages-sdks/python/)
+
+</details>
+
+<details>
+<summary>🐍 Pulumi with Python</summary>
+
+**Project Setup:**
+
+```bash
+pulumi new python
+# Follow prompts for project name, stack name
+```
+
+**Project Structure:**
+```
+pulumi/
+├── __main__.py          # Main infrastructure code
+├── requirements.txt     # Python dependencies
+├── Pulumi.yaml         # Project metadata
+├── Pulumi.dev.yaml     # Stack configuration
+└── venv/               # Python virtual environment
+```
+
+**Basic Pattern (AWS Example):**
+
+```python
+import pulumi
+import pulumi_aws as aws
+
+# Create a security group
+# NOTE: 0.0.0.0/0 on port 22 is for brevity only — restrict SSH to your own IP in your lab code
+security_group = aws.ec2.SecurityGroup("web-sg",
+    description="Allow SSH and HTTP",
+    ingress=[
+        {"protocol": "tcp", "from_port": 22, "to_port": 22, "cidr_blocks": ["0.0.0.0/0"]},
+        {"protocol": "tcp", "from_port": 80, "to_port": 80, "cidr_blocks": ["0.0.0.0/0"]},
+    ])
+
+# Create an EC2 instance
+instance = aws.ec2.Instance("my-vm",
+    instance_type="t2.micro",
+    ami="ami-0c55b159cbfafe1f0",  # Ubuntu
+    security_groups=[security_group.name])
+
+# Export the instance's public IP
+pulumi.export("public_ip", instance.public_ip)
+```
+
+**Configuration:**
+```bash
+pulumi config set aws:region us-east-1
+pulumi config set --secret aws:accessKey YOUR_KEY
+pulumi config set --secret aws:secretKey YOUR_SECRET
+```
+
+**Running:**
+```bash
+# Activate venv
+source venv/bin/activate  # or venv\Scripts\activate on Windows
+
+# Install dependencies
+pip install -r requirements.txt
+
+# Preview and apply
+pulumi preview
+pulumi up
+```
+
+**Resources:**
+- [Pulumi Python SDK](https://www.pulumi.com/docs/languages-sdks/python/)
+- [Pulumi AWS Examples](https://github.com/pulumi/examples/tree/master/aws-py-webserver)
+
+</details>
+
+<details>
+<summary>📦 Pulumi with TypeScript</summary>
+
+**Project Setup:**
+
+```bash
+pulumi new typescript
+```
+
+**Basic Pattern (AWS Example):**
+
+```typescript
+import * as pulumi from "@pulumi/pulumi";
+import * as aws from "@pulumi/aws";
+
+// Create a security group
+// NOTE: 0.0.0.0/0 on port 22 is for brevity only — restrict SSH to your own IP in your lab code
+const securityGroup = new aws.ec2.SecurityGroup("web-sg", {
+    description: "Allow SSH and HTTP",
+    ingress: [
+        { protocol: "tcp", fromPort: 22, toPort: 22, cidrBlocks: ["0.0.0.0/0"] },
+        { protocol: "tcp", fromPort: 80, toPort: 80, cidrBlocks: ["0.0.0.0/0"] },
+    ],
+});
+
+// Create an EC2 instance
+const instance = new aws.ec2.Instance("my-vm", {
+    instanceType: "t2.micro",
+    ami: "ami-0c55b159cbfafe1f0",
+    securityGroups: [securityGroup.name],
+});
+
+// Export the instance's public IP
+export const publicIp = instance.publicIp;
+```
+
+**Running:**
+```bash
+npm install
+pulumi preview
+pulumi up
+```
+
+</details>
+
+<details>
+<summary>☁️ Pulumi Cloud Providers</summary>
+
+**Installing Provider Packages:**
+
+**Yandex Cloud (Python):**
+```bash
+pip install pulumi-yandex
+```
+
+**AWS (Python):**
+```bash
+pip install pulumi-aws
+```
+
+**GCP (Python):**
+```bash
+pip install pulumi-gcp
+```
+
+**Azure (Python):**
+```bash
+pip install pulumi-azure-native
+```
+
+**Provider Documentation:**
+- [Pulumi Yandex](https://www.pulumi.com/registry/packages/yandex/)
+- [Pulumi AWS](https://www.pulumi.com/registry/packages/aws/)
+- [Pulumi GCP](https://www.pulumi.com/registry/packages/gcp/)
+- [Pulumi Azure](https://www.pulumi.com/registry/packages/azure-native/)
+
+**Authentication:**
+- Same as Terraform (environment variables, config files)
+- Pulumi can also use `pulumi config set --secret` for secure credential storage
+
+</details>
+
+<details>
+<summary>🔄 Migrating from Terraform to Pulumi</summary>
+
+**Key Differences:**
+
+**Resource Names:**
+- Terraform: `resource "aws_instance" "web" { ... }`
+- Pulumi: `const web = new aws.ec2.Instance("web", { ... })`
+
+**Variables:**
+- Terraform: `var.instance_type`
+- Pulumi: `config.require("instanceType")` or just regular variables
+
+**Outputs:**
+- Terraform: `output "ip" { value = aws_instance.web.public_ip }`
+- Pulumi: `export const ip = web.publicIp` (TS) or `pulumi.export("ip", web.public_ip)` (Python)
+
+**Benefits of Real Programming Language:**
+- Use loops, conditionals, functions naturally
+- Import external libraries
+- Better code reuse (functions, classes)
+- Type checking and IDE support
+
+**Conversion Tips:**
+1. Start with Terraform docs to understand resources needed
+2. Find equivalent Pulumi resources in registry
+3. Convert HCL blocks to function calls
+4. Use language features for logic
+
+**Pulumi Can Import Terraform State:**
+```bash
+pulumi import ...
+```
+But for this lab, start fresh with Pulumi.
+
+</details>
+
+**What to Document:**
+- Programming language chosen for Pulumi
+- Terraform destroy output
+- Pulumi preview and up output
+- Public IP of Pulumi-created VM
+- Comparison: Terraform vs Pulumi experience
+- Code differences (HCL vs Python/TypeScript)
+- Which tool you prefer and why
+
+---
+
+### Task 3 — Documentation (2 pts)
+
+**Objective:** Document your IaC implementation, decisions, and learnings.
+
+Create `terraform/docs/LAB04.md` (or `docs/LAB04.md` at root) with these sections:
+
+### 1. Cloud Provider & Infrastructure
+- Cloud provider chosen and rationale
+- Instance type/size and why
+- Region/zone selected
+- Total cost (should be $0 with free tier)
+- Resources created (list all)
+
+### 2. Terraform Implementation
+- Terraform version used
+- Project structure explanation
+- Key configuration decisions
+- Challenges encountered
+- Terminal output from key commands:
+  - `terraform init`
+  - `terraform plan` (sanitized, no secrets)
+  - `terraform apply`
+  - SSH connection to VM
+
+### 3. Pulumi Implementation
+- Pulumi version and language used
+- How code differs from Terraform
+- Advantages you discovered
+- Challenges encountered
+- Terminal output from:
+  - `pulumi preview`
+  - `pulumi up`
+  - SSH connection to VM
+
+### 4. Terraform vs Pulumi Comparison
+
+Brief comparison (3-5 sentences each):
+- **Ease of Learning:** Which was easier to learn and why?
+- **Code Readability:** Which is more readable for you?
+- **Debugging:** Which was easier to debug when things went wrong?
+- **Documentation:** Which has better docs and examples?
+- **Use Case:** When would you use Terraform? When Pulumi?
+
+### 5. Lab 5 Preparation & Cleanup
+
+**VM for Lab 5:**
+- Are you keeping your VM for Lab 5? (Yes/No)
+- If yes: Which VM (Terraform or Pulumi created)?
+- If no: What will you use for Lab 5? (Local VM/Will recreate cloud VM)
+
+**Cleanup Status:**
+- If keeping VM for Lab 5: Show VM is still running and accessible
+- If destroying everything: Terminal output showing both tools' resources destroyed
+- Cloud console screenshot showing resource status (optional but recommended)
+
+---
+
+## Bonus Task — IaC CI/CD + Infrastructure Import (2.5 pts)
+
+**Objective:** Add automated validation for infrastructure code and learn to import existing resources into Terraform.
+
+### Part 1: GitHub Actions for IaC Validation (1.5 pts)
+
+**Objective:** Automatically validate Terraform code on pull requests.
+
+**Requirements:**
+
+1. **Create Validation Workflow**
+
+   Create `.github/workflows/terraform-ci.yml` that:
+   - Triggers only on changes to `terraform/**` files
+   - Runs `terraform fmt -check` (code formatting validation)
+   - Runs `terraform init`
+   - Runs `terraform validate` (syntax validation)
+   - Runs `tflint` (Terraform linter for best practices)
+
+2. **Workflow Setup**
+   - Install Terraform in workflow
+   - Install tflint
+   - Configure path filters (similar to Lab 3)
+   - Show validation results in workflow logs
+
+3. **Testing**
+   - Create a PR with Terraform changes
+   - Verify workflow runs only for Terraform changes
+   - Show passing and failing validation examples
+
+<details>
+<summary>💡 Terraform CI/CD Concepts</summary>
+
+**Why Validate Infrastructure Code in CI?**
+
+- Catch syntax errors before apply
+- Enforce code formatting standards
+- Check for security issues and bad practices
+- Prevent broken configurations from merging
+- Review infrastructure changes before deployment
+
+**Terraform CI Steps:**
+
+**terraform fmt:**
+- Formats code to canonical style
+- Use `-check` flag to verify without changing files
+- Ensures consistency across team
+
+**terraform validate:**
+- Checks syntax and internal consistency
+- Validates resource configurations
+- Doesn't access provider APIs (fast)
+
+**tflint:**
+- Linter for Terraform code
+- Finds possible errors (invalid instance types, etc.)
+- Checks best practices
+- Provider-specific rules
+
+**Path Filters:**
+- Only run workflow when IaC files change
+- Same concept as Lab 3 path filters
+- Prevents unnecessary CI runs
+
+**Pattern for Workflow:**
+```yaml
+on:
+  pull_request:
+    paths:
+      - 'terraform/**'
+      - '.github/workflows/terraform-ci.yml'
+
+jobs:
+  validate:
+    runs-on: ubuntu-latest
+    steps:
+      - Checkout code
+      - Setup Terraform
+      - Install tflint
+      - Run terraform fmt -check
+      - Run terraform init
+      - Run terraform validate
+      - Run tflint
+```
+
+**Advanced: Terraform Plan in PR**
+
+You can also add `terraform plan` to show what would change:
+- Requires cloud credentials (use GitHub Secrets)
+- Shows plan output as PR comment
+- Helps reviewers understand impact
+- Use `terraform plan -no-color` for readable output
+
+**Security Considerations:**
+- Be careful with secrets in CI
+- Don't expose sensitive outputs
+- Use `-backend=false` for init if not using state
+- Consider using Terraform Cloud for plan sharing
+
+**Resources:**
+- [GitHub Actions for Terraform](https://developer.hashicorp.com/terraform/tutorials/automation/github-actions)
+- [tflint Documentation](https://github.com/terraform-linters/tflint)
+- [Setup Terraform Action](https://github.com/hashicorp/setup-terraform)
+
+</details>
+
+<details>
+<summary>🔧 tflint Setup</summary>
+
+**What is tflint?**
+
+A linter for Terraform that finds:
+- Possible errors (invalid instance types, deprecated syntax)
+- Best practice violations
+- Provider-specific issues
+
+**Installation in CI:**
+```yaml
+- name: Setup TFLint
+  uses: terraform-linters/setup-tflint@v3
+  with:
+    tflint_version: latest
+
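+- name: Init TFLint
+  run: tflint --init  # Download plugins declared in .tflint.hcl
+  working-directory: terraform/
+
+- name: Run TFLint
+  run: tflint --format compact
+  working-directory: terraform/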
+```
+
+**Local Installation:**
+```bash
+# macOS
+brew install tflint
+
+# Linux
+curl -s https://raw.githubusercontent.com/terraform-linters/tflint/master/install_linux.sh | bash
+
+# Windows
+choco install tflint
+```
+
+**Configuration (.tflint.hcl):**
+```hcl
+plugin "terraform" {
+  enabled = true
+}
+
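+plugin "aws" {  # Or your cloud provider's ruleset
+  enabled = true
+  # Non-bundled plugins need version and source so `tflint --init` can download them
+  version = "0.30.0"  # Pin to a current release of the ruleset
+  source  = "github.com/terraform-linters/tflint-ruleset-aws"
+}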
+```
+
+**Running Locally:**
+```bash
+cd terraform/
+tflint --init  # Download plugins
+tflint         # Run linting
+```
+
+**Common Issues Found:**
+- Invalid instance types
+- Missing required arguments
+- Deprecated syntax
+- Security group issues
+- Invalid AMI IDs
+
+</details>
+
+### Part 2: Import GitHub Repository to Terraform (1 pt)
+
+**Objective:** Learn to manage existing infrastructure with Terraform by importing your course repository.
+
+**Requirements:**
+
+1. **Import GitHub Repository**
+   - Create Terraform configuration for GitHub provider
+   - Define a `github_repository` resource for your course repo
+   - Use `terraform import` to bring existing repo under Terraform management
+   - Verify state matches reality
+
+2. **Manage Repository Settings**
+   - Add Terraform code to manage repository settings:
+     - Description
+     - Visibility (public/private)
+     - Has issues enabled
+     - Has wiki enabled
+     - Branch protection rules (optional)
+   - Apply changes and verify in GitHub
+
+3. **Documentation**
+   - Explain the import process
+   - Show terminal output of import command
+   - Document why importing existing resources matters
+
+<details>
+<summary>💡 Why Import Existing Resources?</summary>
+
+**The Problem:**
+
+In the real world, you often have:
+- Infrastructure created manually (before IaC adoption)
+- Resources created by other tools or people
+- Legacy systems that need to be managed with code
+
+You can't just run `terraform apply` - resources already exist!
+
+**The Solution: terraform import**
+
+Import brings existing resources into Terraform management:
+1. Write Terraform config describing the resource
+2. Run `terraform import` to link config to real resource
+3. Terraform now manages that resource
+4. Future changes go through Terraform
+
+**Advantages of Managing Existing Resources with IaC:**
+
+**1. Version Control:**
+- Track configuration changes over time
+- See who changed what and when
+- Rollback to previous configurations
+
+**2. Consistency:**
+- Standardize configuration across resources
+- Prevent configuration drift
+- Ensure compliance with policies
+
+**3. Automation:**
+- Changes require code review
+- CI/CD validation
+- Automated testing
+
+**4. Documentation:**
+- Code is living documentation
+- Anyone can see current configuration
+- No "tribal knowledge" needed
+
+**5. Disaster Recovery:**
+- Quickly recreate infrastructure from code
+- No manual steps to remember
+- Tested recovery process
+
+**6. Team Collaboration:**
+- Multiple people can work on infrastructure
+- PR-based workflow
+- No conflicting manual changes
+
+**Real-World Use Cases:**
+
+**Brownfield Infrastructure:**
+- A company has hundreds of manually created resources
+- Import them gradually into Terraform
+- Eventually all infrastructure is code-managed
+
+**Migrating Between Tools:**
+- Moving from CloudFormation to Terraform
+- Moving from manual management to IaC
+- Gradual transition without downtime
+
+**Compliance and Governance:**
+- All changes must go through code review
+- Audit trail of who changed what
+- Prevent unauthorized changes
+
+**Cost Management:**
+- Review infrastructure changes before apply
+- Prevent accidental expensive resources
+- Track infrastructure costs in code
+
+**The Import Process:**
+
+```bash
+# 1. Write the resource config (empty or partial)
+resource "github_repository" "course_repo" {
+  name = "DevOps-Core-Course"
+  # ... other settings
+}
+
+# 2. Import the existing resource
+terraform import github_repository.course_repo DevOps-Core-Course
+
+# 3. Terraform now tracks this resource in state
+# 4. Run terraform plan to see any drift
+# 5. Update config to match reality
+# 6. Apply to bring under full management
+```
+
+**Challenges:**
+
+- Config must match reality exactly
+- May need to import many related resources
+- Some resources don't support import
+- Requires careful planning
+
+**Best Practices:**
+
+- Import one resource at a time
+- Test in non-production first
+- Use `terraform plan` to verify match
+- Document the import process
+- Keep manual backups before import
+
+**Resources:**
+- [Terraform Import Command](https://developer.hashicorp.com/terraform/cli/import)
+- [Import Usage Examples](https://developer.hashicorp.com/terraform/cli/import/usage)
+
+</details>
+
+<details>
+<summary>🐙 GitHub Provider Setup</summary>
+
+**Installing GitHub Provider:**
+
+```hcl
+terraform {
+  required_providers {
+    github = {
+      source  = "integrations/github"
+      version = "~> 5.0"
+    }
+  }
+}
+
+provider "github" {
+  token = var.github_token  # Personal access token
+}
+```
+
+**Authentication:**
+
+**Create Personal Access Token:**
+1. GitHub → Settings → Developer settings → Personal access tokens → Tokens (classic)
+2. Generate new token
+3. Select scopes: `repo` (all repo permissions)
+4. Copy token (shown once!)
+
+**Configure Token:**
+```bash
+# Environment variable (recommended; the provider reads GITHUB_TOKEN when `token` is omitted)
+export GITHUB_TOKEN="your-token-here"
+
+# Or in terraform.tfvars (gitignored!)
+github_token = "your-token-here"
+```
+
+**Repository Resource:**
+
+```hcl
+resource "github_repository" "course_repo" {
+  name        = "DevOps-Core-Course"
+  description = "DevOps course lab assignments"
+  visibility  = "public"
+
+  has_issues   = true
+  has_wiki     = false
+  has_projects = false
+
+  # Other settings...
+}
+```
+
+**Import Command:**
+
+```bash
+# Format: terraform import <resource_type>.<name> <repo_name>
+terraform import github_repository.course_repo DevOps-Core-Course
+```
+
+**After Import:**
+1. Run `terraform plan` - shows differences between code and reality
+2. Update your config to match reality (eliminate differences)
+3. Run `terraform plan` again - should show "No changes"
+4. Now you can manage the repo with Terraform!
+
+**What You Can Manage:**
+- Repository settings
+- Branch protection rules
+- Collaborators and teams
+- Webhooks
+- Deploy keys
+- Repository secrets
+
+**Resources:**
+- [GitHub Provider Documentation](https://registry.terraform.io/providers/integrations/github/latest/docs)
+- [Repository Resource](https://registry.terraform.io/providers/integrations/github/latest/docs/resources/repository)
+- [Import Guide](https://registry.terraform.io/providers/integrations/github/latest/docs/resources/repository#import)
+
+</details>
+
+**What to Document:**
+- Workflow file implementation
+- Path filter configuration
+- tflint results and any issues found
+- Example of workflow running on PR
+- GitHub repository import process
+- Terminal output of import command
+- Why importing matters (brief explanation)
+- Benefits you see for managing repos with IaC
+
+---
+
+## How to Submit
+
+1. **Create Branch:**
+   - Create a new branch called `lab04`
+   - Work on this branch
+
+2. **Commit Work:**
+   - Add Terraform code (`terraform/` directory)
+   - Add Pulumi code (`pulumi/` directory)
+   - Add documentation (`docs/LAB04.md` or `terraform/docs/LAB04.md`)
+   - Add GitHub workflow (`.github/workflows/terraform-ci.yml` if doing bonus)
+   - **IMPORTANT:** Ensure `.gitignore` excludes:
+     - `*.tfstate`, `*.tfstate.*`, `.terraform/`, `terraform.tfvars`
+     - `pulumi/venv/`, `Pulumi.*.yaml` (stack configs with secrets)
+     - Any credential files
+   - Commit using the Conventional Commits format
+
+3. **CLEANUP BEFORE COMMITTING:**
+
+   **If keeping VM for Lab 5:**
+   - ✅ Keep one VM running (Terraform or Pulumi - your choice)
+   - ✅ Destroy the other tool's resources
+   - ✅ Document which VM you're keeping in LAB04.md
+   - ✅ Check no secrets in code
+   - ✅ Review .gitignore is correct
+
+   **If NOT keeping VM for Lab 5:**
+   - ✅ Run `terraform destroy`
+   - ✅ Run `pulumi destroy`
+   - ✅ Verify no resources in cloud console
+   - ✅ Check no secrets in code
+   - ✅ Review .gitignore is correct
+   - ✅ Document your Lab 5 plan (local VM or recreate cloud VM)
+
+4. **Create Pull Requests:**
+   - **PR #1:** `your-fork:lab04` → `course-repo:master`
+   - **PR #2:** `your-fork:lab04` → `your-fork:master`
+   - Bonus workflow will validate Terraform code automatically
+
+---
+
+## Acceptance Criteria
+
+### Main Tasks (10 points)
+
+**Terraform VM Creation (4 pts):**
+- [ ] Cloud provider chosen and configured
+- [ ] Terraform project created in `terraform/` directory
+- [ ] All required resources defined (VM, network, security group, public IP)
+- [ ] Free tier instance used
+- [ ] Variables and outputs used appropriately
+- [ ] `.gitignore` configured correctly
+- [ ] Infrastructure applied successfully
+- [ ] VM accessible via SSH (proof provided)
+- [ ] Terminal output from `terraform plan` and `terraform apply` provided
+- [ ] No secrets committed to Git
+
+**Pulumi VM Recreation (4 pts):**
+- [ ] Terraform resources destroyed (proof provided)
+- [ ] Pulumi project created in `pulumi/` directory
+- [ ] Programming language chosen
+- [ ] Same infrastructure recreated with Pulumi
+- [ ] Infrastructure applied successfully
+- [ ] VM accessible via SSH (proof provided)
+- [ ] Terminal output from `pulumi preview` and `pulumi up` provided
+- [ ] Comparison with Terraform documented
+
+**Documentation (2 pts):**
+- [ ] `docs/LAB04.md` complete with all required sections
+- [ ] Cloud provider choice justified
+- [ ] Terraform implementation documented
+- [ ] Pulumi implementation documented
+- [ ] Terraform vs Pulumi comparison provided
+- [ ] Lab 5 preparation documented (keeping VM or using local/recreating)
+- [ ] Cleanup status documented (what's kept, what's destroyed)
+- [ ] Terminal outputs provided (sanitized, no secrets)
+
+### Bonus Task (2.5 points)
+
+**Part 1: IaC CI/CD (1.5 pts)**
+- [ ] GitHub Actions workflow created (`.github/workflows/terraform-ci.yml`)
+- [ ] Path filters configured for `terraform/**`
+- [ ] Workflow runs `terraform fmt -check`
+- [ ] Workflow runs `terraform validate`
+- [ ] Workflow runs `tflint`
+- [ ] Workflow triggers only on Terraform changes (proof provided)
+- [ ] Documentation includes workflow implementation details
+
+**Part 2: GitHub Repository Import (1 pt)**
+- [ ] GitHub provider configured in Terraform
+- [ ] Repository resource defined
+- [ ] `terraform import` executed successfully
+- [ ] State matches reality (terraform plan shows no changes)
+- [ ] Terminal output of import process provided
+- [ ] Documentation explains why importing matters
+- [ ] Benefits of managing existing resources documented
+
+---
+
+## Rubric
+
+| Criteria | Points | Description |
+|----------|--------|-------------|
+| **Terraform Implementation** | 4 pts | Working infrastructure, best practices, documentation |
+| **Pulumi Implementation** | 4 pts | Working infrastructure, comparison provided |
+| **Documentation** | 2 pts | Complete, clear, includes cleanup proof |
+| **Bonus: IaC CI/CD** | 1.5 pts | Automated validation, path filters working |
+| **Bonus: Import** | 1 pt | Successful import, benefits explained |
+| **Total** | 12.5 pts | 10 pts required + 2.5 pts bonus |
+
+**Grading:**
+- **10/10:** Both tools working perfectly, excellent comparison, comprehensive documentation, proper cleanup
+- **8-9/10:** Infrastructure works, good documentation, minor issues or missing comparisons
+- **6-7/10:** One tool works well, other has issues, minimal comparison, incomplete docs
+- **<6/10:** Infrastructure doesn't work, major issues, secrets committed, no cleanup
+
+**Critical Requirements:**
+- ✅ MUST use free tier resources only
+- ✅ MUST document Lab 5 VM plan (keeping, local, or recreating)
+- ✅ MUST NOT commit secrets or state files
+- ✅ MUST provide SSH access proof
+- ⚠️ Keeping ONE VM for Lab 5 is acceptable (document it!)
+- ❌ Multiple VMs running without documentation = point deduction
+
+---
+
+## Resources
+
+<details>
+<summary>📚 Terraform Documentation</summary>
+
+- [Terraform Documentation](https://developer.hashicorp.com/terraform/docs)
+- [Terraform Registry](https://registry.terraform.io/) - All providers
+- [Terraform Best Practices](https://www.terraform-best-practices.com/)
+- [HCL Configuration Language](https://developer.hashicorp.com/terraform/language)
+
+</details>
+
+<details>
+<summary>📚 Pulumi Documentation</summary>
+
+- [Pulumi Documentation](https://www.pulumi.com/docs/)
+- [Pulumi Registry](https://www.pulumi.com/registry/)
+- [Pulumi Examples](https://github.com/pulumi/examples)
+- [Pulumi vs Terraform](https://www.pulumi.com/docs/concepts/vs/terraform/)
+
+</details>
+
+<details>
+<summary>☁️ Cloud Provider Documentation</summary>
+
+- [Yandex Cloud Docs](https://cloud.yandex.com/en/docs)
+- [AWS Documentation](https://docs.aws.amazon.com/)
+- [GCP Documentation](https://cloud.google.com/docs)
+- [Azure Documentation](https://learn.microsoft.com/azure/)
+- [VK Cloud Docs](https://mcs.mail.ru/help/)
+
+</details>
+
+<details>
+<summary>🔒 Security & Best Practices</summary>
+
+- [Terraform Security Best Practices](https://spacelift.io/blog/terraform-security-best-practices)
+- [Managing Secrets in Terraform](https://developer.hashicorp.com/terraform/tutorials/configuration-language/sensitive-variables)
+- [Pulumi Secrets Management](https://www.pulumi.com/docs/concepts/secrets/)
+- [Git Secrets Prevention](https://github.com/awslabs/git-secrets)
+
+</details>
+
+<details>
+<summary>🛠️ Tools</summary>
+
+- [Terraform CLI](https://developer.hashicorp.com/terraform/downloads)
+- [Pulumi CLI](https://www.pulumi.com/docs/install/)
+- [tflint](https://github.com/terraform-linters/tflint) - Terraform linter
+- [terraform-docs](https://terraform-docs.io/) - Generate docs from code
+- [Infracost](https://www.infracost.io/) - Cost estimation for Terraform
+
+</details>
+
+---
+
+## Looking Ahead
+
+- **Lab 5:** Ansible will provision software on your VM (install Docker, deploy your app from Labs 1-3)
+  - **You'll need a VM ready** - either keep your cloud VM from this lab, use a local VM, or recreate later
+- **Lab 6:** Ansible + Terraform integration (provision and configure in one workflow)
+- **Lab 9:** Kubernetes will replace individual VMs (but the concepts are the same)
+- **Lab 13:** ArgoCD will manage infrastructure changes (GitOps for infrastructure)
+
+---
+
+**Good luck!** 🚀
+
+> **Remember:** Infrastructure as Code is about automation, repeatability, and collaboration. Focus on understanding WHY we define infrastructure in code, not just HOW. Consider keeping one VM for Lab 5 (Ansible). If destroying resources, document your Lab 5 plan. Never commit secrets!
diff --git a/labs/lab05.md b/labs/lab05.md
new file mode 100644
index 0000000000..c5a4902a67
--- /dev/null
+++ b/labs/lab05.md
@@ -0,0 +1,975 @@
+# Lab 5 — Ansible Fundamentals
+
+![difficulty](https://img.shields.io/badge/difficulty-beginner-success)
+![topic](https://img.shields.io/badge/topic-Configuration%20Management-blue)
+![points](https://img.shields.io/badge/points-10%2B2.5-orange)
+![tech](https://img.shields.io/badge/tech-Ansible-informational)
+
+> Learn configuration management fundamentals by building reusable Ansible roles for infrastructure provisioning and application deployment.
+
+## Overview
+
+Master the basics of Ansible by creating a professional role-based automation system. You'll build roles for system provisioning (Docker, common packages) and application deployment, demonstrating idempotency, handlers, and secure credential management with Ansible Vault.
+
+**What You'll Learn:**
+- Ansible roles architecture and best practices
+- Role-based code organization for reusability
+- Writing tasks, handlers, and defaults
+- Idempotency and why it matters
+- Ansible Vault for secure credential management
+- Handlers for efficient service management
+- Infrastructure verification and health checks
+- Basic application deployment with Docker
+
+**Tech Stack:** Ansible 2.16+ | Ansible Vault | Docker | YAML
+
+**Connection to Previous Labs:**
+- **Lab 4:** Use the VM you created (cloud or local)
+- **Labs 1-3:** Deploy your containerized Python app with CI/CD-built images
+- **Lab 6:** Add advanced features (blocks, tags, Docker Compose, CI/CD)
+
+---
+
+## Prerequisites
+
+You need a target VM from Lab 4:
+- **Option A:** Cloud VM from Lab 4 (Terraform/Pulumi)
+- **Option B:** Local VM (VirtualBox/Vagrant)
+- **Option C:** Recreate VM using your Lab 4 code
+
+**VM Requirements:**
+- Ubuntu 24.04 LTS or 22.04 LTS
+- SSH access configured
+- Your SSH key added
+- Sudo access (passwordless recommended for automation)
+- Python 3 installed (usually pre-installed on Ubuntu)
+
+---
+
+## Tasks
+
+### Task 1 — Ansible Setup & Role Structure (2 pts)
+
+**Objective:** Install Ansible locally, create proper role-based project structure, and configure inventory.
+
+#### 1.1 Install Ansible
+
+Install Ansible on your local machine (control node):
+
+**Ubuntu/Debian:**
+```bash
+sudo apt update
+sudo apt install ansible
+```
+
+**macOS:**
+```bash
+brew install ansible
+```
+
+**Windows:**
+- Use WSL2 and install in Linux environment
+- OR use Ansible via Docker
+
+Verify installation: `ansible --version`
+
+#### 1.2 Create Role-Based Project Structure
+
+Create this structure:
+
+```
+ansible/
+├── inventory/
+│   └── hosts.ini              # Static inventory
+├── roles/
+│   ├── common/                # Common system tasks
+│   │   ├── tasks/
+│   │   │   └── main.yml
+│   │   └── defaults/
+│   │       └── main.yml
+│   ├── docker/                # Docker installation
+│   │   ├── tasks/
+│   │   │   └── main.yml
+│   │   ├── handlers/
+│   │   │   └── main.yml
+│   │   └── defaults/
+│   │       └── main.yml
+│   └── app_deploy/            # Application deployment
+│       ├── tasks/
+│       │   └── main.yml
+│       ├── handlers/
+│       │   └── main.yml
+│       └── defaults/
+│           └── main.yml
+├── playbooks/
+│   ├── site.yml               # Main playbook
+│   ├── provision.yml          # System provisioning
+│   └── deploy.yml             # App deployment
+├── group_vars/
+│   └── all.yml               # Encrypted variables (Vault)
+├── ansible.cfg               # Ansible configuration
+└── docs/
+    └── LAB05.md              # Your documentation
+```
+
+<details>
+<summary>💡 Why Ansible Roles?</summary>
+
+**What are Roles?**
+
+Roles are the standard way to organize Ansible code for reusability and maintainability.
+
+**Benefits of Roles:**
+
+1. **Reusability**: Use same role across projects
+2. **Organization**: Clear structure, easy to navigate
+3. **Maintainability**: Changes in one place
+4. **Sharing**: Share roles via Ansible Galaxy
+5. **Testing**: Test roles independently
+6. **Modularity**: Mix and match roles
+
+**Role Structure:**
+
+Each role has a standard structure:
+
+```
+role_name/
+├── tasks/           # Main task list
+│   └── main.yml
+├── handlers/        # Handler definitions
+│   └── main.yml
+├── defaults/        # Default variables (low priority)
+│   └── main.yml
+├── vars/            # Role variables (high priority)
+│   └── main.yml
+├── files/           # Static files to copy
+├── templates/       # Jinja2 templates
+└── meta/            # Role metadata and dependencies
+    └── main.yml
+```
+
+**Only create directories you need!** Empty directories can be omitted.
+
+**Resources:**
+- [Ansible Roles Documentation](https://docs.ansible.com/ansible/latest/user_guide/playbooks_reuse_roles.html)
+- [Role Directory Structure](https://docs.ansible.com/ansible/latest/user_guide/playbooks_reuse_roles.html#role-directory-structure)
+
+</details>
+
+#### 1.3 Configure Inventory
+
+Create `inventory/hosts.ini` with your VM details:
+
+```ini
+[webservers]
+your-vm-name ansible_host=<VM-IP-ADDRESS> ansible_user=<username>
+```
+
+<details>
+<summary>💡 Inventory Configuration</summary>
+
+**Static Inventory Format:**
+```ini
+[group_name]
+hostname ansible_host=192.168.1.100 ansible_user=ubuntu ansible_ssh_private_key_file=~/.ssh/id_rsa
+
+[group_name:vars]
+ansible_python_interpreter=/usr/bin/python3
+```
+
+**Common Connection Parameters:**
+- `ansible_host` - IP address or hostname
+- `ansible_user` - SSH username
+- `ansible_port` - SSH port (default: 22)
+- `ansible_ssh_private_key_file` - Path to SSH key
+- `ansible_python_interpreter` - Python path on target
+
+**Testing Connectivity:**
+```bash
+ansible all -i inventory/hosts.ini -m ping
+ansible webservers -i inventory/hosts.ini -a "uptime"
+```
+
+**Resources:**
+- [Ansible Inventory Documentation](https://docs.ansible.com/ansible/latest/user_guide/intro_inventory.html)
+
+</details>
+
+#### 1.4 Create Ansible Configuration
+
+Create `ansible.cfg`:
+
+```ini
+[defaults]
+inventory = inventory/hosts.ini
+roles_path = roles
+host_key_checking = False
+remote_user = ubuntu
+retry_files_enabled = False
+
+[privilege_escalation]
+become = True
+become_method = sudo
+become_user = root
+```
+
+#### 1.5 Test Connectivity
+
+Verify Ansible can connect to your VM:
+
+```bash
+cd ansible/
+ansible all -m ping
+ansible webservers -a "uname -a"
+```
+
+You should see successful responses (green "SUCCESS" messages).
+
+---
+
+### Task 2 — System Provisioning Roles (4 pts)
+
+**Objective:** Create dedicated roles for system provisioning and demonstrate idempotency.
+
+#### 2.1 Create Common Role
+
+Create `roles/common/tasks/main.yml`:
+
+**Required Tasks:**
+- Update apt cache
+- Install essential packages (python3-pip, curl, git, vim, htop, etc.)
+- Set timezone (optional but good practice)
+
+**Create `roles/common/defaults/main.yml`:**
+Define default variables for packages to install.
+
+<details>
+<summary>💡 Common Role Pattern</summary>
+
+**Purpose:**
+Basic system setup that every server needs.
+
+**Typical Tasks:**
+- Update package cache
+- Install essential tools
+- Configure system settings
+- Set up logging
+- Create users/groups
+
+**Example pattern to research:**
+```yaml
+---
+- name: Update apt cache
+  apt:
+    update_cache: yes
+    cache_valid_time: 3600
+
+- name: Install common packages
+  apt:
+    name: "{{ common_packages }}"
+    state: present
+```
+
+**Questions:**
+- What does `cache_valid_time` do?
+- How do you define a list of packages in defaults?
+- Should you use `state: present` or `state: latest`?
+
+**Resources:**
+- [apt module](https://docs.ansible.com/ansible/latest/collections/ansible/builtin/apt_module.html)
+- [timezone module](https://docs.ansible.com/ansible/latest/collections/community/general/timezone_module.html)
+
+</details>
+
+#### 2.2 Create Docker Role
+
+Create `roles/docker/tasks/main.yml`:
+
+**Required Tasks:**
+1. Add Docker GPG key
+2. Add Docker repository
+3. Install Docker packages (docker-ce, docker-ce-cli, containerd.io)
+4. Ensure Docker service is running and enabled
+5. Add user to docker group
+6. Install python3-docker (for Ansible docker modules)
+
+**Create `roles/docker/handlers/main.yml`:**
+- Handler to restart Docker service
+
+**Create `roles/docker/defaults/main.yml`:**
+- Docker version constraints (if any)
+- User to add to docker group
+
+<details>
+<summary>💡 Docker Installation Pattern</summary>
+
+**Docker Installation Steps:**
+
+You need to research the official Docker installation for Ubuntu and translate it to Ansible tasks.
+
+**Key Modules:**
+- `apt_key` - Manage APT repository keys
+- `apt_repository` - Manage APT repositories
+- `apt` - Manage packages
+- `service` - Manage services
+- `user` - Manage users and groups
+
+**Questions to Research:**
+- What's Docker's official GPG key URL?
+- What repository URL should you use for Ubuntu?
+- How do you use Ansible facts like `{{ ansible_distribution_release }}`?
+- Why add user to docker group?
+- When should the handler be triggered?
+
+**Handler Pattern:**
+```yaml
+---
+- name: restart docker
+  service:
+    name: docker
+    state: restarted
+```
+
+**Trigger handler with:**
+```yaml
+- name: Some task
+  module: ...
+  notify: restart docker
+```
+
+**Resources:**
+- [Install Docker on Ubuntu (Official)](https://docs.docker.com/engine/install/ubuntu/)
+- [Ansible Handlers](https://docs.ansible.com/ansible/latest/user_guide/playbooks_handlers.html)
+
+</details>
+
+#### 2.3 Create Provisioning Playbook
+
+Create `playbooks/provision.yml`:
+
+```yaml
+---
+- name: Provision web servers
+  hosts: webservers
+  become: yes
+
+  roles:
+    - common
+    - docker
+```
+
+**That's it!** The playbook is clean because all logic is in roles.
+
+#### 2.4 Run Provisioning and Demonstrate Idempotency
+
+**First Run:**
+```bash
+ansible-playbook playbooks/provision.yml
+```
+
+Observe the output - tasks should show "changed" status (yellow).
+
+**Second Run:**
+```bash
+ansible-playbook playbooks/provision.yml
+```
+
+**CRITICAL:** Tasks should show "ok" status (green), not "changed". This demonstrates idempotency!
+
+<details>
+<summary>💡 Understanding Idempotency</summary>
+
+**What is Idempotency?**
+
+An idempotent operation produces the same result whether executed once or multiple times.
+
+**In Ansible:**
+- Running a playbook multiple times should be safe
+- Only makes changes when needed
+- Doesn't break if run repeatedly
+- Converges to desired state
+
+**Ansible Output Colors:**
+- **Green (ok):** Task ran, no change needed (desired state already achieved)
+- **Yellow (changed):** Task made a change to reach desired state
+- **Red (failed):** Task failed
+- **Cyan (skipped):** Task was skipped
+
+**Why Idempotency Matters:**
+
+1. **Safety:** Can re-run playbooks without fear
+2. **Reliability:** Consistent results
+3. **Recovery:** Re-run after partial failure
+4. **Drift Detection:** Changes only when state drifts
+5. **Confidence:** Know exactly what will change
+
+**Making Tasks Idempotent:**
+
+**Use Stateful Modules:**
+- `apt: state=present` (not just `apt: name=package`)
+- `service: state=started` (not `command: systemctl start`)
+- `file: state=directory` (not `command: mkdir`)
+
+**Testing Idempotency:**
+
+1. Run playbook first time → many "changed"
+2. Run playbook second time → all "ok", zero "changed"
+3. If tasks show "changed" on second run, investigate why
+
+**Resources:**
+- [Ansible Idempotency](https://docs.ansible.com/ansible/latest/reference_appendices/glossary.html)
+
+</details>
+
+**What to Document:**
+- Terminal output from BOTH runs
+- Analysis: Which tasks changed first time? Why?
+- Explanation: Why nothing changed second time?
+
+---
+
+### Task 3 — Application Deployment Role (2 pts)
+
+**Objective:** Create a deployment role that securely pulls and runs your Python containerized app using Ansible Vault for credentials.
+
+#### 3.1 Initialize Ansible Vault
+
+Create encrypted file for sensitive data:
+
+```bash
+ansible-vault create group_vars/all.yml
+```
+
+You'll be prompted for a vault password. **Remember this password!**
+
+Add your Docker Hub credentials and app configuration:
+
+```yaml
+---
+# Docker Hub credentials
+dockerhub_username: your-username
+dockerhub_password: your-access-token
+
+# Application configuration
+app_name: devops-app
+docker_image: "{{ dockerhub_username }}/{{ app_name }}"
+docker_image_tag: latest
+app_port: 5000
+app_container_name: "{{ app_name }}"
+```
+
+Save and exit.
+
+<details>
+<summary>💡 Ansible Vault Best Practices</summary>
+
+**What is Ansible Vault?**
+
+Ansible Vault encrypts sensitive data so it can be safely stored in version control.
+
+**Vault Commands:**
+
+```bash
+# Create encrypted file
+ansible-vault create filename.yml
+
+# Edit encrypted file
+ansible-vault edit filename.yml
+
+# View encrypted file
+ansible-vault view filename.yml
+
+# Encrypt existing file
+ansible-vault encrypt filename.yml
+
+# Decrypt file (careful!)
+ansible-vault decrypt filename.yml
+```
+
+**Using Vaulted Files:**
+
+**Option 1: Prompt for password:**
+```bash
+ansible-playbook playbook.yml --ask-vault-pass
+```
+
+**Option 2: Password file:**
+```bash
+echo "your-password" > .vault_pass
+chmod 600 .vault_pass
+# Add .vault_pass to .gitignore!
+
+ansible-playbook playbook.yml --vault-password-file .vault_pass
+```
+
+**Option 3: In ansible.cfg:**
+```ini
+[defaults]
+vault_password_file = .vault_pass
+```
+
+**Best Practices:**
+
+1. **Never commit unencrypted secrets**
+2. **Use separate file for vault password** (add to .gitignore)
+3. **Rotate vault password regularly**
+4. **Don't decrypt files permanently**
+5. **Use `no_log: true` for tasks with secrets**
+
+**Resources:**
+- [Ansible Vault Documentation](https://docs.ansible.com/ansible/latest/user_guide/vault.html)
+
+</details>
+
+#### 3.2 Create Application Deployment Role
+
+Create `roles/app_deploy/tasks/main.yml`:
+
+**Required Tasks:**
+1. Log in to Docker Hub (using vaulted credentials)
+2. Pull Docker image
+3. Stop existing container (if running)
+4. Remove old container (if exists)
+5. Run new container with:
+   - Proper port mapping (5000:5000)
+   - Environment variables (if any)
+   - Restart policy (unless-stopped)
+   - Container name
+6. Wait for application to be ready (port check)
+7. Verify health endpoint
+
+**Create `roles/app_deploy/handlers/main.yml`:**
+- Handler to restart application container
+
+**Create `roles/app_deploy/defaults/main.yml`:**
+- Default port
+- Default restart policy
+- Default environment variables
+
+<details>
+<summary>💡 Docker Deployment with Ansible</summary>
+
+**Key Modules:**
+
+**docker_login:**
+Authenticate with Docker registry.
+
+**Questions:**
+- How do you pass credentials from vaulted variables?
+- What's the `no_log` parameter for?
+
+**docker_image:**
+Manage Docker images (pull, build, remove).
+
+**Questions:**
+- How do you pull an image?
+- What's the `source: pull` parameter?
+
+**docker_container:**
+Manage Docker containers.
+
+**Questions:**
+- How do you ensure a container is running?
+- What restart policies exist?
+- How do you map ports?
+- How do you set environment variables?
+- What's the difference between `state: started` and `state: present`?
+
+**wait_for:**
+Wait for port to be available.
+
+**uri:**
+Make HTTP requests (for health checks).
+
+**Security Note:**
+Always use `no_log: true` for tasks with credentials:
+```yaml
+- name: Login
+  docker_login:
+    username: "{{ dockerhub_username }}"
+    password: "{{ dockerhub_password }}"
+  no_log: true  # Prevents credentials in logs
+```
+
+**Resources:**
+- [docker_login module](https://docs.ansible.com/ansible/latest/collections/community/docker/docker_login_module.html)
+- [docker_image module](https://docs.ansible.com/ansible/latest/collections/community/docker/docker_image_module.html)
+- [docker_container module](https://docs.ansible.com/ansible/latest/collections/community/docker/docker_container_module.html)
+- [wait_for module](https://docs.ansible.com/ansible/latest/collections/ansible/builtin/wait_for_module.html)
+- [uri module](https://docs.ansible.com/ansible/latest/collections/ansible/builtin/uri_module.html)
+
+</details>
+
+#### 3.3 Create Deployment Playbook
+
+Create `playbooks/deploy.yml`:
+
+```yaml
+---
+- name: Deploy application
+  hosts: webservers
+  become: yes
+
+  roles:
+    - app_deploy
+```
+
+#### 3.4 Run Deployment
+
+```bash
+ansible-playbook playbooks/deploy.yml --ask-vault-pass
+```
+
+Or, if a vault password file is configured in `ansible.cfg` (`vault_password_file`):
+```bash
+ansible-playbook playbooks/deploy.yml
+```
+
+**Verify:**
+- Container is running: `ansible webservers -a "docker ps"`
+- App is accessible: `curl http://<VM-IP>:5000/health`
+- Check main endpoint: `curl http://<VM-IP>:5000/`
+
+**What to Document:**
+- Terminal output from deployment
+- Container status: `docker ps` output
+- Health check verification
+- Handler execution (if any)
+
+---
+
+### Task 4 — Documentation (2 pts)
+
+**Objective:** Document your Ansible implementation and demonstrate understanding.
+
+Create `ansible/docs/LAB05.md` with these sections:
+
+#### 1. Architecture Overview
+- Ansible version used
+- Target VM OS and version
+- Role structure diagram or explanation
+- Why roles instead of monolithic playbooks?
+
+#### 2. Roles Documentation
+
+For each role (common, docker, app_deploy):
+- **Purpose**: What does this role do?
+- **Variables**: Key variables and defaults
+- **Handlers**: What handlers are defined?
+- **Dependencies**: Does it depend on other roles?
+
+#### 3. Idempotency Demonstration
+- Terminal output from FIRST provision.yml run
+- Terminal output from SECOND provision.yml run
+- Analysis: What changed first time? What didn't change second time?
+- Explanation: What makes your roles idempotent?
+
+#### 4. Ansible Vault Usage
+- How you store credentials securely
+- Vault password management strategy
+- Example of encrypted file (show it's encrypted!)
+- Why Ansible Vault is important
+
+#### 5. Deployment Verification
+- Terminal output from deploy.yml run
+- Container status: `docker ps` output
+- Health check verification: `curl` outputs
+- Handler execution (if any)
+
+#### 6. Key Decisions
+Answer briefly (2-3 sentences each):
+- **Why use roles instead of plain playbooks?**
+- **How do roles improve reusability?**
+- **What makes a task idempotent?**
+- **How do handlers improve efficiency?**
+- **Why is Ansible Vault necessary?**
+
+#### 7. Challenges (Optional)
+- Issues encountered and solutions
+- Keep it brief - bullet points OK
+
+---
+
+## Bonus Task — Dynamic Inventory with Cloud Plugins (2.5 pts)
+
+**Objective:** Use Ansible's built-in inventory plugins to dynamically discover your cloud VMs instead of hardcoding IPs.
+
+<details>
+<summary>💡 Why Dynamic Inventory?</summary>
+
+**The Problem with Static Inventory:**
+```ini
+[webservers]
+vm ansible_host=192.168.1.100 ansible_user=ubuntu
+```
+- IP changes? Must update manually
+- Multiple VMs? Update each one
+- Scaling? Very tedious
+
+**Dynamic Inventory Solution:**
+- Query cloud provider API automatically
+- Always up-to-date IPs
+- Filter by tags/labels
+- Group automatically
+- Scale to hundreds of VMs
+
+**Ansible Inventory Plugins:**
+Ansible has official plugins for major clouds.
+
+**Available Plugins:**
+- `yandex.cloud.yandex_compute` - Yandex Cloud
+- `amazon.aws.aws_ec2` - Amazon EC2
+- `google.gcp.gcp_compute` - Google Cloud
+- `azure.azcollection.azure_rm` - Microsoft Azure
+- `community.digitalocean.digitalocean` - DigitalOcean
+
+</details>
+
+**Requirements:**
+
+1. **Install the collection for your cloud provider** from Lab 4
+
+2. **Create inventory plugin configuration file** - `ansible/inventory/<cloud>.yml`
+   - Must specify plugin name
+   - Must configure authentication
+   - Must set `ansible_host` to public IP (use `compose` parameter)
+   - Must set `ansible_user` (use `compose` parameter)
+   - Should filter running VMs only
+   - Should create groups (like `webservers`)
+
+3. **Update ansible.cfg** to use the plugin
+
+4. **Test the inventory:**
+   ```bash
+   ansible-inventory --graph    # Show discovered hosts
+   ansible all -m ping          # Test connectivity
+   ```
+
+5. **Run your playbooks** with dynamic inventory
+
+<details>
+<summary>💡 Research Path</summary>
+
+**Steps to Complete:**
+
+1. **Find the right plugin** for your cloud provider
+   - Search: "ansible [your-cloud] inventory plugin"
+   - Official documentation link
+
+2. **Install collection:**
+   - Use `ansible-galaxy collection install <collection-name>`
+   - Some require additional Python packages
+
+3. **Understand required parameters:**
+   - Authentication: How does plugin authenticate?
+   - Connection: How to set `ansible_host` from cloud metadata?
+   - Grouping: How to organize hosts?
+   - Filtering: How to select only your VMs?
+
+4. **Create YAML config file:**
+   - Must start with `plugin: <plugin-name>`
+   - Research what each cloud calls their fields
+   - Example: AWS uses `public_ip_address`, GCP uses `networkInterfaces[0]...`, etc.
+
+5. **Key Questions to Research:**
+   - What authentication method to use?
+   - What's the API field name for public IP?
+   - How to filter only running VMs?
+   - How to create host groups?
+
+**Hints by Cloud:**
+
+**Yandex Cloud:**
+- Collection: `yandex.cloud`
+- Key parameters: `auth_kind`, `folder_id`, `compose`
+- IP field is nested: `network_interfaces[0]...`
+
+**AWS:**
+- Collection: `amazon.aws`
+- Key parameters: `regions`, `filters`, `compose`
+- IP field: `public_ip_address`
+- Filter by tags: `"tag:Name": value`
+
+**GCP:**
+- Collection: `google.gcp`
+- Key parameters: `projects`, `auth_kind`, `compose`
+- IP field: `networkInterfaces[0].accessConfigs[0].natIP`
+
+**Azure:**
+- Collection: `azure.azcollection`
+- Key parameters: `include_vm_resource_groups`, `compose`
+- IP field: `public_ipv4_addresses[0]`
+
+**Documentation Links:**
+- [Ansible Inventory Plugins](https://docs.ansible.com/ansible/latest/plugins/inventory.html)
+- [Dynamic Inventory Guide](https://docs.ansible.com/ansible/latest/user_guide/intro_dynamic_inventory.html)
+- Search: "ansible [cloud] inventory plugin" for specific docs
+
+</details>
+
+**What to Document:**
+- Which cloud plugin you chose and why
+- How you configured authentication
+- How you mapped cloud metadata to Ansible variables
+- Terminal output from `ansible-inventory --graph` showing auto-discovered hosts
+- Terminal output from running playbooks with dynamic inventory
+- Explanation: What happens when VM IP changes? (No manual updates needed!)
+- Benefits compared to static inventory
+
+---
+
+## How to Submit
+
+1. **Create Branch:**
+   ```bash
+   git checkout -b lab05
+   ```
+
+2. **Commit Work:**
+   - Add Ansible project (`ansible/` directory with roles)
+   - Add documentation (`ansible/docs/LAB05.md`)
+   - **IMPORTANT:** Add to `.gitignore`:
+     ```
+     # Ansible
+     *.retry
+     .vault_pass
+     ansible/inventory/*.pyc
+     __pycache__/
+     ```
+   - Commit: `git commit -m "feat: complete lab05 - ansible fundamentals"`
+
+3. **Verify No Secrets:**
+   - ✅ Check vault password not committed
+   - ✅ Check `.vault_pass` not committed
+   - ✅ Encrypted vault files OK to commit (they're encrypted!)
+   - ✅ SSH private keys not committed
+
+4. **Create Pull Requests:**
+   - **PR #1:** `your-fork:lab05` → `course-repo:master`
+   - **PR #2:** `your-fork:lab05` → `your-fork:master`
+
+---
+
+## Acceptance Criteria
+
+### Main Tasks (10 points)
+
+**Setup & Structure (2 pts):**
+- [ ] Proper role-based directory structure created
+- [ ] All three roles created (common, docker, app_deploy)
+- [ ] Each role has appropriate tasks, handlers, and defaults
+- [ ] `ansible.cfg` configured correctly
+- [ ] Inventory configured and connectivity tested
+
+**System Provisioning (4 pts):**
+- [ ] Common role implemented
+- [ ] Docker role implemented with all required tasks
+- [ ] Provision playbook uses roles correctly
+- [ ] **Idempotency demonstrated** (two runs, second shows no changes)
+- [ ] Terminal output from both runs provided
+- [ ] Handlers used appropriately
+
+**Application Deployment (2 pts):**
+- [ ] Ansible Vault used for credentials
+- [ ] Vault file encrypted (verify with `ansible-vault view`)
+- [ ] `app_deploy` role complete with all required tasks
+- [ ] Deploy playbook uses role correctly
+- [ ] Container running with proper configuration
+- [ ] Health check verification included
+- [ ] Handlers defined in role
+
+**Documentation (2 pts):**
+- [ ] `ansible/docs/LAB05.md` complete with all sections
+- [ ] Architecture and role structure explained
+- [ ] Each role documented (purpose, variables, handlers)
+- [ ] Idempotency analysis included
+- [ ] Vault usage documented
+- [ ] Key decisions explained
+
+### Bonus Task (2.5 points)
+
+**Dynamic Inventory (2.5 pts):**
+- [ ] Cloud inventory plugin configured
+- [ ] Integrates with your cloud provider from Lab 4
+- [ ] Playbooks work with dynamic inventory
+- [ ] Terminal output showing `ansible-inventory --graph`
+- [ ] Benefits documented
+
+---
+
+## Rubric
+
+| Criteria | Points | Description |
+|----------|--------|-------------|
+| **Setup & Structure** | 2 pts | Proper role architecture, clean organization |
+| **System Provisioning** | 4 pts | All roles working, idempotent, handlers used |
+| **Application Deployment** | 2 pts | Vault used, role-based deployment, app running |
+| **Documentation** | 2 pts | Complete, clear, justifies decisions |
+| **Bonus: Dynamic Inventory** | 2.5 pts | Cloud plugin working |
+| **Total** | 12.5 pts | 10 pts required + 2.5 pts bonus |
+
+**Grading:**
+- **10/10:** Perfect role structure, deep understanding, excellent idempotency demo
+- **8-9/10:** Working roles, good practices, solid understanding
+- **6-7/10:** Basic roles work, some understanding, missing best practices
+- **<6/10:** Roles don't work properly, no idempotency, poor structure
+
+**Critical Requirements:**
+- ✅ MUST use role-based structure (not monolithic playbooks)
+- ✅ MUST demonstrate idempotency (two runs documented)
+- ✅ MUST use Ansible Vault for credentials
+- ✅ MUST NOT commit vault password or unencrypted secrets
+
+---
+
+## Resources
+
+<details>
+<summary>📚 Ansible Core</summary>
+
+- [Ansible Documentation](https://docs.ansible.com/)
+- [Ansible Roles](https://docs.ansible.com/ansible/latest/user_guide/playbooks_reuse_roles.html)
+- [Best Practices](https://docs.ansible.com/ansible/latest/user_guide/playbooks_best_practices.html)
+
+</details>
+
+<details>
+<summary>🔒 Security</summary>
+
+- [Ansible Vault](https://docs.ansible.com/ansible/latest/user_guide/vault.html)
+- [Security Best Practices](https://docs.ansible.com/ansible/latest/user_guide/playbooks_best_practices.html#best-practices-for-security)
+
+</details>
+
+<details>
+<summary>🐳 Docker with Ansible</summary>
+
+- [Docker Modules](https://docs.ansible.com/ansible/latest/collections/community/docker/index.html)
+- [Docker Scenario Guide](https://docs.ansible.com/ansible/latest/scenario_guides/guide_docker.html)
+
+</details>
+
+<details>
+<summary>🔄 Dynamic Inventory</summary>
+
+- [Dynamic Inventory](https://docs.ansible.com/ansible/latest/user_guide/intro_dynamic_inventory.html)
+- [Inventory Plugins](https://docs.ansible.com/ansible/latest/plugins/inventory.html)
+
+</details>
+
+---
+
+## Looking Ahead
+
+**Lab 6:** Advanced Ansible features (blocks, tags, Docker Compose, CI/CD automation)
+
+You'll build on these roles by:
+- Adding blocks and tags for better control
+- Upgrading to Docker Compose
+- Implementing wipe logic
+- Automating deployment with GitHub Actions
+
+---
+
+**Good luck!** 🚀
+
+> **Remember:** Roles are the foundation of Ansible. Focus on creating clean, idempotent roles with proper structure. Use handlers efficiently. Secure your credentials with Vault. Document your decisions, not just your code. This foundation will be essential for Lab 6!
diff --git a/labs/lab06.md b/labs/lab06.md
new file mode 100644
index 0000000000..c4405cbc47
--- /dev/null
+++ b/labs/lab06.md
@@ -0,0 +1,1352 @@
+# Lab 6 — Advanced Ansible & CI/CD
+
+![difficulty](https://img.shields.io/badge/difficulty-intermediate-yellow)
+![topic](https://img.shields.io/badge/topic-Ansible%20%26%20CI%2FCD-blue)
+![points](https://img.shields.io/badge/points-10%2B2.5-orange)
+![tech](https://img.shields.io/badge/tech-Ansible%20|%20Docker%20Compose%20|%20GitHub%20Actions-informational)
+
+> Enhance your Ansible automation with advanced features including blocks, tags, Docker Compose, role dependencies, wipe logic, and CI/CD integration.
+
+## Overview
+
+Build on Lab 5 by enhancing your Ansible automation with production-ready features. You'll refactor roles with blocks and tags, upgrade to Docker Compose, implement safe cleanup logic, and fully automate deployments with CI/CD.
+
+**What You'll Learn:**
+- Blocks for error handling and task grouping
+- Tags for selective Ansible execution
+- Docker Compose templating with Jinja2
+- Role dependencies and execution order
+- Safe wipe logic with double-gating (variable + tag)
+- GitHub Actions for Ansible automation
+- Multi-app deployment patterns (Bonus)
+
+**Tech Stack:** Ansible 2.16+ | Docker Compose v2 | GitHub Actions | Jinja2
+
+**Prerequisites:** Lab 5 completed (Ansible roles, playbooks, Vault), containerized app from Lab 2, GitHub Actions knowledge from Lab 3
+
+---
+
+## Tasks
+
+### Task 1 — Refactor with Blocks & Tags (2 pts)
+
+#### 1.1 Understanding Blocks
+
+Blocks allow you to:
+- **Group tasks** logically (e.g., all Docker installation tasks)
+- **Apply directives** once to multiple tasks (when, become, tags)
+- **Handle errors** with rescue and always sections
+- **Improve readability** by showing task relationships
+
+**Example Block Pattern:**
+```yaml
+- name: Install package with error handling
+  block:
+    - name: Update apt cache
+      # task 1
+
+    - name: Install package
+      # task 2
+
+  rescue:
+    - name: Handle installation failure
+      # runs only if block fails
+
+  always:
+    - name: Cleanup temp files
+      # runs regardless of success/failure
+
+  when: ansible_os_family == "Debian"
+  become: true
+  tags:
+    - packages
+```
+
+#### 1.2 Understanding Tags
+
+Tags enable selective execution:
+```bash
+# Run only tagged tasks
+ansible-playbook provision.yml --tags "docker"
+
+# Skip specific tags
+ansible-playbook provision.yml --skip-tags "common"
+
+# Multiple tags
+ansible-playbook provision.yml --tags "packages,docker"
+
+# List all available tags
+ansible-playbook provision.yml --list-tags
+```
+
+#### 1.3 Refactor `common` Role
+
+**File:** `roles/common/tasks/main.yml`
+
+**Requirements:**
+1. Group package installation tasks in a block with tag `packages`
+2. Group user creation tasks in a block with tag `users`
+3. Add error handling with rescue for apt cache update failures
+4. Use always block to log completion
+
+**Tag Strategy:**
+- `packages` - all package installation tasks
+- `users` - all user management tasks
+- `common` - entire role (applied at role level)
+
+**Hints:**
+- Add rescue block that runs `apt-get update --fix-missing` on failure
+- Use always block to create a log file in /tmp indicating completion
+- Apply `become: true` at block level instead of per task
+
+**Research Questions:**
+- Q: What happens if rescue block also fails?
+- Q: Can you have nested blocks?
+- Q: How do tags inherit to tasks within blocks?
+
+#### 1.4 Refactor `docker` Role
+
+**File:** `roles/docker/tasks/main.yml`
+
+**Requirements:**
+1. Group Docker installation tasks in block with tag `docker_install`
+2. Group Docker configuration tasks in block with tag `docker_config`
+3. Add rescue block to retry apt update on GPG key failure
+4. Use always block to ensure Docker service is enabled
+
+**Additional Tags:**
+- `docker` - entire role
+- `docker_install` - installation only
+- `docker_config` - configuration only
+
+**Hints:**
+- Docker GPG key addition may fail on first try (network timeout)
+- Rescue block should wait 10 seconds and retry
+- Always block should ensure Docker service is enabled and started
+
+#### 1.5 Testing Blocks & Tags
+
+**Test Commands:**
+```bash
+# Test provision with only docker
+ansible-playbook playbooks/provision.yml --tags "docker"
+
+# Skip common role
+ansible-playbook playbooks/provision.yml --skip-tags "common"
+
+# Install packages only across all roles
+ansible-playbook playbooks/provision.yml --tags "packages"
+
+# Check mode to see what would run
+ansible-playbook playbooks/provision.yml --tags "docker" --check
+
+# Run only docker installation tasks
+ansible-playbook playbooks/provision.yml --tags "docker_install"
+```
+
+**Evidence Required:**
+- Output showing selective execution with --tags
+- Output showing error handling with rescue block triggered
+- List of all available tags (--list-tags output)
+
+---
+
+### Task 2 — Upgrade to Docker Compose (3 pts)
+
+#### 2.1 Why Docker Compose?
+
+**Advantages over `docker run`:**
+- **Declarative configuration** - define desired state, not commands
+- **Multi-container management** - networks, volumes, dependencies
+- **Environment variable management** - .env files, variable substitution
+- **Easy updates** - change config file and recreate
+- **Better for production** - consistent, reproducible deployments
+
+#### 2.2 Rename Role
+
+**Action Required:**
+```bash
+cd ansible/roles
+mv app_deploy web_app
+```
+
+**Update all references:**
+- Playbook imports: `roles/app_deploy` → `roles/web_app`
+- Documentation: app_deploy → web_app
+- Variable prefixes: Consider `web_app_*` for consistency
+
+**Why rename?**
+- `web_app` is more specific and descriptive
+- Prepares for potential other app types (database_app, cache_app)
+- Better aligns with wipe logic variable naming
+
+#### 2.3 Create Docker Compose Template
+
+**File:** `roles/web_app/templates/docker-compose.yml.j2`
+
+**Requirements:**
+1. Use Jinja2 templating for dynamic values
+2. Define service name, image, ports, environment variables
+3. Include restart policy
+4. Use networks if needed
+5. Support variable substitution for app-specific config
+
+**Template Pattern:**
+```yaml
+version: '3.8'
+
+services:
+  {{ app_name }}:
+    image: {{ docker_image }}:{{ docker_tag }}
+    container_name: {{ app_name }}
+    ports:
+      - "{{ app_port }}:{{ app_internal_port }}"
+    environment:
+      # Add environment variables here
+      # Use Vault-encrypted secrets
+    restart: unless-stopped
+    # Add other configuration
+```
+
+**Variables to support:**
+- `app_name` - service/container name (default: devops-app)
+- `docker_image` - Docker Hub image
+- `docker_tag` - image version (default: latest)
+- `app_port` - host port (default: 8000)
+- `app_internal_port` - container port (default: 8000)
+- Environment variables for app configuration
+
+**Research Questions:**
+- Q: What's the difference between `restart: always` and `restart: unless-stopped`?
+- Q: How do Docker Compose networks differ from Docker bridge networks?
+- Q: Can you reference Ansible Vault variables in the template?
+
+#### 2.4 Define Role Dependencies
+
+**File:** `roles/web_app/meta/main.yml`
+
+**Purpose:** Ensure Docker is installed before deploying web app.
+
+**Pattern:**
+```yaml
+---
+dependencies:
+  - role: role_name
+    # Optional variables to pass
+    vars:
+      var_name: value
+```
+
+**Requirements:**
+1. Add `docker` role as dependency
+2. Ensure correct execution order automatically
+3. Document why dependency is needed
+
+**Test:** Run only `web_app` role - Docker should install automatically:
+```bash
+ansible-playbook playbooks/deploy.yml
+# Should automatically run docker role first
+```
+
+#### 2.5 Implement Docker Compose Deployment
+
+**File:** `roles/web_app/tasks/main.yml`
+
+**Requirements:**
+1. Create application directory (e.g., /opt/{{ app_name }})
+2. Template docker-compose.yml to the directory
+3. Use the `community.docker.docker_compose_v2` module (recommended for Compose v2) or the legacy `docker_compose` module (Compose v1 only)
+4. Ensure idempotency (check if already running)
+5. Add appropriate tags: `app_deploy`, `compose`
+
+**Deployment Block Pattern:**
+```yaml
+- name: Deploy application with Docker Compose
+  block:
+    - name: Create app directory
+      # Use file module
+
+    - name: Template docker-compose file
+      # Use template module
+
+    - name: Deploy with docker-compose
+      # Use docker_compose module
+      # state: present (or up)
+
+  rescue:
+    - name: Handle deployment failure
+      # Log error, optionally rollback
+
+  tags:
+    - app_deploy
+    - compose
+```
+
+**Hints:**
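+- Legacy `docker_compose` module: install the Compose v1 Python library with `pip3 install docker-compose`
+- `docker_compose_v2` module: install the `community.docker` collection (`ansible-galaxy collection install community.docker`); it drives the Docker Compose v2 CLI plugin on the target host
+- Set `pull: always` (`pull: true` in the legacy module) to always get the latest image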
+- Use `project_src` to specify directory with docker-compose.yml
+
+**Research:**
+- Look up `community.docker.docker_compose_v2` module
+- Compare `state: present` vs other state options
+- Understand `recreate` parameter options
+
+#### 2.6 Variables Configuration
+
+**File:** `group_vars/all.yml` (or role defaults)
+
+**Required Variables:**
+```yaml
+# Application Configuration
+app_name: devops-app
+docker_image: your_dockerhub_username/devops-info-service
+docker_tag: latest
+app_port: 8000
+app_internal_port: 8000
+
+# Docker Compose Config
+compose_project_dir: "/opt/{{ app_name }}"
+docker_compose_version: "3.8"
+
+# Secrets (use Vault)
+app_secret_key: !vault |
+          $ANSIBLE_VAULT;1.1;AES256
+          ...
+```
+
+**Encrypt sensitive values:**
+```bash
+ansible-vault encrypt_string 'secret_value' --name 'app_secret_key'
+```
+
+#### 2.7 Testing Docker Compose Deployment
+
+**Test Commands:**
+```bash
+# Full deployment
+ansible-playbook playbooks/deploy.yml
+
+# Check idempotency (run twice, second should show no changes)
+ansible-playbook playbooks/deploy.yml
+ansible-playbook playbooks/deploy.yml
+
+# Verify on target VM
+ssh user@vm_ip
+docker ps
+docker compose -f /opt/devops-app/docker-compose.yml ps
+curl http://localhost:8000
+```
+
+**Evidence Required:**
+- Output showing Docker Compose deployment success
+- Idempotency proof (second run shows "ok" not "changed")
+- Application running and accessible
+- Contents of templated docker-compose.yml
+
+---
+
+### Task 3 — Wipe Logic Implementation (1 pt)
+
+#### 3.1 Understanding Wipe Logic
+
+**Purpose:** Clean removal of deployed applications for:
+- **Clean reinstallation** (wipe old → deploy new)
+- Testing from fresh state
+- Rolling back to clean slate
+- Decommissioning applications
+- Resource cleanup before upgrades
+
+**Implementation Requirements:**
+- ✅ Controlled by variable: `web_app_wipe: true`
+- ✅ Gated by specific tag: `web_app_wipe`
+- ❌ NOT using the special "never" tag
+- Default behavior: wipe tasks do NOT run
+- Explicit invocation required
+
+#### 3.2 Create Wipe Tasks
+
+**File:** `roles/web_app/tasks/wipe.yml`
+
+**Requirements:**
+1. Stop and remove containers (Docker Compose down)
+2. Remove docker-compose.yml file
+3. Remove application directory
+4. Optionally remove Docker images (consider disk space)
+5. Log wipe completion
+
+**Implementation Pattern:**
+```yaml
+---
+- name: Wipe web application
+  block:
+    - name: Stop and remove containers
+      ...
+
+    - name: Remove docker-compose file
+      ...
+
+    - name: Remove application directory
+      ...
+
+    - name: Log wipe completion
+      debug:
+        msg: "Application {{ app_name }} wiped successfully"
+
+  when: ...
+  tags:
+    - web_app_wipe
+```
+
+**Key Points:**
+- `when` condition checks variable (default: false)
+- `tags` enables selective execution
+- `ignore_errors` prevents failure if already clean
+- `| bool` ensures proper boolean evaluation
+
+#### 3.3 Include Wipe in Main Tasks
+
+**File:** `roles/web_app/tasks/main.yml`
+
+**Add at the beginning (before deployment tasks):**
+```yaml
+---
+# Wipe logic runs first (when explicitly requested)
+- name: Include wipe tasks
+  include_tasks: wipe.yml
+  tags:
+    - web_app_wipe
+
+# Deployment tasks follow...
+- name: Deploy application with Docker Compose
+  block:
+    # ... your deployment tasks
+```
+
+**Why at the beginning?**
+- Enables clean reinstallation: wipe → deploy
+- Logical flow: remove old → install new
+- The `web_app_wipe` variable (default `false`) still prevents accidental wipe during normal deployment; the tag additionally allows a wipe-only run
+- Supports use case: `ansible-playbook deploy.yml -e "web_app_wipe=true"`
+
+#### 3.4 Configure Wipe Variable
+
+**File:** `roles/web_app/defaults/main.yml`
+
+**Add:**
+```yaml
+# Wipe Logic Control
+web_app_wipe: false  # Default: do not wipe
+```
+
+**Documentation comment:**
+```yaml
+# Set to true to remove application completely
+# Wipe only:    ansible-playbook deploy.yml -e "web_app_wipe=true" --tags web_app_wipe
+# Clean install: ansible-playbook deploy.yml -e "web_app_wipe=true"
+```
+
+#### 3.5 Testing Wipe Logic
+
+**Test Scenarios:**
+
+**Scenario 1: Normal deployment (wipe should NOT run)**
+```bash
+ansible-playbook playbooks/deploy.yml
+
+# Verify: app deploys normally, wipe tasks skipped (web_app_wipe defaults to false)
+ssh user@vm_ip "docker ps"
+```
+
+**Scenario 2: Wipe only (remove existing deployment)**
+```bash
+ansible-playbook playbooks/deploy.yml \
+  -e "web_app_wipe=true" \
+  --tags web_app_wipe
+
+# Verify: app should be removed, deployment skipped
+ssh user@vm_ip "docker ps"  # Should not show app
+ssh user@vm_ip "ls /opt"    # Should not have app directory
+```
+
+**Scenario 3: Clean reinstallation (wipe → deploy)**
+```bash
+# This is the KEY use case: fresh start
+ansible-playbook playbooks/deploy.yml \
+  -e "web_app_wipe=true"
+
+# What happens:
+# 1. Wipe tasks run first (remove old installation)
+# 2. Deployment tasks run second (install fresh)
+# Result: clean reinstallation
+
+# Verify: old app removed, new app running
+ssh user@vm_ip "docker ps"
+```
+
+**Scenario 4: Safety checks (variable and tag gating)**
+```bash
+# 4a: Tag specified but variable false (when condition blocks it)
+ansible-playbook playbooks/deploy.yml --tags web_app_wipe
+# Result: wipe tasks skipped (variable is false); deployment tasks are also skipped because they do not carry the web_app_wipe tag
+
+# 4b: Variable true, deployment skipped (only wipe runs)
+ansible-playbook playbooks/deploy.yml \
+  -e "web_app_wipe=true" \
+  --tags web_app_wipe
+# Result: only wipe, no deployment
+```
+
+**Evidence Required:**
+- Output of Scenario 1 showing normal deployment (wipe skipped)
+- Output of Scenario 2 showing wipe-only operation
+- Output of Scenario 3 showing clean reinstall (wipe → deploy)
+- Output of Scenario 4a showing wipe blocked by when condition
+- Screenshot of application running after clean reinstall
+
+#### 3.6 Research Questions
+
+Answer these in your documentation:
+1. **Why use both variable AND tag?** (Double safety mechanism)
+2. **What's the difference between `never` tag and this approach?**
+3. **Why must wipe logic come BEFORE deployment in main.yml?** (Clean reinstall scenario)
+4. **When would you want clean reinstallation vs. rolling update?**
+5. **How would you extend this to wipe Docker images and volumes too?**
+
+---
+
+### Task 4 — CI/CD with GitHub Actions (3 pts)
+
+#### 4.1 Why Automate Ansible?
+
+**Benefits:**
+- **Consistency** - same process every time
+- **Speed** - automatic deployments on push
+- **Safety** - linting catches errors before execution
+- **Auditability** - GitHub logs every deployment
+- **Integration** - combines with testing, building, scanning
+
+**CI/CD Flow:**
+```
+Code Push → Lint Ansible → Run Ansible Playbook → Verify Deployment
+```
+
+#### 4.2 Install GitHub Actions Runner (Optional)
+
+**Two Approaches:**
+
+**Approach A: Self-hosted runner on target VM (Recommended)**
+- More realistic for production
+- Direct access to target server
+- Faster (no SSH overhead)
+- Setup: GitHub Repo → Settings → Actions → Runners → Add runner
+
+**Approach B: GitHub-hosted runner with SSH**
+- Easier setup
+- Requires SSH key configuration
+- Uses GitHub Secrets for credentials
+- Slower but simpler
+
+Choose based on your infrastructure preference.
+
+#### 4.3 Create Ansible Workflow
+
+**File:** `.github/workflows/ansible-deploy.yml`
+
+**Requirements:**
+1. Trigger on push to ansible directory
+2. Run ansible-lint for syntax checking
+3. Execute Ansible playbook
+4. Verify deployment success
+5. Use path filters to avoid unnecessary runs
+
+**Workflow Structure:**
+```yaml
+name: Ansible Deployment
+
+on:
+  push:
+    branches: [ main, master ]
+    paths:
+      - 'ansible/**'
+      - '.github/workflows/ansible-deploy.yml'
+  pull_request:
+    branches: [ main, master ]
+    paths:
+      - 'ansible/**'
+
+jobs:
+  lint:
+    name: Ansible Lint
+    runs-on: ubuntu-latest
+    steps:
+      - name: Checkout code
+        uses: actions/checkout@v4
+
+      - name: Set up Python
+        uses: actions/setup-python@v5
+        with:
+          python-version: '3.12'
+
+      - name: Install dependencies
+        run: |
+          pip install ansible ansible-lint
+
+      - name: Run ansible-lint
+        run: |
+          cd ansible
+          ansible-lint playbooks/*.yml
+
+  deploy:
+    name: Deploy Application
+    needs: lint
+    runs-on: ubuntu-latest  # or self-hosted
+    steps:
+      # Add deployment steps
+      # - Setup Ansible
+      # - Configure SSH (if needed)
+      # - Decrypt Vault (use GitHub Secrets)
+      # - Run playbook
+      # - Verify deployment
+```
+
+#### 4.4 Configure GitHub Secrets
+
+**Required Secrets:** (Settings → Secrets and variables → Actions)
+
+1. `ANSIBLE_VAULT_PASSWORD` - Vault password for decryption
+2. `SSH_PRIVATE_KEY` - SSH key for target VM (only needed with a GitHub-hosted runner that connects over SSH)
+3. `VM_HOST` - Target VM IP/hostname
+4. `VM_USER` - SSH username
+
+**Using Secrets in Workflow:**
+```yaml
+- name: Deploy with Ansible
+  env:
+    ANSIBLE_VAULT_PASSWORD: ${{ secrets.ANSIBLE_VAULT_PASSWORD }}
+  run: |
+    echo "$ANSIBLE_VAULT_PASSWORD" > /tmp/vault_pass
+    ansible-playbook playbooks/deploy.yml \
+      --vault-password-file /tmp/vault_pass
+    rm /tmp/vault_pass
+```
+
+#### 4.5 Implement Deployment Step
+
+**For self-hosted runner:**
+```yaml
+deploy:
+  runs-on: self-hosted
+  steps:
+    - uses: actions/checkout@v4
+
+    - name: Deploy with Ansible
+      run: |
+        cd ansible
+        echo "${{ secrets.ANSIBLE_VAULT_PASSWORD }}" > /tmp/vault_pass
+        ansible-playbook playbooks/deploy.yml \
+          --vault-password-file /tmp/vault_pass \
+          --tags "app_deploy"
+        rm /tmp/vault_pass
+```
+
+**For GitHub-hosted runner:**
+```yaml
+deploy:
+  runs-on: ubuntu-latest
+  steps:
+    - uses: actions/checkout@v4
+
+    - name: Set up Python
+      uses: actions/setup-python@v5
+      with:
+        python-version: '3.12'
+
+    - name: Install Ansible
+      run: pip install ansible
+
+    - name: Setup SSH
+      run: |
+        mkdir -p ~/.ssh
+        echo "${{ secrets.SSH_PRIVATE_KEY }}" > ~/.ssh/id_rsa
+        chmod 600 ~/.ssh/id_rsa
+        ssh-keyscan -H ${{ secrets.VM_HOST }} >> ~/.ssh/known_hosts
+
+    - name: Deploy with Ansible
+      run: |
+        cd ansible
+        echo "${{ secrets.ANSIBLE_VAULT_PASSWORD }}" > /tmp/vault_pass
+        ansible-playbook playbooks/deploy.yml \
+          -i inventory/hosts.ini \
+          --vault-password-file /tmp/vault_pass
+        rm /tmp/vault_pass
+```
+
+#### 4.6 Add Verification Step
+
+**After deployment, verify it worked:**
+```yaml
+- name: Verify Deployment
+  run: |
+    sleep 10  # Wait for app to start
+    curl -f http://${{ secrets.VM_HOST }}:8000 || exit 1
+    curl -f http://${{ secrets.VM_HOST }}:8000/health || exit 1
+```
+
+#### 4.7 Path Filters Best Practice
+
+**Why path filters?**
+- Don't run Ansible workflow when changing docs
+- Separate workflows for different concerns
+- Faster CI, lower costs
+
+**Example:**
+```yaml
+on:
+  push:
+    paths:
+      - 'ansible/**'           # Ansible code
+      - '!ansible/docs/**'     # Exclude docs
+      - '.github/workflows/ansible-deploy.yml'  # Workflow changes
+```
+
+#### 4.8 Add Status Badge
+
+**File:** `README.md` (or ansible/README.md)
+
+**Add badge:**
+```markdown
+[![Ansible Deployment](https://github.com/your-username/your-repo/actions/workflows/ansible-deploy.yml/badge.svg)](https://github.com/your-username/your-repo/actions/workflows/ansible-deploy.yml)
+```
+
+#### 4.9 Testing CI/CD
+
+**Test Sequence:**
+1. Make a change to ansible code (e.g., update variable in group_vars)
+2. Commit and push to GitHub
+3. Watch Actions tab for workflow execution
+4. Verify lint job passes
+5. Verify deploy job succeeds
+6. Check application is updated on target VM
+
+**Evidence Required:**
+- Screenshot of successful workflow run
+- Output logs showing ansible-lint passing
+- Output logs showing ansible-playbook execution
+- Verification step output showing app responding
+- Status badge in README showing passing
+
+#### 4.10 Research Questions
+
+Answer in documentation:
+1. **What are the security implications of storing SSH keys in GitHub Secrets?**
+2. **How would you implement a staging → production deployment pipeline?**
+3. **What would you add to make rollbacks possible?**
+4. **How does a self-hosted runner improve security compared to a GitHub-hosted runner?**
+
+---
+
+### Task 5 — Documentation (1 pt)
+
+Create `ansible/docs/LAB06.md` with the following:
+
+**Required Sections:**
+1. **Overview** - What you accomplished and technologies used
+2. **Blocks & Tags** - Block usage in each role, tag strategy, execution examples with screenshots
+3. **Docker Compose Migration** - Template structure, role dependencies, before/after comparison
+4. **Wipe Logic** - Implementation details, variable + tag approach, test results
+5. **CI/CD Integration** - Workflow architecture, setup steps, evidence of automated deployments
+6. **Testing Results** - All test scenarios, idempotency verification, application accessibility
+7. **Challenges & Solutions** - Difficulties encountered and how you solved them
+8. **Research Answers** - All research questions answered with analysis
+
+**Code Documentation:**
+- Add clear comments in all modified Ansible files
+- Document variables in templates
+- Explain safety mechanisms in wipe logic
+- Document workflow steps in CI/CD files
+
+**Evidence:**
+- Terminal outputs showing tagged execution
+- Wipe logic test results (all 4 scenarios)
+- CI/CD workflow logs and screenshots
+- Application accessibility verification
+
+---
+
+### Bonus Part 1 — Multi-App Deployment (1.5 pts)
+
+#### Bonus 1.1 Prerequisites
+
+**Required:**
+- Completed Lab 1 Bonus (compiled language app: Go/Rust/Java/C#)
+- Completed Lab 2 Bonus (multi-stage Docker build)
+- Completed Lab 3 Bonus Part 1 (multi-app CI/CD)
+
+**You should have:**
+- Python web app (everyone has this)
+- Compiled language web app (Go/Rust/Java/C#)
+- Both apps containerized and on Docker Hub
+- Both apps with similar endpoints (/, /health)
+
+#### Bonus 1.2 Role Reusability Pattern
+
+**Key Concept:** Use the same `web_app` role for both apps with different variables.
+
+**Directory Structure:**
+```
+ansible/
+├── inventory/
+│   └── hosts.ini
+├── group_vars/
+│   └── all.yml
+├── host_vars/          # Optional: per-host vars
+├── vars/
+│   ├── app_python.yml  # NEW: Python app variables
+│   └── app_bonus.yml   # NEW: Bonus app variables
+├── roles/
+│   └── web_app/        # Reused for both apps
+└── playbooks/
+    ├── provision.yml
+    ├── deploy_python.yml    # NEW
+    ├── deploy_bonus.yml     # NEW
+    └── deploy_all.yml       # NEW: Deploy both
+```
+
+#### Bonus 1.3 Create Variable Files
+
+**File:** `ansible/vars/app_python.yml`
+```yaml
+---
+app_name: devops-python
+docker_image: your_username/devops-info-service
+docker_tag: latest
+app_port: 8000
+app_internal_port: 8000
+compose_project_dir: "/opt/{{ app_name }}"
+```
+
+**File:** `ansible/vars/app_bonus.yml`
+```yaml
+---
+app_name: devops-go  # or rust, java, csharp
+docker_image: your_username/devops-info-service-go
+docker_tag: latest
+app_port: 8001  # Different port!
+app_internal_port: 8080  # Go apps often use 8080
+compose_project_dir: "/opt/{{ app_name }}"
+```
+
+**Important:** Use different ports to run both apps simultaneously.
+
+#### Bonus 1.4 Create Deployment Playbooks
+
+**File:** `ansible/playbooks/deploy_python.yml`
+```yaml
+---
+- name: Deploy Python Application
+  hosts: all
+  become: true
+  vars_files:
+    - ../vars/app_python.yml
+
+  roles:
+    - web_app
+```
+
+**File:** `ansible/playbooks/deploy_bonus.yml`
+```yaml
+---
+- name: Deploy Bonus Application
+  hosts: all
+  become: true
+  vars_files:
+    - ../vars/app_bonus.yml
+
+  roles:
+    - web_app
+```
+
+**File:** `ansible/playbooks/deploy_all.yml`
+```yaml
+---
+- name: Deploy All Applications
+  hosts: all
+  become: true
+
+  tasks:
+    - name: Deploy Python App
+      include_role:
+        name: web_app
+      vars:
+        app_name: devops-python
+        docker_image: your_username/devops-info-service
+        app_port: 8000
+
+    - name: Deploy Bonus App
+      include_role:
+        name: web_app
+      vars:
+        app_name: devops-go
+        docker_image: your_username/devops-info-service-go
+        app_port: 8001
+        app_internal_port: 8080
+```
+
+#### Bonus 1.5 Extend Wipe Logic
+
+**Wipe logic should support app-specific wipe:**
+
+**Usage:**
+```bash
+# Wipe only Python app
+ansible-playbook playbooks/deploy_python.yml \
+  -e "web_app_wipe=true" \
+  --tags web_app_wipe
+
+# Wipe only Bonus app
+ansible-playbook playbooks/deploy_bonus.yml \
+  -e "web_app_wipe=true" \
+  --tags web_app_wipe
+
+# Wipe both apps
+ansible-playbook playbooks/deploy_all.yml \
+  -e "web_app_wipe=true" \
+  --tags web_app_wipe
+```
+
+**The role automatically handles different apps because `app_name` and `compose_project_dir` are different!**
+
+#### Bonus 1.6 Testing Multi-App Deployment
+
+**Test Commands:**
+```bash
+# Deploy both apps
+ansible-playbook playbooks/deploy_all.yml
+
+# Verify both running
+ssh user@vm_ip "docker ps"
+curl http://vm_ip:8000        # Python app
+curl http://vm_ip:8001        # Bonus app
+
+# Test independent deployment
+ansible-playbook playbooks/deploy_python.yml  # Should not affect bonus app
+ansible-playbook playbooks/deploy_bonus.yml   # Should not affect python app
+
+# Test independent wipe
+ansible-playbook playbooks/deploy_python.yml \
+  -e "web_app_wipe=true" --tags web_app_wipe
+# Verify: Python app removed, bonus app still running
+
+# Test idempotency
+ansible-playbook playbooks/deploy_all.yml
+ansible-playbook playbooks/deploy_all.yml  # Should show minimal changes
+```
+
+**Evidence Required:**
+- Output showing both apps deployed
+- `docker ps` output showing both containers
+- Curl outputs from both apps
+- Proof of independent wipe functionality
+- Idempotency verification for multi-app deployment
+
+#### Bonus 1.7 Documentation
+
+**Add to LAB06.md:**
+- Multi-app architecture explanation
+- Variable file strategy
+- Role reusability benefits
+- Port conflict resolution
+- Independent vs. combined deployment trade-offs
+
+---
+
+### Bonus Part 2 — Multi-App CI/CD (1 pt)
+
+#### Bonus 2.1 Prerequisites
+
+**Required:**
+- Bonus Part 1 completed (multi-app deployment working)
+- Task 4 completed (single app CI/CD working)
+
+#### Bonus 2.2 Workflow Strategy
+
+**Two Approaches:**
+
+**Approach A: Separate Workflows**
+- One workflow per app
+- Path filters for each app's code
+- Independent deployment
+- More control, more files
+
+**Approach B: Matrix Strategy**
+- Single workflow with matrix
+- Deploys both apps
+- Simpler, less flexible
+
+Choose based on your preference (Approach A recommended).
+
+#### Bonus 2.3 Create Workflow for Bonus App
+
+**File:** `.github/workflows/ansible-deploy-bonus.yml`
+
+**Requirements:**
+1. Trigger on bonus app code changes
+2. Run ansible-lint
+3. Deploy bonus app only
+4. Verify bonus app responds
+5. Independent from Python app workflow
+
+**Path Filters:**
+```yaml
+on:
+  push:
+    branches: [ main, master ]
+    paths:
+      - 'ansible/vars/app_bonus.yml'
+      - 'ansible/playbooks/deploy_bonus.yml'
+      - 'ansible/roles/web_app/**'
+      - '.github/workflows/ansible-deploy-bonus.yml'
+```
+
+**Deployment Step:**
+```yaml
+- name: Deploy Bonus Application
+  run: |
+    cd ansible
+    echo "${{ secrets.ANSIBLE_VAULT_PASSWORD }}" > /tmp/vault_pass
+    ansible-playbook playbooks/deploy_bonus.yml \
+      --vault-password-file /tmp/vault_pass
+    rm /tmp/vault_pass
+```
+
+**Verification:**
+```yaml
+- name: Verify Bonus App Deployment
+  run: |
+    sleep 10
+    curl -f http://${{ secrets.VM_HOST }}:8001 || exit 1
+    curl -f http://${{ secrets.VM_HOST }}:8001/health || exit 1
+```
+
+#### Bonus 2.4 Update Python App Workflow
+
+**File:** `.github/workflows/ansible-deploy.yml`
+
+**Update path filters to be more specific:**
+```yaml
+on:
+  push:
+    paths:
+      - 'ansible/vars/app_python.yml'
+      - 'ansible/playbooks/deploy_python.yml'
+      - 'ansible/playbooks/deploy.yml'  # If this deploys Python
+      - 'ansible/roles/web_app/**'
+      - '.github/workflows/ansible-deploy.yml'
+```
+
+**Update deployment to use specific playbook:**
+```yaml
+- name: Deploy Python Application
+  run: |
+    cd ansible
+    ansible-playbook playbooks/deploy_python.yml \
+      --vault-password-file /tmp/vault_pass
+```
+
+#### Bonus 2.5 Matrix Strategy Alternative
+
+**File:** `.github/workflows/ansible-deploy-matrix.yml`
+
+**Using matrix to deploy both:**
+```yaml
+name: Ansible Multi-App Deployment
+
+on:
+  push:
+    branches: [ main, master ]
+    paths:
+      - 'ansible/**'
+
+jobs:
+  deploy:
+    runs-on: ubuntu-latest
+    strategy:
+      matrix:
+        app:
+          - name: python
+            playbook: deploy_python.yml
+            port: 8000
+          - name: bonus
+            playbook: deploy_bonus.yml
+            port: 8001
+
+    steps:
+      - uses: actions/checkout@v4
+
+      - name: Deploy ${{ matrix.app.name }}
+        run: |
+          cd ansible
+          echo "${{ secrets.ANSIBLE_VAULT_PASSWORD }}" > /tmp/vault_pass
+          ansible-playbook playbooks/${{ matrix.app.playbook }} \
+            --vault-password-file /tmp/vault_pass
+          rm /tmp/vault_pass
+
+      - name: Verify ${{ matrix.app.name }}
+        run: |
+          sleep 10
+          curl -f http://${{ secrets.VM_HOST }}:${{ matrix.app.port }}
+```
+
+#### Bonus 2.6 Testing Multi-App CI/CD
+
+**Test Scenarios:**
+
+**Test 1: Python app change should deploy only Python**
+```bash
+# Change ansible/vars/app_python.yml
+git add ansible/vars/app_python.yml
+git commit -m "Update Python app config"
+git push
+
+# Watch Actions - only ansible-deploy.yml should run
+# Verify only Python app redeployed
+```
+
+**Test 2: Bonus app change should deploy only Bonus**
+```bash
+# Change ansible/vars/app_bonus.yml
+git add ansible/vars/app_bonus.yml
+git commit -m "Update Bonus app config"
+git push
+
+# Watch Actions - only ansible-deploy-bonus.yml should run
+```
+
+**Test 3: Role change should deploy both**
+```bash
+# Change ansible/roles/web_app/tasks/main.yml
+git add ansible/roles/web_app/
+git commit -m "Update web_app role"
+git push
+
+# Watch Actions - both workflows should run
+```
+
+**Evidence Required:**
+- Screenshots showing independent workflow triggers
+- Logs proving only affected app deployed
+- Verification of both apps working after role change
+- Status badges for both workflows
+
+#### Bonus 2.7 Documentation
+
+**Add to LAB06.md:**
+- Multi-app CI/CD architecture
+- Workflow triggering logic
+- Path filter strategy
+- Matrix vs separate workflows comparison
+- Evidence of independent deployments
+
+---
+
+## Submission Guidelines
+
+### What to Submit
+
+Submit a single markdown file: **`ansible/docs/LAB06.md`**
+
+### Required Structure
+
+```markdown
+# Lab 6: Advanced Ansible & CI/CD - Submission
+
+**Name:** Your Name
+**Date:** YYYY-MM-DD
+**Lab Points:** 10 + X bonus
+
+---
+
+## Task 1: Blocks & Tags (2 pts)
+[Your implementation details]
+[Evidence: terminal outputs, tag listings]
+[Research answers]
+
+## Task 2: Docker Compose (3 pts)
+[Your implementation]
+[Template code]
+[Before/after comparison]
+[Evidence: deployments, idempotency]
+
+## Task 3: Wipe Logic (1 pt)
+[Implementation explanation]
+[Test results for all scenarios]
+[Evidence proving correct behavior]
+
+## Task 4: CI/CD (3 pts)
+[Workflow setup]
+[Secrets configuration]
+[Evidence: successful runs, badges]
+
+## Task 5: Documentation
+[This file serves as documentation]
+
+## Bonus Part 1: Multi-App (1.5 pts)
+[If completed]
+
+## Bonus Part 2: Multi-App CI/CD (1 pt)
+[If completed]
+
+---
+
+## Summary
+[Overall reflection]
+[Total time spent]
+[Key learnings]
+```
+
+### GitHub Repository Requirements
+
+**Commit all code:**
+```bash
+git add ansible/
+git add .github/workflows/
+git add ansible/docs/LAB06.md
+git commit -m "Complete Lab 6: Advanced Ansible & CI/CD"
+git push
+```
+
+**Repository should contain:**
+- ✅ Updated roles with blocks and tags
+- ✅ Docker Compose templates
+- ✅ Wipe logic implementation
+- ✅ CI/CD workflows
+- ✅ Documentation with evidence
+- ✅ Working deployments (apps accessible)
+
+### Evidence Checklist
+
+**Required Proof:**
+- [ ] Ansible playbook output with selective tags
+- [ ] Rescue block triggered output
+- [ ] Docker Compose deployment success
+- [ ] Idempotency verification (2nd run)
+- [ ] Wipe logic test results (all 4 scenarios)
+- [ ] GitHub Actions successful workflow
+- [ ] ansible-lint passing
+- [ ] Status badge(s) in README
+- [ ] Application(s) accessible via curl
+
+**Bonus Proof (if applicable):**
+- [ ] Both apps deployed and accessible
+- [ ] Independent wipe functionality
+- [ ] Separate workflow runs for each app
+- [ ] Path filter effectiveness demonstrated
+
+---
+
+## Checklist
+
+**Before submitting, ensure you have:**
+- [ ] All three roles refactored with blocks and tags
+- [ ] Docker Compose deployment working with templated config
+- [ ] Role dependencies correctly configured
+- [ ] Wipe logic implemented with variable + tag safety
+- [ ] All 4 wipe scenarios tested successfully
+- [ ] GitHub Actions workflow running and passing
+- [ ] ansible-lint integrated and passing
+- [ ] Path filters configured for efficient CI/CD
+- [ ] Complete documentation in `ansible/docs/LAB06.md`
+- [ ] All research questions answered
+- [ ] Terminal outputs and screenshots included
+- [ ] Application(s) accessible and verified
+
+**Bonus (if attempting):**
+- [ ] Second app deployed using role reusability
+- [ ] Independent wipe logic for each app
+- [ ] Separate CI/CD workflows or matrix strategy
+- [ ] Path filters for independent triggering
+
+---
+
+## Rubric
+
+| Criteria | Points | Description |
+|----------|--------|-------------|
+| **Blocks & Tags** | 2 pts | All roles refactored with blocks, rescue/always, comprehensive tag strategy |
+| **Docker Compose** | 3 pts | Working templated deployment, role dependencies, idempotent |
+| **Wipe Logic** | 1 pt | Variable + tag implementation, all scenarios tested |
+| **CI/CD** | 3 pts | Automated workflow with linting, deployment, verification |
+| **Documentation** | 1 pt | Complete LAB06.md with evidence and analysis |
+| **Bonus: Multi-App** | 1.5 pts | Role reusability, independent deployment and wipe |
+| **Bonus: Multi-App CI/CD** | 1 pt | Separate workflows or matrix, independent triggering |
+| **Total** | 12.5 pts | 10 pts required + 2.5 pts bonus |
+
+**Grading Scale:**
+- **10/10:** All tasks working, excellent documentation, proper implementation
+- **8-9/10:** Everything works, good docs, minor improvements possible
+- **6-7/10:** Core functionality present, basic documentation
+- **<6/10:** Missing features or documentation, needs revision
+
+---
+
+## Resources
+
+<details>
+<summary>📚 Ansible Documentation</summary>
+
+- [Ansible Blocks](https://docs.ansible.com/ansible/latest/user_guide/playbooks_blocks.html)
+- [Ansible Tags](https://docs.ansible.com/ansible/latest/user_guide/playbooks_tags.html)
+- [Ansible Role Dependencies](https://docs.ansible.com/ansible/latest/user_guide/playbooks_reuse_roles.html#using-role-dependencies)
+- [Ansible Variables](https://docs.ansible.com/ansible/latest/user_guide/playbooks_variables.html)
+- [Ansible Vault](https://docs.ansible.com/ansible/latest/user_guide/vault.html)
+
+</details>
+
+<details>
+<summary>🐳 Docker Compose</summary>
+
+- [Docker Compose File Reference](https://docs.docker.com/compose/compose-file/)
+- [Docker Compose v2 Module](https://docs.ansible.com/ansible/latest/collections/community/docker/docker_compose_v2_module.html)
+- [community.docker Collection](https://docs.ansible.com/ansible/latest/collections/community/docker/)
+- [Compose Best Practices](https://docs.docker.com/compose/production/)
+
+</details>
+
+<details>
+<summary>🔄 CI/CD & GitHub Actions</summary>
+
+- [GitHub Actions Documentation](https://docs.github.com/en/actions)
+- [GitHub Actions: Workflow Syntax](https://docs.github.com/en/actions/reference/workflow-syntax-for-github-actions)
+- [Self-hosted Runners](https://docs.github.com/en/actions/hosting-your-own-runners)
+- [Encrypted Secrets](https://docs.github.com/en/actions/security-guides/encrypted-secrets)
+
+</details>
+
+<details>
+<summary>🛠️ Tools & Best Practices</summary>
+
+- [ansible-lint](https://ansible-lint.readthedocs.io/) - Best practices checker
+- [Ansible Galaxy](https://galaxy.ansible.com/) - Community roles
+- [Jinja2 Templating](https://jinja.palletsprojects.com/) - Template engine
+- [YAML Syntax](https://docs.ansible.com/ansible/latest/reference_appendices/YAMLSyntax.html)
+
+</details>
+
+---
+
+## Looking Ahead
+
+Your Ansible automation evolves throughout the course:
+
+- **Lab 7:** Logging Stack - Deploy Loki, Promtail, and Grafana
+- **Lab 8:** Metrics Stack - Add Prometheus metrics to your app
+- **Lab 9:** Kubernetes Basics - Migrate from Docker Compose to K8s deployments
+- **Lab 10:** Helm charts for templated K8s deployments
+- **Lab 11-12:** Secrets with Vault, ConfigMaps, and persistent storage
+- **Lab 13:** GitOps with ArgoCD - Declarative Kubernetes deployments
+
+---
+
+**Good luck!** 🚀
diff --git a/labs/lab07.md b/labs/lab07.md
new file mode 100644
index 0000000000..f971e0b01d
--- /dev/null
+++ b/labs/lab07.md
@@ -0,0 +1,594 @@
+# Lab 7 — Observability & Logging with Loki Stack
+
+![difficulty](https://img.shields.io/badge/difficulty-intermediate-yellow)
+![topic](https://img.shields.io/badge/topic-Logging%20%26%20Observability-blue)
+![points](https://img.shields.io/badge/points-10%2B2.5-orange)
+![tech](https://img.shields.io/badge/tech-Loki%20|%20Promtail%20|%20Grafana-informational)
+
+> Deploy a logging stack with Loki, Promtail, and Grafana to aggregate and visualize logs from your containerized applications.
+
+## Overview
+
+Set up centralized logging for your applications using the Grafana Loki stack. You'll deploy Loki 3.0 (log storage with TSDB), Promtail (log collector), and Grafana 12 (visualization), then integrate your apps from previous labs.
+
+**What You'll Learn:**
+- Loki 3.0 architecture with TSDB (10x faster queries!)
+- Promtail configuration for Docker log collection
+- LogQL query language basics
+- Building interactive log dashboards in Grafana 12
+- Production logging practices and retention policies
+
+**Prerequisites:** Lab 1 (web apps), Lab 2 (Docker), Lab 6 (Docker Compose understanding)
+
+**Tech Stack:** Loki 3.0 + Promtail 3.0 + Grafana 12.3
+
+---
+
+## Tasks
+
+### Task 1 — Deploy Loki Stack (4 pts)
+
+Create a Docker Compose stack with Loki, Promtail, and Grafana.
+
+#### 1.1 Study the Stack
+
+**Research these components before starting:**
+- [Loki Overview](https://grafana.com/docs/loki/latest/get-started/overview/) - How Loki works
+- [Promtail Basics](https://grafana.com/docs/loki/latest/send-data/promtail/) - Log collection
+- [LogQL Introduction](https://grafana.com/docs/loki/latest/query/) - Query language
+
+**Understand:**
+- How is Loki different from Elasticsearch?
+- What are log labels and why do they matter?
+- How does Promtail discover containers?
+
+#### 1.2 Create Project Structure
+
+```
+monitoring/
+├── docker-compose.yml
+├── loki/
+│   └── config.yml
+├── promtail/
+│   └── config.yml
+└── docs/
+    └── LAB07.md
+```
+
+#### 1.3 Configure Docker Compose
+
+**File:** `monitoring/docker-compose.yml`
+
+**Requirements:**
+- Loki service (image: `grafana/loki:3.0.0`, port 3100)
+- Promtail service (image: `grafana/promtail:3.0.0`)
+- Grafana service (image: `grafana/grafana:12.3.1`, port 3000)
+- Volumes for configs and data persistence
+- Shared network
+
+<details>
+<summary>💡 Docker Compose Hints</summary>
+
+**Key points to consider:**
+- Use Docker Compose v2 syntax (the top-level `version` field is obsolete in Compose v2 and can be omitted; if present it is ignored with a warning)
+- Mount config files to `/etc/loki/config.yml` and `/etc/promtail/config.yml`
+- Promtail needs access to Docker logs: `/var/lib/docker/containers:ro`
+- Promtail needs Docker socket: `/var/run/docker.sock:ro` (⚠️ security consideration)
+- Create named volumes: `loki-data` and `grafana-data`
+- Use `command:` to specify config file path (e.g., `-config.file=/etc/loki/config.yml`)
+
+**Grafana environment variables for easier testing:**
+```yaml
+environment:
+  - GF_AUTH_ANONYMOUS_ENABLED=true
+  - GF_AUTH_ANONYMOUS_ORG_ROLE=Admin
+  - GF_SECURITY_ALLOW_EMBEDDING=true  # For iframe embedding if needed
+```
+⚠️ Only for development! Remove for production.
+
+**Note:** Use `docker compose` (space, not hyphen) - the v2 CLI standard.
+
+</details>
+
+#### 1.4 Configure Loki
+
+**File:** `monitoring/loki/config.yml`
+
+**Research and configure:**
+- Basic server settings (port 3100)
+- Storage backend (use `tsdb` with `filesystem` - recommended in Loki 3.0)
+- Schema configuration (use schema v13, find examples in [Loki docs](https://grafana.com/docs/loki/latest/configure/))
+- Log retention: 7 days (168h)
+
+<details>
+<summary>💡 Loki Configuration Hints</summary>
+
+**Essential sections you need:**
+- `auth_enabled: false` (for testing)
+- `server:` - HTTP port
+- `common:` - Shared configuration (available since Loki 2.4; simplifies config by setting values once for all components)
+- `schema_config:` - Storage schema (use v13 with TSDB for Loki 3.0+)
+- `storage_config:` - Where to store data
+  - Use `tsdb` index type (faster than boltdb-shipper)
+  - Use `filesystem` object store for single-instance setup
+- `limits_config:` - Retention period (`retention_period: 168h` = 7 days)
+- `compactor:` - Cleanup old logs (required when retention is enabled)
+
+**TSDB Benefits (Loki 3.0+):**
+- Faster queries (up to 10x improvement)
+- Lower memory usage
+- Better compression
+
+**Check the [Loki 3.0 configuration docs](https://grafana.com/docs/loki/latest/configure/) for structure and required fields.**
+
+</details>
+
+#### 1.5 Configure Promtail
+
+**File:** `monitoring/promtail/config.yml`
+
+**Requirements:**
+- Configure Loki client endpoint (http://loki:3100)
+- Set up Docker service discovery
+- Add relabeling to extract container name as label
+
+<details>
+<summary>💡 Promtail Configuration Hints</summary>
+
+**Key sections:**
+- `server:` - Promtail's own port (9080)
+- `positions:` - Track what logs were read
+- `clients:` - Where to send logs (Loki URL + `/loki/api/v1/push`)
+- `scrape_configs:` - How to collect logs
+
+**For Docker service discovery:**
+```yaml
+scrape_configs:
+  - job_name: docker
+    docker_sd_configs:
+      - host: unix:///var/run/docker.sock
+        refresh_interval: 5s
+```
+
+**Relabeling extracts container name:**
+- Use `__meta_docker_container_name` source label
+- Create `container` target label
+- Remove leading `/` from container name with regex
+
+Check [Promtail Docker SD docs](https://grafana.com/docs/loki/latest/send-data/promtail/configuration/#docker_sd_configs).
+
+</details>
+
+#### 1.6 Deploy and Verify
+
+**Deploy the stack:**
+```bash
+cd monitoring
+docker compose up -d  # v2 CLI (space, not hyphen)
+docker compose ps
+```
+
+**Verify services:**
+```bash
+# Test Loki
+curl http://localhost:3100/ready
+
+# Check Promtail targets
+curl http://localhost:9080/targets
+
+# Access Grafana
+open http://localhost:3000
+```
+
+**In Grafana:**
+1. Go to **Connections** → **Data sources** → **Add data source** → **Loki**
+2. URL: `http://loki:3100`
+3. Click **Save & Test** (should show "Data source connected")
+4. Navigate to **Explore** → Select **Loki** data source
+5. Query: `{job="docker"}` → You should see logs from all containers
+
+**Alternative:** Provision the data source automatically (see bonus task for Ansible example).
+
+**Evidence:** Screenshot showing logs from at least 3 containers in Grafana Explore.
+
+---
+
+### Task 2 — Integrate Your Applications (3 pts)
+
+Add your apps to the logging stack and implement structured logging.
+
+#### 2.1 Add Structured Logging
+
+**Update your Python app** from Lab 1 to log in JSON format.
+
+**Requirements:**
+- Use Python's `logging` module
+- Output JSON format: `{"timestamp": "...", "level": "...", "message": "...", ...}`
+- Log important events: startup, HTTP requests, errors
+- Include context: method, path, status code, client IP
+
+<details>
+<summary>💡 JSON Logging Hints</summary>
+
+**Option 1: Custom formatter**
+Create a `JSONFormatter` class that inherits from `logging.Formatter` and overrides the `format()` method to return JSON.
+
+**Option 2: Use python-json-logger**
+```bash
+pip install python-json-logger
+```
+Then configure it in your app.
+
+**What to log:**
+- App startup with configuration
+- Each HTTP request (use `@app.before_request`)
+- Response status (use `@app.after_request`)
+- Errors and exceptions
+
+**Why JSON?**
+- Easy to parse by log aggregation tools
+- Structured data, not just text
+- Can extract fields in LogQL queries
+
+</details>
+
+#### 2.2 Add Applications to Docker Compose
+
+**Extend** `monitoring/docker-compose.yml` with your applications:
+- Python app from Lab 1 (port 8000)
+- Bonus app from Lab 1 if you completed it (port 8001)
+
+**Both apps should:**
+- Join the `logging` network
+- Have labels for Promtail filtering: `logging: "promtail"`, `app: "app-name"`
+
+<details>
+<summary>💡 Multi-App Compose Hints</summary>
+
+**Add to your docker-compose.yml:**
+```yaml
+services:
+  # ... loki, promtail, grafana ...
+
+  app-python:
+    image: your-username/devops-info-service:latest
+    ports:
+      - "8000:8000"
+    networks:
+      - logging
+    labels:
+      logging: "promtail"
+      app: "devops-python"
+```
+
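+**Filter in Promtail:** Update `promtail/config.yml` to only scrape containers with the label by adding `filters` under the `docker_sd_configs` entry; also add a `relabel_configs` rule that maps `__meta_docker_container_label_app` to an `app` label, otherwise queries such as `{app="devops-python"}` return nothing: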
+```yaml
+filters:
+  - name: label
+    values: ["logging=promtail"]
+```
+
+</details>
+
+#### 2.3 Generate Logs and Test
+
+**Make requests to generate logs:**
+```bash
+# Generate traffic
+for i in {1..20}; do curl http://localhost:8000/; done
+for i in {1..20}; do curl http://localhost:8000/health; done
+```
+
+**Query logs in Grafana Explore:**
+```logql
+# All logs from Python app
+{app="devops-python"}
+
+# Only errors
+{app="devops-python"} |= "ERROR"
+
+# Parse JSON and filter
+{app="devops-python"} | json | method="GET"
+```
+
+**Evidence:**
+- Screenshot of JSON log output from your app
+- Screenshot of Grafana showing logs from both applications
+- At least 3 different LogQL queries that work
+
+---
+
+### Task 3 — Build Log Dashboard (2 pts)
+
+Create a Grafana dashboard to visualize your application logs.
+
+#### 3.1 Learn LogQL Basics
+
+**Practice these query patterns in Explore first:**
+
+1. **Stream selection:** `{app="devops-python"}`
+2. **Text filtering:** `{app="devops-python"} |= "error"`
+3. **JSON parsing:** `{app="devops-python"} | json`
+4. **Field filtering:** `{app="devops-python"} | json | level="INFO"`
+5. **Metrics from logs:** `rate({app="devops-python"}[1m])`
+
+<details>
+<summary>💡 LogQL Reference</summary>
+
+**Stream selectors:**
+- `{label="value"}` - exact match
+- `{label=~"regex"}` - regex match
+- `{label!="value"}` - not equal
+
+**Line filters:**
+- `|= "text"` - contains
+- `!= "text"` - doesn't contain
+- `|~ "regex"` - regex match
+
+**Parsers:**
+- `| json` - parse JSON logs
+- `| logfmt` - parse logfmt logs
+
+**Aggregations:**
+- `rate({app="app"}[5m])` - logs per second
+- `count_over_time({app="app"}[5m])` - count logs
+- `sum by (level) (count_over_time({app="app"} | json [5m]))` - count by level
+
+Learn more: [LogQL Documentation](https://grafana.com/docs/loki/latest/query/)
+
+</details>
+
+#### 3.2 Create Dashboard
+
+**Requirements - create 4 panels:**
+
+1. **Logs Table** (Logs visualization)
+   - Shows recent logs from all apps
+   - Query: `{app=~"devops-.*"}`
+
+2. **Request Rate** (Time series graph)
+   - Shows logs per second by app
+   - Query: `sum by (app) (rate({app=~"devops-.*"} [1m]))`
+
+3. **Error Logs** (Logs visualization)
+   - Shows only ERROR level logs
+   - Query: `{app=~"devops-.*"} | json | level="ERROR"`
+
+4. **Log Level Distribution** (Stat or Pie chart)
+   - Count logs by level (INFO, ERROR, etc.)
+   - Query: `sum by (level) (count_over_time({app=~"devops-.*"} | json [5m]))`
+
+**How to create:**
+1. **Dashboard** → **New** → **New Dashboard** → **Add visualization**
+2. Select **Loki** data source
+3. Enter LogQL query (use the query builder or code editor)
+4. Choose visualization type (Logs, Time series, Stat, Pie chart, etc.)
+5. Configure panel title and options
+6. **Save dashboard** (Grafana 12 auto-saves drafts)
+
+**Grafana 12 features:**
+- Query builder UI for LogQL (easier for beginners)
+- Better log context and line wrapping
+- Improved variable support
+- Dashboard version history
+
+**Evidence:** Screenshot of your dashboard showing all 4 panels with real data.
+
+---
+
+### Task 4 — Production Readiness (1 pt)
+
+Configure the stack for production use.
+
+#### 4.1 Add Resource Limits
+
+Add resource constraints to prevent services from consuming too much:
+
+```yaml
+deploy:
+  resources:
+    limits:
+      cpus: '1.0'
+      memory: 1G
+    reservations:
+      cpus: '0.5'
+      memory: 512M
+```
+
+**Apply to all services** with appropriate values.
+
+#### 4.2 Secure Grafana
+
+**Remove anonymous authentication:**
+- Change `GF_AUTH_ANONYMOUS_ENABLED` to `false`
+- Set admin password via environment variable
+- Use `.env` file for secrets (don't commit!)
+
+#### 4.3 Add Health Checks
+
+Add `healthcheck:` sections to verify services are working:
+- Loki: `http://localhost:3100/ready`
+- Grafana: `http://localhost:3000/api/health`
+
+<details>
+<summary>💡 Health Check Example</summary>
+
+```yaml
+healthcheck:
+  test: ["CMD-SHELL", "wget --no-verbose --tries=1 --spider http://localhost:3100/ready || exit 1"]
+  interval: 10s
+  timeout: 5s
+  retries: 5
+  start_period: 10s  # Grace period for startup
+```
+
+**Alternative using curl:**
+```yaml
+test: ["CMD-SHELL", "curl -f http://localhost:3100/ready || exit 1"]
+```
+
+</details>
+
+**Evidence:**
+- `docker compose ps` showing all services healthy
+- Screenshot of Grafana login page (no anonymous access)
+
+---
+
+### Task 5 — Documentation (2 pts)
+
+Create `monitoring/docs/LAB07.md` documenting your setup.
+
+**Required sections:**
+1. **Architecture** - Diagram showing how components connect
+2. **Setup Guide** - Step-by-step deployment instructions
+3. **Configuration** - Explain your Loki/Promtail configs and why
+4. **Application Logging** - How you implemented JSON logging
+5. **Dashboard** - Explain each panel and the LogQL queries
+6. **Production Config** - Security measures, resources, retention
+7. **Testing** - Commands to verify everything works
+8. **Challenges** - Problems you encountered and solutions
+
+**Include:**
+- Configuration file snippets (not full files)
+- Screenshots of Grafana dashboard
+- Example LogQL queries with explanations
+- Evidence of all tasks completed
+
+---
+
+## Bonus — Ansible Automation (2.5 pts)
+
+Automate Loki stack deployment with Ansible (builds on Labs 5-6).
+
+**Create Ansible role** `roles/monitoring` that:
+- Creates monitoring directory structure
+- Templates configuration files (Loki 3.0 format)
+- Deploys stack with Docker Compose v2
+- Waits for services to be ready
+- Configures Grafana data source
+
+**Requirements:**
+- Use Jinja2 templates for configs (versions, ports, retention as variables)
+- Make it idempotent (use `community.docker.docker_compose_v2` module)
+- Add to your existing Ansible setup from Lab 6
+- Create playbook: `playbooks/deploy-monitoring.yml`
+- Compatible with Ansible 2.16+
+
+<details>
+<summary>💡 Ansible Role Structure</summary>
+
+```
+roles/monitoring/
+├── defaults/main.yml       # Variables (versions, ports, etc.)
+├── tasks/
+│   ├── main.yml           # Main orchestration
+│   ├── setup.yml          # Create dirs, template configs
+│   └── deploy.yml         # Docker compose deployment
+├── templates/
+│   ├── docker-compose.yml.j2
+│   ├── loki-config.yml.j2
+│   └── promtail-config.yml.j2
+└── meta/main.yml          # Depends on: docker role
+```
+
+**Key variables to parameterize:**
+- Service versions (loki: 3.0.0, promtail: 3.0.0, grafana: 12.3.1)
+- Ports (loki: 3100, grafana: 3000, promtail: 9080)
+- Retention period (default: 168h / 7 days)
+- Resource limits (memory, CPU)
+- Schema version (v13 for Loki 3.0+)
+
+</details>
+
+**Evidence:**
+- Ansible playbook execution output
+- Idempotency test (run twice, second shows no changes)
+- Templated configuration files
+
+---
+
+## Checklist
+
+**Before submitting:**
+- [ ] Loki, Promtail, Grafana running via Docker Compose
+- [ ] Loki data source configured in Grafana
+- [ ] Python app logging in JSON format
+- [ ] Bonus app (if completed Lab 1 bonus) integrated
+- [ ] Logs visible in Grafana from all containers
+- [ ] Dashboard with 4+ panels created
+- [ ] LogQL queries working for different scenarios
+- [ ] Resource limits on all services
+- [ ] Health checks added
+- [ ] Grafana secured (no anonymous access)
+- [ ] Complete documentation with screenshots
+- [ ] All configuration files in repo
+
+---
+
+## Rubric
+
+| Criteria | Points | Description |
+|----------|--------|-------------|
+| **Stack Deployment** | 4 pts | Loki, Promtail, Grafana configured and working |
+| **App Integration** | 3 pts | Apps logging JSON format, visible in Loki |
+| **Dashboard** | 2 pts | 4+ panels with appropriate LogQL queries |
+| **Production Config** | 1 pt | Resources, security, health checks |
+| **Documentation** | 2 pts | Complete LAB07.md with evidence |
+| **Bonus: Ansible** | 2.5 pts | Automated deployment with Ansible role |
+| **Total** | 12.5 pts | 10 pts required + 2.5 bonus |
+
+---
+
+## Resources
+
+<details>
+<summary>📚 Loki Documentation</summary>
+
+- [Loki 3.0 Overview](https://grafana.com/docs/loki/latest/get-started/overview/)
+- [Loki Configuration](https://grafana.com/docs/loki/latest/configure/)
+- [LogQL Query Language](https://grafana.com/docs/loki/latest/query/)
+- [Storage Configuration](https://grafana.com/docs/loki/latest/storage/)
+
+</details>
+
+<details>
+<summary>🚢 Promtail</summary>
+
+- [Promtail Configuration](https://grafana.com/docs/loki/latest/send-data/promtail/configuration/)
+- [Docker Service Discovery](https://grafana.com/docs/loki/latest/send-data/promtail/configuration/#docker_sd_configs)
+- [Scraping Configuration](https://grafana.com/docs/loki/latest/send-data/promtail/scraping/)
+
+</details>
+
+<details>
+<summary>📊 Grafana</summary>
+
+- [Grafana Dashboards](https://grafana.com/docs/grafana/latest/dashboards/)
+- [Loki Data Source](https://grafana.com/docs/grafana/latest/datasources/loki/)
+- [Explore Logs](https://grafana.com/docs/grafana/latest/explore/logs-integration/)
+
+</details>
+
+<details>
+<summary>📝 Logging Best Practices</summary>
+
+- [Structured Logging with structlog](https://www.structlog.org/en/stable/)
+- [The Twelve-Factor App: Logs](https://12factor.net/logs)
+- [Python Logging HOWTO](https://docs.python.org/3/howto/logging.html)
+- [python-json-logger](https://github.com/madzak/python-json-logger)
+
+</details>
+
+---
+
+## Looking Ahead
+
+- **Lab 8:** Metrics with Prometheus - Add metrics to complement logs
+- **Lab 9:** Kubernetes Fundamentals - Deploy your apps to K8s
+- **Lab 10-12:** Helm, Secrets, ConfigMaps - Package and configure K8s deployments
+- **Lab 16:** Kubernetes Monitoring - Full observability in K8s
+
+---
+
+**Good luck!** 🚀
diff --git a/labs/lab08.md b/labs/lab08.md
new file mode 100644
index 0000000000..8909a9244c
--- /dev/null
+++ b/labs/lab08.md
@@ -0,0 +1,752 @@
+# Lab 8 — Metrics & Monitoring with Prometheus
+
+![difficulty](https://img.shields.io/badge/difficulty-intermediate-yellow)
+![topic](https://img.shields.io/badge/topic-Metrics%20%26%20Monitoring-blue)
+![points](https://img.shields.io/badge/points-10%2B2.5-orange)
+![tech](https://img.shields.io/badge/tech-Prometheus%20|%20Grafana%20|%20Docker%20Compose-informational)
+
+> Instrument your applications with metrics and build a complete monitoring stack with Prometheus and Grafana.
+
+## Overview
+
+Add observability to your applications by exposing Prometheus metrics, then deploy Prometheus to collect them and Grafana to visualize. You'll instrument your app first, then build the monitoring infrastructure around it.
+
+**What You'll Learn:**
+- Application instrumentation with prometheus_client
+- Prometheus scraping and metric types
+- PromQL query language
+- Building Grafana dashboards for metrics
+- Monitoring best practices (RED method, resource limits)
+- Integration with existing observability stack from Lab 7
+
+**Tech Stack:** Prometheus 3.9+ | Grafana 12.3+ | prometheus_client | PromQL
+
+**Prerequisites:** Lab 7 completed (Loki + Grafana stack), Python app from Lab 1-2
+
+---
+
+## Tasks
+
+### Task 1 — Application Metrics (3 pts)
+
+Add Prometheus metrics to your Python application.
+
+#### 1.1 Understanding Application Metrics
+
+**Why metrics matter:**
+- **Logs** tell you what happened (Lab 7)
+- **Metrics** tell you how much and how often
+- **Together** they provide complete observability
+
+**The RED Method (for request-driven apps):**
+- **R**ate - Requests per second
+- **E**rrors - Error rate
+- **D**uration - Response time
+
+<details>
+<summary>💡 Prometheus Metric Types</summary>
+
+**Counter** - Only goes up (total requests, errors)
+```python
+http_requests_total.inc()  # Increment by 1
+```
+
+**Gauge** - Can go up or down (memory usage, active connections)
+```python
+active_connections.set(42)
+```
+
+**Histogram** - Measures distribution (request duration, response size)
+```python
+request_duration_seconds.observe(0.25)  # Record 250ms request
+```
+
+**Summary** - Similar to histogram, with percentiles
+
+**When to use what:**
+- Counting events? → Counter
+- Current state? → Gauge
+- Distribution/percentiles? → Histogram
+
+**Resources:**
+- [Prometheus Metric Types](https://prometheus.io/docs/concepts/metric_types/)
+- [Instrumentation Best Practices](https://prometheus.io/docs/practices/instrumentation/)
+
+</details>
+
+#### 1.2 Install Prometheus Client
+
+**Add to `requirements.txt`:**
+```txt
+prometheus-client==0.23.1
+```
+
+**Install:**
+```bash
+pip install prometheus-client
+```
+
+#### 1.3 Implement Metrics Endpoint
+
+**Add `/metrics` endpoint to your app:**
+
+**Requirements:**
+- Expose metrics at `/metrics` endpoint
+- Track HTTP requests (counter)
+- Track request duration (histogram)
+- Track active requests (gauge)
+- Use labels: `method`, `endpoint`, `status`
+
+<details>
+<summary>💡 Implementation Guidance</summary>
+
+**Basic Setup (Flask):**
+```python
+from prometheus_client import Counter, Histogram, Gauge, generate_latest
+
+# Define metrics
+http_requests_total = Counter(
+    'http_requests_total',
+    'Total HTTP requests',
+    ['method', 'endpoint', 'status']
+)
+
+http_request_duration_seconds = Histogram(
+    'http_request_duration_seconds',
+    'HTTP request duration',
+    ['method', 'endpoint']
+)
+
+http_requests_in_progress = Gauge(
+    'http_requests_in_progress',
+    'HTTP requests currently being processed'
+)
+
+@app.route('/metrics')
+def metrics():
+    return generate_latest()
+```
+
+**Instrumenting Requests:**
+- Use `@app.before_request` to track start time
+- Use `@app.after_request` to record metrics
+- Increment counter with labels
+- Observe histogram with duration
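+- Track in-progress requests with the gauge: call `inc()` when a request starts and `dec()` when it finishes (or wrap handlers with `track_inprogress()`)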
+
+**Label Best Practices:**
+- Keep cardinality low (don't use user IDs as labels!)
+- Use `/` for root, `/health` for health, group others
+- Normalize endpoint names (e.g., `/user/{id}` not `/user/123`)
+
+**Resources:**
+- [prometheus_client docs](https://github.com/prometheus/client_python)
+- [Python instrumentation guide](https://prometheus.io/docs/guides/python/)
+
+</details>
+
+#### 1.4 Add Application-Specific Metrics
+
+**Beyond HTTP, track your app's business metrics:**
+- Counter: API calls to external services
+- Gauge: Items in cache, database pool size
+- Histogram: Database query duration
+
+**Example for your DevOps info service:**
+```python
+# Track endpoint usage
+endpoint_calls = Counter('devops_info_endpoint_calls', 'Endpoint calls', ['endpoint'])
+
+# Track system info collection time
+system_info_duration = Histogram('devops_info_system_collection_seconds', 'System info collection time')
+```
+
+#### 1.5 Test Metrics Locally
+
+**Run your app and test:**
+```bash
+python app.py
+curl http://localhost:8000/metrics
+```
+
+**Expected output format:**
+```
+# HELP http_requests_total Total HTTP requests
+# TYPE http_requests_total counter
+http_requests_total{method="GET",endpoint="/",status="200"} 42.0
+http_requests_total{method="GET",endpoint="/health",status="200"} 15.0
+
+# HELP http_request_duration_seconds HTTP request duration
+# TYPE http_request_duration_seconds histogram
+http_request_duration_seconds_bucket{le="0.005",method="GET",endpoint="/"} 10.0
+http_request_duration_seconds_bucket{le="0.01",method="GET",endpoint="/"} 35.0
+...
+```
+
+**Evidence Required:**
+- Screenshot of `/metrics` endpoint output
+- Code showing metric definitions
+- Documentation explaining your metric choices
+
+---
+
+### Task 2 — Prometheus Setup (3 pts)
+
+Deploy Prometheus and configure it to scrape your application metrics.
+
+#### 2.1 Understanding Prometheus Architecture
+
+<details>
+<summary>💡 How Prometheus Works</summary>
+
+**Pull-based model:**
+1. Your app exposes `/metrics` endpoint
+2. Prometheus scrapes (pulls) metrics on schedule
+3. Stores time-series data locally
+4. Provides PromQL for querying
+
+**Key concepts:**
+- **Target** - Endpoint to scrape (your app)
+- **Job** - Collection of targets with same purpose
+- **Scrape interval** - How often to collect (default: 15s)
+- **TSDB** - Time-series database storing metrics
+
+**vs Push-based (like StatsD):**
+- Pull = simpler, apps don't need to know about Prometheus
+- Better for service discovery
+- Failed scrapes are visible
+
+**Resources:**
+- [Prometheus Overview](https://prometheus.io/docs/introduction/overview/)
+- [First Steps with Prometheus](https://prometheus.io/docs/introduction/first_steps/)
+
+</details>
+
+#### 2.2 Add Prometheus to Docker Compose
+
+**Extend `monitoring/docker-compose.yml`** from Lab 7:
+
+**Requirements:**
+- Prometheus service (image: `prom/prometheus:v3.9.0`, port 9090)
+- Mount prometheus config: `./prometheus/prometheus.yml`
+- Mount data volume for persistence: `prometheus-data`
+- Connect to existing `logging` network from Lab 7
+
+<details>
+<summary>💡 Docker Compose Guidance</summary>
+
+**Key points:**
+- Use same network as Loki/Grafana from Lab 7
+- Mount config to `/etc/prometheus/prometheus.yml`
+- Use volume for data persistence: `/prometheus`
+- Add `--config.file=/etc/prometheus/prometheus.yml` command argument
+
+**Resource limits:**
+```yaml
+deploy:
+  resources:
+    limits:
+      memory: 1G
+      cpus: '1.0'
+```
+
+</details>
+
+#### 2.3 Configure Prometheus
+
+**File:** `monitoring/prometheus/prometheus.yml`
+
+**Requirements:**
+- Scrape Prometheus itself (job: `prometheus`)
+- Scrape your Python app (job: `app`)
+- Scrape Loki metrics (job: `loki`)
+- Scrape Grafana metrics (job: `grafana`)
+- Set scrape interval: 15s
+
+<details>
+<summary>💡 Prometheus Configuration Guide</summary>
+
+**Basic structure:**
+```yaml
+global:
+  scrape_interval: 15s
+  evaluation_interval: 15s
+
+# Storage retention (Prometheus 3.x config-based retention)
+storage:
+  tsdb:
+    retention_time: 15d
+    retention_size: 10GB
+
+scrape_configs:
+  - job_name: 'prometheus'
+    static_configs:
+      - targets: ['localhost:9090']
+
+  - job_name: 'app'
+    static_configs:
+      - targets: ['app-python:8000']
+    metrics_path: '/metrics'
+```
+
+**For Docker Compose:**
+- Use service names as hostnames (e.g., `loki:3100`)
+- Prometheus self-scrape uses `localhost:9090`
+- Check each service's metrics port:
+  - Loki: port 3100, path `/metrics`
+  - Grafana: port 3000, path `/metrics`
+  - Your app: port 8000, path `/metrics`
+
+**Resources:**
+- [Prometheus Configuration](https://prometheus.io/docs/prometheus/latest/configuration/configuration/)
+- [Scrape Configs](https://prometheus.io/docs/prometheus/latest/configuration/configuration/#scrape_config)
+
+</details>
+
+#### 2.4 Deploy and Verify
+
+**Deploy the updated stack:**
+```bash
+cd monitoring
+docker compose up -d
+docker compose ps
+```
+
+**Verify Prometheus:**
+1. **Access UI:** http://localhost:9090
+2. **Check targets:** http://localhost:9090/targets
+   - All targets should be "UP" (green)
+3. **Query metrics:** Try query `up` - should show all targets
+
+**Troubleshooting targets:**
+- **State: DOWN** → Check service is running, check port/path
+- **State: UNKNOWN** → Prometheus just started, wait for first scrape
+- **No target** → Check `prometheus.yml` syntax
+
+**Evidence Required:**
+- Screenshot of `/targets` page showing all targets UP
+- Screenshot of a successful PromQL query
+- `prometheus.yml` configuration file
+
+---
+
+### Task 3 — Grafana Dashboards (2 pts)
+
+Build dashboards to visualize your application metrics.
+
+#### 3.1 Add Prometheus Data Source
+
+**In Grafana:**
+1. **Connections** → **Data sources** → **Add data source** → **Prometheus**
+2. URL: `http://prometheus:9090`
+3. **Save & Test**
+
+**Alternative:** Provision automatically (see Ansible bonus).
+
+#### 3.2 Learn PromQL Basics
+
+<details>
+<summary>💡 PromQL Quick Reference</summary>
+
+**Instant Vector (single value per time series):**
+```promql
+http_requests_total                                    # All request counters
+http_requests_total{method="GET"}                      # Filter by label
+http_requests_total{endpoint="/",status="200"}         # Multiple labels
+```
+
+**Range Vector (values over time range):**
+```promql
+http_requests_total[5m]                                # Last 5 minutes of data
+```
+
+**Functions:**
+```promql
+rate(http_requests_total[5m])                          # Requests per second
+sum(rate(http_requests_total[5m]))                     # Total req/s across all series
+sum by (endpoint) (rate(http_requests_total[5m]))      # Req/s per endpoint
+histogram_quantile(0.95, rate(http_request_duration_seconds_bucket[5m]))  # 95th percentile latency
+```
+
+**Operators:**
+```promql
+up == 0                                                # Services down
+sum(rate(http_requests_total{status=~"5.."}[5m])) / sum(rate(http_requests_total[5m])) * 100  # Error rate percentage
+```
+
+**Common Queries:**
+- Request rate: `rate(http_requests_total[5m])`
+- Error rate: `sum(rate(http_requests_total{status=~"5.."}[5m]))`
+- p95 latency: `histogram_quantile(0.95, rate(http_request_duration_seconds_bucket[5m]))`
+- CPU usage: `rate(process_cpu_seconds_total[5m]) * 100`
+
+**Resources:**
+- [PromQL Basics](https://prometheus.io/docs/prometheus/latest/querying/basics/)
+- [PromQL Examples](https://prometheus.io/docs/prometheus/latest/querying/examples/)
+
+</details>
+
+#### 3.3 Create Application Dashboard
+
+**Create dashboard with 6+ panels:**
+
+1. **Request Rate** (Graph)
+   - Query: `sum(rate(http_requests_total[5m])) by (endpoint)`
+   - Shows requests/sec per endpoint
+
+2. **Error Rate** (Graph)
+   - Query: `sum(rate(http_requests_total{status=~"5.."}[5m]))`
+   - Shows 5xx errors/sec
+
+3. **Request Duration p95** (Graph)
+   - Query: `histogram_quantile(0.95, rate(http_request_duration_seconds_bucket[5m]))`
+   - Shows 95th percentile latency
+
+4. **Request Duration Heatmap** (Heatmap)
+   - Query: `rate(http_request_duration_seconds_bucket[5m])`
+   - Visualizes latency distribution
+
+5. **Active Requests** (Gauge/Graph)
+   - Query: `http_requests_in_progress`
+   - Shows concurrent requests
+
+6. **Status Code Distribution** (Pie Chart)
+   - Query: `sum by (status) (rate(http_requests_total[5m]))`
+   - Shows 2xx vs 4xx vs 5xx
+
+7. **Uptime** (Stat)
+   - Query: `up{job="app"}`
+   - Shows if service is up (1) or down (0)
+
+**Panel configuration tips:**
+- Set appropriate time ranges
+- Use legends with `{{label}}` syntax
+- Set units (requests/sec, seconds, etc.)
+- Add thresholds for alerting visualization
+
+#### 3.4 Import Community Dashboards
+
+**Grafana has pre-built dashboards:**
+
+**For Prometheus metrics:**
+- Dashboard ID: **3662** (Prometheus 2.0 Overview)
+
+**For Loki:**
+- Dashboard ID: **13407** (Loki Dashboard)
+
+**To import:**
+1. **Dashboards** → **New** → **Import**
+2. Enter dashboard ID
+3. Select Prometheus data source
+4. **Import**
+
+Customize these for your needs.
+
+**Evidence Required:**
+- Screenshot of your custom application dashboard with live data
+- Screenshot showing all 6+ panels working
+- Exported dashboard JSON file
+
+---
+
+### Task 4 — Production Configuration (2 pts)
+
+Harden the monitoring stack for production use.
+
+#### 4.1 Add Health Checks
+
+**Add health checks to all services in `docker-compose.yml`:**
+
+**Prometheus:**
+```yaml
+healthcheck:
+  test: ["CMD-SHELL", "wget --no-verbose --tries=1 --spider http://localhost:9090/-/healthy || exit 1"]
+  interval: 10s
+  timeout: 5s
+  retries: 5
+```
+
+**Your app:**
+```yaml
+healthcheck:
+  test: ["CMD-SHELL", "curl -f http://localhost:8000/health || exit 1"]
+  interval: 10s
+  timeout: 5s
+  retries: 5
+```
+
+#### 4.2 Configure Resource Limits
+
+**Set limits on all services:**
+- Prometheus: 1G memory, 1 CPU
+- Loki: 1G memory, 1 CPU
+- Grafana: 512M memory, 0.5 CPU
+- Apps: 256M memory, 0.5 CPU
+
+#### 4.3 Data Retention
+
+**Configure retention periods:**
+
+**Prometheus retention:**
+```yaml
+command:
+  - '--config.file=/etc/prometheus/prometheus.yml'
+  - '--storage.tsdb.retention.time=15d'
+  - '--storage.tsdb.retention.size=10GB'
+```
+
+**Why retention matters:**
+- Disk space management
+- Query performance (smaller dataset = faster queries)
+- Compliance requirements
+
+#### 4.4 Persistent Volumes
+
+**Ensure data survives container restarts:**
+```yaml
+volumes:
+  prometheus-data:
+  loki-data:
+  grafana-data:
+```
+
+**Test persistence:**
+1. Create dashboard
+2. Stop containers: `docker compose down`
+3. Start containers: `docker compose up -d`
+4. Dashboard should still exist
+
+**Evidence Required:**
+- `docker compose ps` showing all services healthy
+- Documentation of retention policies
+- Proof of data persistence after restart
+
+---
+
+### Task 5 — Documentation (2 pts)
+
+Create `monitoring/docs/LAB08.md` documenting your implementation.
+
+**Required sections:**
+1. **Architecture** - Diagram showing metric flow (app → Prometheus → Grafana)
+2. **Application Instrumentation** - What metrics you added and why
+3. **Prometheus Configuration** - Scrape targets, intervals, retention
+4. **Dashboard Walkthrough** - Each panel's purpose and query
+5. **PromQL Examples** - 5+ queries with explanations
+6. **Production Setup** - Health checks, resources, retention policies
+7. **Testing Results** - Screenshots showing everything working
+8. **Challenges & Solutions** - Issues encountered and fixes
+
+**Evidence:**
+- Screenshots of dashboards with live data
+- PromQL queries that demonstrate RED method
+- Proof of all services healthy and scraping
+- Comparison: metrics vs logs (Lab 7) - when to use each
+
+---
+
+## Bonus — Ansible Automation (2.5 pts)
+
+Automate the complete observability stack (Loki + Prometheus + Grafana) deployment with Ansible.
+
+**Extend your `monitoring` role from Lab 7** or create a comprehensive new one.
+
+#### Bonus 1.1 Enhanced Monitoring Role
+
+**Update `roles/monitoring/` to include:**
+- Loki configuration (from Lab 7)
+- Promtail configuration (from Lab 7)
+- **Prometheus configuration** (new)
+- Grafana data sources (Loki + Prometheus)
+- Grafana dashboard provisioning (logs + metrics)
+
+#### Bonus 1.2 Variables to Parameterize
+
+**File:** `roles/monitoring/defaults/main.yml`
+
+**Add Prometheus variables:**
+```yaml
+# Prometheus Configuration
+prometheus_version: "3.9.0"
+prometheus_port: 9090
+prometheus_retention_days: 15
+prometheus_retention_size: "10GB"
+prometheus_scrape_interval: "15s"
+
+# Scrape Targets
+prometheus_targets:
+  - job: "prometheus"
+    targets: ["localhost:9090"]
+  - job: "loki"
+    targets: ["loki:3100"]
+  - job: "grafana"
+    targets: ["grafana:3000"]
+  - job: "app"
+    targets: ["app-python:8000"]
+    path: "/metrics"
+```
+
+#### Bonus 1.3 Template Prometheus Config
+
+**File:** `roles/monitoring/templates/prometheus.yml.j2`
+
+**Use Jinja2 to generate config from variables:**
+```yaml
+global:
+  scrape_interval: {{ prometheus_scrape_interval }}
+
+scrape_configs:
+{% for target in prometheus_targets %}
+  - job_name: '{{ target.job }}'
+    static_configs:
+      - targets: {{ target.targets }}
+{% if target.path is defined %}
+    metrics_path: '{{ target.path }}'
+{% endif %}
+{% endfor %}
+```
+
+#### Bonus 1.4 Provision Grafana Dashboards
+
+**Automatically provision dashboards:**
+
+**File:** `roles/monitoring/files/grafana-app-dashboard.json`
+- Export your application dashboard JSON
+- Add to Ansible role files
+
+**File:** `roles/monitoring/tasks/grafana.yml`
+```yaml
+- name: Provision Grafana dashboards
+  copy:
+    src: "{{ item }}"
+    dest: "{{ monitoring_dir }}/grafana/provisioning/dashboards/"
+  loop:
+    - grafana-app-dashboard.json
+    - grafana-logs-dashboard.json
+```
+
+#### Bonus 1.5 End-to-End Deployment
+
+**Single playbook deploys everything:**
+```bash
+ansible-playbook playbooks/deploy-monitoring.yml
+```
+
+**Should deploy:**
+- Loki + Promtail + Grafana (Lab 7)
+- Prometheus (Lab 8)
+- Grafana data sources (Loki + Prometheus)
+- Grafana dashboards (logs + metrics)
+- All with proper config, health checks, resources
+
+**Evidence Required:**
+- Ansible playbook execution showing idempotency
+- Templated configuration files
+- Screenshot of Grafana with both data sources working
+- Both dashboards (logs + metrics) automatically provisioned
+- Documentation of role structure and variables
+
+---
+
+## Checklist
+
+**Before submitting:**
+- [ ] `/metrics` endpoint added to Python app
+- [ ] prometheus_client installed and configured
+- [ ] Counter, Gauge, Histogram metrics implemented
+- [ ] Prometheus deployed and scraping all targets
+- [ ] All targets showing "UP" in Prometheus UI
+- [ ] Prometheus data source added to Grafana
+- [ ] Custom dashboard with 6+ panels created
+- [ ] PromQL queries demonstrating RED method
+- [ ] Health checks on all services
+- [ ] Resource limits configured
+- [ ] Data retention policies set
+- [ ] Volumes persist after restart
+- [ ] Complete LAB08.md documentation
+- [ ] Screenshots of working dashboards
+
+**Bonus (if attempting):**
+- [ ] Ansible role extended for Prometheus
+- [ ] Variables parameterize all configs
+- [ ] Prometheus config templated with Jinja2
+- [ ] Grafana dashboards auto-provisioned
+- [ ] Single playbook deploys full stack
+- [ ] Idempotency verified
+
+---
+
+## Rubric
+
+| Criteria | Points | Description |
+|----------|--------|-------------|
+| **Application Metrics** | 3 pts | `/metrics` endpoint with Counter, Gauge, Histogram; proper labels |
+| **Prometheus Setup** | 3 pts | Deployed, configured, scraping all targets successfully |
+| **Grafana Dashboards** | 2 pts | Custom dashboard with 6+ panels, PromQL queries |
+| **Production Config** | 2 pts | Health checks, resource limits, retention, persistence |
+| **Documentation** | 2 pts | Complete LAB08.md with architecture, queries, evidence |
+| **Bonus: Ansible** | 2.5 pts | Full stack automation with templates and provisioning |
+| **Total** | 12.5 pts | 10 pts required + 2.5 bonus |
+
+**Grading Scale:**
+- **10/10:** All working, excellent dashboards, production-ready config, thorough docs
+- **8-9/10:** All works, good dashboards, basic production config, good docs
+- **6-7/10:** Core working, simple dashboards, minimal config, basic docs
+- **<6/10:** Incomplete, missing components, needs revision
+
+---
+
+## Resources
+
+<details>
+<summary>📊 Prometheus Documentation</summary>
+
+- [Prometheus Overview](https://prometheus.io/docs/introduction/overview/)
+- [Prometheus Configuration](https://prometheus.io/docs/prometheus/latest/configuration/configuration/)
+- [PromQL Basics](https://prometheus.io/docs/prometheus/latest/querying/basics/)
+- [Metric Types](https://prometheus.io/docs/concepts/metric_types/)
+- [Instrumentation Best Practices](https://prometheus.io/docs/practices/instrumentation/)
+
+</details>
+
+<details>
+<summary>🐍 Python Instrumentation</summary>
+
+- [prometheus_client GitHub](https://github.com/prometheus/client_python)
+- [Python Instrumentation](https://prometheus.io/docs/guides/python/)
+- [Flask Metrics Example](https://github.com/prometheus/client_python#flask)
+- [Metric Naming](https://prometheus.io/docs/practices/naming/)
+
+</details>
+
+<details>
+<summary>📈 Grafana & Dashboards</summary>
+
+- [Grafana Prometheus Data Source](https://grafana.com/docs/grafana/latest/datasources/prometheus/)
+- [Dashboard Best Practices](https://grafana.com/docs/grafana/latest/dashboards/build-dashboards/best-practices/)
+- [PromQL in Grafana](https://grafana.com/docs/grafana/latest/datasources/prometheus/query-editor/)
+- [Dashboard Provisioning](https://grafana.com/docs/grafana/latest/administration/provisioning/#dashboards)
+
+</details>
+
+<details>
+<summary>📚 Observability Concepts</summary>
+
+- [RED Method](https://grafana.com/blog/2018/08/02/the-red-method-how-to-instrument-your-services/)
+- [USE Method](http://www.brendangregg.com/usemethod.html) - For resources
+- [The Four Golden Signals](https://sre.google/sre-book/monitoring-distributed-systems/)
+- [Metrics vs Logs vs Traces](https://peter.bourgon.org/blog/2017/02/21/metrics-tracing-and-logging.html)
+
+</details>
+
+---
+
+## Looking Ahead
+
+- **Lab 9:** Kubernetes - Deploy your monitored apps to K8s
+- **Lab 10:** Helm - Package your monitoring stack as Helm charts
+- **Lab 16:** Kubernetes Monitoring - Full observability with init containers and probes
+
+---
+
+**Good luck!** 🚀
diff --git a/labs/lab09.md b/labs/lab09.md
new file mode 100644
index 0000000000..efcff217f2
--- /dev/null
+++ b/labs/lab09.md
@@ -0,0 +1,730 @@
+# Lab 9 — Kubernetes Fundamentals
+
+![difficulty](https://img.shields.io/badge/difficulty-intermediate-yellow)
+![topic](https://img.shields.io/badge/topic-Kubernetes-blue)
+![points](https://img.shields.io/badge/points-12%2B2.5-orange)
+![tech](https://img.shields.io/badge/tech-Kubernetes-informational)
+
+> Deploy your containerized applications to Kubernetes using declarative manifests and production best practices.
+
+## Overview
+
+Take your Docker images from previous labs and deploy them to Kubernetes. Learn container orchestration fundamentals, declarative configuration, and production deployment patterns.
+
+**What You'll Learn:**
+- Kubernetes core concepts and architecture
+- Writing production-ready manifests
+- Deployments, Services, and networking
+- Health checks and resource management
+- Scaling and updates
+
+**Tech Stack:** Kubernetes 1.33+ | kubectl | minikube or kind | YAML
+
+---
+
+## Tasks
+
+### Task 1 — Local Kubernetes Setup (2 pts)
+
+**Objective:** Set up a local Kubernetes cluster and understand core concepts.
+
+**Requirements:**
+
+1. **Learn Kubernetes Fundamentals**
+   - Study core concepts (Pods, Deployments, Services, Namespaces)
+   - Understand control plane and worker node architecture
+   - Learn the declarative vs imperative approach
+
+2. **Install Tools**
+   - Install `kubectl` (Kubernetes CLI)
+   - Install local cluster: `minikube` OR `kind`
+   - Verify installation with cluster info commands
+
+3. **Cluster Setup**
+   - Start local cluster
+   - Verify all components are running
+   - Explore cluster with kubectl commands
+
+<details>
+<summary>💡 Kubernetes Concepts</summary>
+
+**Core Resources:**
+- **Pod**: Smallest deployable unit, contains one or more containers
+- **Deployment**: Manages replica sets and rolling updates
+- **Service**: Exposes Pods as network service with stable endpoint
+- **Namespace**: Virtual cluster for resource isolation
+
+**Why Kubernetes?**
+- Automatic scaling and load balancing
+- Self-healing (restart failed containers)
+- Rolling updates and rollbacks
+- Service discovery and networking
+- Resource management and scheduling
+
+**Local Development Options:**
+- **minikube**: Full-featured, runs in VM or Docker
+- **kind**: Lightweight, runs in Docker containers, great for CI/CD
+
+**Key Concepts to Research:**
+- Desired state vs actual state
+- Controllers and reconciliation loops
+- Labels and selectors
+- Declarative configuration (YAML manifests)
+
+**Resources:**
+- [What is Kubernetes](https://kubernetes.io/docs/concepts/overview/)
+- [Kubernetes Components](https://kubernetes.io/docs/concepts/overview/components/)
+- [kubectl Cheat Sheet](https://kubernetes.io/docs/reference/kubectl/quick-reference/)
+- [Install Tools](https://kubernetes.io/docs/tasks/tools/)
+
+</details>
+
+<details>
+<summary>💡 Essential kubectl Commands</summary>
+
+**Cluster Information:**
+```bash
+kubectl cluster-info
+kubectl get nodes
+kubectl get namespaces
+```
+
+**Resource Management:**
+```bash
+kubectl get pods
+kubectl get deployments
+kubectl get services
+kubectl describe pod <pod-name>
+kubectl logs <pod-name>
+```
+
+**Apply vs Create:**
+- `kubectl apply` - Declarative, idempotent, preferred
+- `kubectl create` - Imperative, fails if exists
+
+</details>
+
+**Documentation Required:**
+- Terminal output showing successful cluster setup
+- Output of `kubectl cluster-info` and `kubectl get nodes`
+- Brief explanation of your chosen tool (minikube/kind) and why
+
+---
+
+### Task 2 — Application Deployment (3 pts)
+
+**Objective:** Create a Deployment manifest for your Python app with production best practices.
+
+**Requirements:**
+
+1. **Create Deployment Manifest**
+   - File: `k8s/deployment.yml`
+   - Use your Docker image from Lab 2
+   - Minimum 3 replicas
+   - Include resource requests and limits
+   - Add liveness and readiness probes
+   - Use labels for organization
+
+2. **Production Best Practices**
+   - Non-root container (should already be in your image)
+   - Rolling update strategy
+   - Proper container port configuration
+   - Environment variables if needed
+
+<details>
+<summary>💡 Deployment Manifest Structure</summary>
+
+**Essential Sections:**
+```yaml
+apiVersion: apps/v1
+kind: Deployment
+metadata:
+  name: your-app-name
+  labels:
+    app: your-app
+spec:
+  replicas: 3
+  selector:
+    matchLabels:
+      app: your-app
+  template:
+    metadata:
+      labels:
+        app: your-app
+    spec:
+      containers:
+      - name: your-app
+        image: your-dockerhub-username/your-app:latest
+        # Add: ports, resources, probes
+```
+
+**Key Fields to Research:**
+- `replicas`: Number of Pod copies
+- `selector.matchLabels`: How Deployment finds its Pods
+- `template`: Pod specification
+- `resources`: CPU/memory requests and limits
+- `livenessProbe`: Is container healthy?
+- `readinessProbe`: Is container ready for traffic?
+
+**Resources:**
+- [Deployments](https://kubernetes.io/docs/concepts/workloads/controllers/deployment/)
+- [Resource Management](https://kubernetes.io/docs/concepts/configuration/manage-resources-containers/)
+- [Health Checks](https://kubernetes.io/docs/tasks/configure-pod-container/configure-liveness-readiness-startup-probes/)
+
+</details>
+
+<details>
+<summary>💡 Health Checks (Probes)</summary>
+
+**Types of Probes:**
+- **Liveness**: Restart container if failing
+- **Readiness**: Remove from service if not ready
+- **Startup**: For slow-starting containers
+
+**Probe Methods:**
+- HTTP GET (common for web apps)
+- TCP Socket
+- Exec command
+
+**Example Configuration Pattern:**
+```yaml
+livenessProbe:
+  httpGet:
+    path: /health
+    port: 8000
+  initialDelaySeconds: 10
+  periodSeconds: 5
+
+readinessProbe:
+  httpGet:
+    path: /ready
+    port: 8000
+  initialDelaySeconds: 5
+  periodSeconds: 3
+```
+
+**Note:** You may need to add `/health` (liveness) and `/ready` (readiness) endpoints to your app, or point both probes at an endpoint that already exists.
+
+</details>
+
+<details>
+<summary>💡 Resource Management</summary>
+
+**Why Set Resources?**
+- Prevents resource starvation
+- Enables proper scheduling
+- Protects cluster stability
+
+**Pattern:**
+```yaml
+resources:
+  requests:
+    memory: "128Mi"
+    cpu: "100m"
+  limits:
+    memory: "256Mi"
+    cpu: "200m"
+```
+
+**CPU Units:**
+- `1000m` = 1 CPU core
+- `100m` = 0.1 CPU core
+
+**Memory Units:**
+- `Mi` = Mebibyte (1024-based)
+- `Gi` = Gibibyte
+
+</details>
+
+**Test Your Deployment:**
+```bash
+kubectl apply -f k8s/deployment.yml
+kubectl get deployments
+kubectl get pods
+kubectl describe deployment <name>
+```
+
+---
+
+### Task 3 — Service Configuration (2 pts)
+
+**Objective:** Create a Service to expose your Deployment.
+
+**Requirements:**
+
+1. **Create Service Manifest**
+   - File: `k8s/service.yml`
+   - Type: `NodePort` (for local cluster access)
+   - Target your Deployment's Pods using labels
+   - Expose the correct port
+
+2. **Verify Connectivity**
+   - Apply Service manifest
+   - Access app using `minikube service` command or port-forward
+   - Test all endpoints work
+
+<details>
+<summary>💡 Service Types</summary>
+
+**Service Types:**
+- **ClusterIP** (default): Internal cluster access only
+- **NodePort**: Exposes service on each node's IP at a static port
+- **LoadBalancer**: Cloud provider load balancer
+- **ExternalName**: CNAME record for external service
+
+**For Local Development:**
+Use `NodePort` - allows external access without cloud provider.
+
+**Service Manifest Pattern:**
+```yaml
+apiVersion: v1
+kind: Service
+metadata:
+  name: your-app-service
+spec:
+  type: NodePort
+  selector:
+    app: your-app  # Must match Deployment labels
+  ports:
+    - protocol: TCP
+      port: 80        # Service port
+      targetPort: 8000  # Container port
+      nodePort: 30080   # Optional: specific node port (30000-32767)
+```
+
+**Resources:**
+- [Services](https://kubernetes.io/docs/concepts/services-networking/service/)
+- [Connect Applications with Services](https://kubernetes.io/docs/tutorials/services/connect-applications-service/)
+
+</details>
+
+<details>
+<summary>💡 Accessing Your Service</summary>
+
+**Minikube:**
+```bash
+minikube service <service-name>
+minikube service <service-name> --url
+```
+
+**kind or other:**
+```bash
+kubectl port-forward service/<service-name> 8080:80
+```
+
+**Verify:**
+```bash
+kubectl get services
+kubectl describe service <service-name>
+kubectl get endpoints
+```
+
+</details>
+
+---
+
+### Task 4 — Scaling and Updates (2 pts)
+
+**Objective:** Demonstrate scaling and rolling updates.
+
+**Requirements:**
+
+1. **Scaling**
+   - Scale your deployment to 5 replicas
+   - Verify all replicas are running
+   - Document the process
+
+2. **Rolling Updates**
+   - Update your image tag or change a configuration
+   - Apply the updated manifest
+   - Watch the rollout process
+   - Verify zero downtime
+
+3. **Rollback**
+   - Demonstrate rollback capability
+   - Show rollout history
+
+<details>
+<summary>💡 Scaling Operations</summary>
+
+**Declarative (Preferred):**
+Edit `deployment.yml` replicas field, then:
+```bash
+kubectl apply -f k8s/deployment.yml
+```
+
+**Imperative (Quick Testing):**
+```bash
+kubectl scale deployment/<name> --replicas=5
+```
+
+**Watch Scaling:**
+```bash
+kubectl get pods -w
+kubectl rollout status deployment/<name>
+```
+
+</details>
+
+<details>
+<summary>💡 Rolling Updates</summary>
+
+**How Rolling Updates Work:**
+- Creates new Pods with updated spec
+- Waits for them to be ready
+- Terminates old Pods gradually
+- Ensures minimum availability
+
+**Update Strategy:**
+```yaml
+spec:
+  strategy:
+    type: RollingUpdate
+    rollingUpdate:
+      maxSurge: 1        # Extra pods during update
+      maxUnavailable: 0  # Ensure availability
+```
+
+**Useful Commands:**
+```bash
+kubectl apply -f k8s/deployment.yml
+kubectl rollout status deployment/<name>
+kubectl rollout history deployment/<name>
+kubectl rollout undo deployment/<name>
+```
+
+**Resources:**
+- [Performing Rolling Update](https://kubernetes.io/docs/tutorials/kubernetes-basics/update/update-intro/)
+
+</details>
+
+---
+
+### Task 5 — Documentation (3 pts)
+
+**Objective:** Document your Kubernetes implementation.
+
+Create `k8s/README.md` with these sections:
+
+**Required Sections:**
+
+1. **Architecture Overview**
+   - Diagram or description of your deployment architecture
+   - How many Pods, which Services, networking flow
+   - Resource allocation strategy
+
+2. **Manifest Files**
+   - Brief description of each manifest
+   - Key configuration choices
+   - Why you chose specific values (replicas, resources, etc.)
+
+3. **Deployment Evidence**
+   - `kubectl get all` output
+   - `kubectl get pods,svc` with detailed view
+   - `kubectl describe deployment <name>` showing replicas and strategy
+   - Screenshot or curl output showing app working
+
+4. **Operations Performed**
+   - Commands used to deploy
+   - Scaling demonstration output
+   - Rolling update demonstration output
+   - Service access method and verification
+
+5. **Production Considerations**
+   - What health checks did you implement and why?
+   - Resource limits rationale
+   - How would you improve this for production?
+   - Monitoring and observability strategy
+
+6. **Challenges & Solutions**
+   - Issues encountered
+   - How you debugged (logs, describe, events)
+   - What you learned about Kubernetes
+
+---
+
+## Bonus Task — Ingress with TLS (2.5 pts)
+
+**Objective:** Deploy multiple applications with Ingress routing and HTTPS.
+
+**Requirements:**
+
+1. **Multi-App Deployment**
+   - Deploy second application (use different image or different config)
+   - Create Deployment and Service for second app
+
+2. **Ingress Controller**
+   - Enable Ingress in minikube or install in kind
+   - Verify Ingress controller is running
+
+3. **Ingress Resources**
+   - Create Ingress manifest with path-based routing
+   - Route `/app1` to first service
+   - Route `/app2` to second service
+
+4. **TLS Configuration**
+   - Generate self-signed certificate
+   - Create TLS Secret
+   - Configure Ingress for HTTPS
+
+<details>
+<summary>💡 Ingress Concepts</summary>
+
+**What is Ingress?**
+HTTP/HTTPS routing layer sitting in front of Services. Provides:
+- URL-based routing
+- TLS/SSL termination
+- Virtual hosting
+- Load balancing
+
+**Ingress vs Service:**
+- Service: L4 (TCP/UDP) load balancing
+- Ingress: L7 (HTTP/HTTPS) routing
+
+**Ingress Controller:**
+Software that implements Ingress rules. Popular options:
+- nginx-ingress (most common)
+- Traefik
+- HAProxy
+- Cloud provider specific
+
+**Enable in Minikube:**
+```bash
+minikube addons enable ingress
+```
+
+**Install in kind:**
+```bash
+kubectl apply -f https://raw.githubusercontent.com/kubernetes/ingress-nginx/main/deploy/static/provider/kind/deploy.yaml
+```
+
+**Important Note:** The Ingress NGINX controller reaches end of life in March 2026. For production deployments, consider migrating to the [Gateway API](https://gateway-api.sigs.k8s.io/), which is the future of Kubernetes traffic management.
+
+**Resources:**
+- [Ingress](https://kubernetes.io/docs/concepts/services-networking/ingress/)
+- [Ingress Controllers](https://kubernetes.io/docs/concepts/services-networking/ingress-controllers/)
+- [Set up Ingress on Minikube](https://kubernetes.io/docs/tasks/access-application-cluster/ingress-minikube/)
+- [Gateway API](https://gateway-api.sigs.k8s.io/) - Next generation traffic management
+
+</details>
+
+<details>
+<summary>💡 Path-Based Routing</summary>
+
+**Ingress Manifest Pattern:**
+```yaml
+apiVersion: networking.k8s.io/v1
+kind: Ingress
+metadata:
+  name: apps-ingress
+  annotations:
+    nginx.ingress.kubernetes.io/rewrite-target: /
+spec:
+  rules:
+  - host: local.example.com
+    http:
+      paths:
+      - path: /app1
+        pathType: Prefix
+        backend:
+          service:
+            name: app1-service
+            port:
+              number: 80
+      - path: /app2
+        pathType: Prefix
+        backend:
+          service:
+            name: app2-service
+            port:
+              number: 80
+```
+
+**Path Types:**
+- `Exact`: Exact match
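+- `Prefix`: Matches URL path prefix (split by `/`, element by element)
+- `ImplementationSpecific`: Matching is decided by the Ingress controller / IngressClass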
+
+**Testing:**
+Add to `/etc/hosts`:
+```
+<minikube-ip> local.example.com
+```
+
+Access:
+```bash
+curl http://local.example.com/app1
+curl http://local.example.com/app2
+```
+
+</details>
+
+<details>
+<summary>💡 TLS Configuration</summary>
+
+**Generate Self-Signed Certificate:**
+```bash
+openssl req -x509 -nodes -days 365 -newkey rsa:2048 \
+  -keyout tls.key -out tls.crt \
+  -subj "/CN=local.example.com/O=local.example.com"
+```
+
+**Create TLS Secret:**
+```bash
+kubectl create secret tls tls-secret \
+  --key tls.key \
+  --cert tls.crt
+```
+
+**Update Ingress:**
+```yaml
+spec:
+  tls:
+  - hosts:
+    - local.example.com
+    secretName: tls-secret
+  rules:
+  # ... your rules
+```
+
+**Test HTTPS:**
+```bash
+curl -k https://local.example.com/app1
+```
+
+</details>
+
+**Documentation Required:**
+- Both applications deployed and accessible via Ingress
+- Ingress manifest with routing rules
+- TLS configuration and certificate creation steps
+- Terminal output showing all resources
+- curl commands demonstrating routing works
+- Explanation of Ingress benefits over NodePort Services
+
+---
+
+## Checklist
+
+### Task 1 — Local Kubernetes Setup (2 pts)
+- [ ] kubectl and local cluster (minikube/kind) installed
+- [ ] Cluster running successfully
+- [ ] Terminal output showing cluster info
+- [ ] Documentation of setup process
+
+### Task 2 — Application Deployment (3 pts)
+- [ ] `k8s/deployment.yml` exists
+- [ ] Uses Docker image from Lab 2
+- [ ] Minimum 3 replicas configured
+- [ ] Resource requests and limits defined
+- [ ] Liveness and readiness probes configured
+- [ ] Deployment successfully running
+
+### Task 3 — Service Configuration (2 pts)
+- [ ] `k8s/service.yml` exists
+- [ ] Service type: NodePort
+- [ ] Correct label selectors
+- [ ] Service accessible from outside cluster
+- [ ] All endpoints responding
+
+### Task 4 — Scaling and Updates (2 pts)
+- [ ] Scaling to 5 replicas demonstrated
+- [ ] Rolling update performed and documented
+- [ ] Rollback capability demonstrated
+- [ ] Zero downtime verified
+
+### Task 5 — Documentation (3 pts)
+- [ ] `k8s/README.md` complete with all sections
+- [ ] Architecture overview provided
+- [ ] Terminal output evidence included
+- [ ] Operations demonstrated
+- [ ] Production considerations discussed
+- [ ] Challenges and learnings documented
+
+### Bonus — Ingress with TLS (2.5 pts)
+- [ ] Second application deployed
+- [ ] Ingress controller enabled
+- [ ] Ingress manifest with path-based routing
+- [ ] TLS certificate generated
+- [ ] HTTPS working
+- [ ] Documentation complete
+
+---
+
+## Rubric
+
+| Criteria | Points | Description |
+|----------|--------|-------------|
+| **Setup** | 2 pts | Cluster running, tools installed |
+| **Deployment** | 3 pts | Production-ready manifest with probes and resources |
+| **Service** | 2 pts | Properly exposed and accessible |
+| **Scaling & Updates** | 2 pts | Demonstrated operations |
+| **Documentation** | 3 pts | Complete and thorough |
+| **Bonus** | 2.5 pts | Ingress with TLS |
+| **Total** | 14.5 pts | 12 pts required + 2.5 pts bonus |
+
+**Grading:**
+- **12/12:** All requirements met, excellent documentation, deep understanding
+- **10-11/12:** Working deployment, good practices, solid documentation
+- **8-9/12:** Basic deployment works, missing some best practices
+- **<8/12:** Missing requirements, no health checks, poor documentation
+
+---
+
+## Resources
+
+<details>
+<summary>📚 Official Kubernetes Documentation</summary>
+
+- [Kubernetes Documentation](https://kubernetes.io/docs/home/)
+- [Kubernetes Concepts](https://kubernetes.io/docs/concepts/)
+- [kubectl Reference](https://kubernetes.io/docs/reference/kubectl/)
+- [Kubernetes API Reference](https://kubernetes.io/docs/reference/kubernetes-api/)
+
+</details>
+
+<details>
+<summary>🎓 Learning Resources</summary>
+
+- [Kubernetes Basics Tutorial](https://kubernetes.io/docs/tutorials/kubernetes-basics/)
+- [Kubernetes Tutorials](https://kubernetes.io/docs/tutorials/)
+- [Configuration Best Practices](https://kubernetes.io/docs/concepts/configuration/overview/)
+
+</details>
+
+<details>
+<summary>🛠️ Tools</summary>
+
+- [kubectl](https://kubernetes.io/docs/tasks/tools/) - Kubernetes CLI
+- [minikube](https://minikube.sigs.k8s.io/docs/) - Local Kubernetes
+- [kind](https://kind.sigs.k8s.io/) - Kubernetes in Docker
+- [k9s](https://k9scli.io/) - Terminal UI for Kubernetes
+- [kubectx/kubens](https://github.com/ahmetb/kubectx) - Context and namespace switcher
+
+</details>
+
+<details>
+<summary>🔍 Debugging Resources</summary>
+
+- [Debug Pods](https://kubernetes.io/docs/tasks/debug/debug-application/debug-pods/)
+- [Debug Services](https://kubernetes.io/docs/tasks/debug/debug-application/debug-service/)
+- [Troubleshooting Applications](https://kubernetes.io/docs/tasks/debug/debug-application/)
+
+</details>
+
+---
+
+## Looking Ahead
+
+- **Lab 10:** Helm charts for package management
+- **Lab 11:** Secrets management with Vault
+- **Lab 12:** ConfigMaps and application configuration
+- **Lab 13:** ArgoCD for GitOps deployments
+- **Lab 14:** Progressive delivery with Argo Rollouts
+- **Lab 15:** StatefulSets for stateful applications
+- **Lab 16:** Kubernetes monitoring and observability
+
+---
+
+**Good luck!** 🚢
+
+> **Remember:** Kubernetes is declarative. Define desired state, let the control plane make it happen. Use health checks and resource limits from day one.
diff --git a/labs/lab10.md b/labs/lab10.md
new file mode 100644
index 0000000000..11952dedb7
--- /dev/null
+++ b/labs/lab10.md
@@ -0,0 +1,903 @@
+# Lab 10 — Helm Package Manager
+
+![difficulty](https://img.shields.io/badge/difficulty-intermediate-yellow)
+![topic](https://img.shields.io/badge/topic-Helm-blue)
+![points](https://img.shields.io/badge/points-12%2B2.5-orange)
+![tech](https://img.shields.io/badge/tech-Helm-informational)
+
+> Package your Kubernetes applications with Helm for reusable, configurable deployments across environments.
+
+## Overview
+
+Transform your Kubernetes manifests from Lab 9 into Helm charts. Learn templating, values management, lifecycle hooks, and chart best practices for production deployments.
+
+**What You'll Learn:**
+- Helm architecture and templating
+- Creating production-ready charts
+- Values and configuration management
+- Chart hooks for lifecycle events
+- Testing and validating charts
+- Library charts for code reuse
+
+**Tech Stack:** Helm 4.x | Kubernetes 1.33+ | Go templating | YAML
+
+---
+
+## Tasks
+
+### Task 1 — Helm Fundamentals (2 pts)
+
+**Objective:** Understand Helm concepts and set up your environment.
+
+**Requirements:**
+
+1. **Learn Helm Concepts**
+   - Understand Charts, Releases, and Repositories
+   - Learn Go template syntax basics
+   - Study Helm architecture (v4, which keeps the client-only, Tiller-less design introduced in v3)
+
+2. **Install Helm**
+   - Install Helm CLI
+   - Verify installation
+   - Add common chart repositories
+
+3. **Explore Existing Charts**
+   - Search public repositories
+   - Inspect a chart's structure
+   - Understand chart components
+
+<details>
+<summary>💡 Helm Concepts</summary>
+
+**What is Helm?**
+Package manager for Kubernetes. Think `apt`/`yum` for K8s applications.
+
+**Core Concepts:**
+- **Chart**: Package of Kubernetes resources (like a `.deb` or `.rpm`)
+- **Release**: Instance of a chart running in a cluster
+- **Repository**: Collection of charts (like package repositories)
+- **Values**: Configuration parameters for customization
+
+**Why Helm?**
+- **Templating**: Reuse manifests across environments
+- **Versioning**: Track and rollback releases
+- **Dependencies**: Manage complex multi-chart applications
+- **Hooks**: Execute actions during install/upgrade/delete
+- **Standardization**: Industry-standard packaging
+
+**Helm 4 (Current):**
+- Released November 2025, first major version in 6 years
+- Full backward compatibility with Helm 3 charts (apiVersion v2)
+- OCI registry support
+- No Tiller (removed in Helm 3)
+- Improved security and performance
+
+**Chart Structure:**
+```
+mychart/
+├── Chart.yaml          # Chart metadata
+├── values.yaml         # Default configuration values
+├── charts/             # Chart dependencies
+└── templates/          # Kubernetes manifest templates
+    ├── deployment.yaml
+    ├── service.yaml
+    ├── _helpers.tpl    # Template helpers
+    └── NOTES.txt       # Post-install notes
+```
+
+**Resources:**
+- [Helm Architecture](https://helm.sh/docs/topics/architecture/)
+- [Three Big Concepts](https://helm.sh/docs/intro/using_helm/#three-big-concepts)
+- [Charts](https://helm.sh/docs/topics/charts/)
+- [Install Helm](https://helm.sh/docs/intro/install/)
+
+</details>
+
+<details>
+<summary>💡 Essential Helm Commands</summary>
+
+**Repository Management:**
+```bash
+# Note: Traditional HTTP repositories are being phased out
+# Many charts now use OCI registries
+
+# Add a repository (traditional method)
+helm repo add prometheus-community https://prometheus-community.github.io/helm-charts
+helm repo update
+helm search repo prometheus
+
+# Install from OCI registry (modern method)
+helm install my-nginx oci://registry-1.docker.io/bitnamicharts/nginx
+```
+
+**Chart Operations:**
+```bash
+helm create mychart           # Create new chart
+helm lint mychart             # Validate chart
+helm template mychart         # Render templates locally
+helm install myrelease mychart  # Install chart
+helm list                     # List releases
+helm uninstall myrelease      # Remove release
+```
+
+**Debugging:**
+```bash
+helm install --dry-run --debug myrelease mychart
+helm get manifest myrelease
+helm get values myrelease
+```
+
+</details>
+
+**Documentation Required:**
+- Terminal output showing Helm installation and version (should be 4.x)
+- Output of exploring a public chart (e.g., `helm show chart prometheus-community/prometheus`)
+- Brief explanation of Helm's value proposition
+
+---
+
+### Task 2 — Create Your Helm Chart (3 pts)
+
+**Objective:** Convert your Lab 9 Kubernetes manifests into a Helm chart.
+
+**Requirements:**
+
+1. **Initialize Chart**
+   - Create chart in `k8s/` directory
+   - Choose appropriate chart name
+   - Update `Chart.yaml` with metadata
+
+2. **Convert Manifests to Templates**
+   - Move your `deployment.yml` to `templates/deployment.yaml`
+   - Move your `service.yml` to `templates/service.yaml`
+   - Templatize using Go template syntax
+   - Extract values to `values.yaml`
+
+3. **Implement Proper Templating**
+   - Image repository and tag from values
+   - Replica count from values
+   - Resource limits from values
+   - Service type and ports from values
+   - Labels using helper templates
+
+4. **Keep Health Checks**
+   - NEVER comment out liveness/readiness probes
+   - Make probe configuration customizable via values
+   - Provide sensible defaults
+
+<details>
+<summary>💡 Chart.yaml Structure</summary>
+
+**Core Fields** (`apiVersion`, `name`, and `version` are required; the rest are optional but recommended):
+```yaml
+apiVersion: v2              # Chart API version (v2 for Helm 3+)
+name: my-python-app         # Chart name
+description: My Python application Helm chart
+type: application           # application or library
+version: 0.1.0              # Chart version (SemVer)
+appVersion: "1.0"           # App version (can be any string)
+```
+
+**Optional but Recommended:**
+```yaml
+keywords:
+  - python
+  - web
+maintainers:
+  - name: Your Name
+    email: your.email@example.com
+sources:
+  - https://github.com/yourusername/yourapp
+```
+
+**Chart vs App Version:**
+- `version`: Chart version (change when chart changes)
+- `appVersion`: Application version (change when app changes)
+
+</details>
+
+<details>
+<summary>💡 Templating Basics</summary>
+
+**Go Template Syntax:**
+```yaml
+# Access value from values.yaml
+image: {{ .Values.image.repository }}:{{ .Values.image.tag }}
+
+# With default value
+replicas: {{ .Values.replicaCount | default 3 }}
+
+# Conditional
+{{- if .Values.service.enabled }}
+# ... service definition
+{{- end }}
+
+# Range (loop)
+{{- range .Values.env }}
+- name: {{ .name }}
+  value: {{ .value | quote }}  # env values must be strings; quote so 8000/true don't render as int/bool
+{{- end }}
+```
+
+**Built-in Objects:**
+- `.Values`: Values from `values.yaml` and overrides
+- `.Chart`: Contents of `Chart.yaml`
+- `.Release`: Info about the release (name, namespace, etc.)
+- `.Template`: Info about current template
+
+**Example Conversion:**
+
+Before (static):
+```yaml
+apiVersion: apps/v1
+kind: Deployment
+metadata:
+  name: my-app
+spec:
+  replicas: 3
+  template:
+    spec:
+      containers:
+      - name: my-app
+        image: myuser/myapp:v1.0
+```
+
+After (templated):
+```yaml
+apiVersion: apps/v1
+kind: Deployment
+metadata:
+  name: {{ include "mychart.fullname" . }}
+  labels:
+    {{- include "mychart.labels" . | nindent 4 }}
+spec:
+  replicas: {{ .Values.replicaCount }}
+  template:
+    spec:
+      containers:
+      - name: {{ .Chart.Name }}
+        image: "{{ .Values.image.repository }}:{{ .Values.image.tag | default .Chart.AppVersion }}"
+```
+
+</details>
+
+<details>
+<summary>💡 Values.yaml Design</summary>
+
+**Structure Your Values:**
+```yaml
+# values.yaml
+replicaCount: 3
+
+image:
+  repository: yourusername/yourapp
+  tag: "1.0"
+  pullPolicy: IfNotPresent
+
+service:
+  type: NodePort
+  port: 80
+  targetPort: 8000
+
+resources:
+  limits:
+    cpu: 200m
+    memory: 256Mi
+  requests:
+    cpu: 100m
+    memory: 128Mi
+
+livenessProbe:
+  httpGet:
+    path: /health
+    port: 8000
+  initialDelaySeconds: 10
+  periodSeconds: 5
+
+readinessProbe:
+  httpGet:
+    path: /ready
+    port: 8000
+  initialDelaySeconds: 5
+  periodSeconds: 3
+```
+
+**Best Practices:**
+- Nested structure for organization
+- Sensible defaults
+- Document each value
+- Make everything configurable
+- Never hardcode secrets
+
+</details>
+
+<details>
+<summary>💡 Helper Templates</summary>
+
+**_helpers.tpl Pattern:**
+```yaml
+{{/*
+Expand the name of the chart.
+*/}}
+{{- define "mychart.name" -}}
+{{- default .Chart.Name .Values.nameOverride | trunc 63 | trimSuffix "-" }}
+{{- end }}
+
+{{/*
+Create a default fully qualified app name.
+*/}}
+{{- define "mychart.fullname" -}}
+{{- if .Values.fullnameOverride }}
+{{- .Values.fullnameOverride | trunc 63 | trimSuffix "-" }}
+{{- else }}
+{{- $name := default .Chart.Name .Values.nameOverride }}
+{{- printf "%s-%s" .Release.Name $name | trunc 63 | trimSuffix "-" }}
+{{- end }}
+{{- end }}
+
+{{/*
+Common labels
+*/}}
+{{- define "mychart.labels" -}}
+helm.sh/chart: {{ include "mychart.chart" . }}
+{{ include "mychart.selectorLabels" . }}
+app.kubernetes.io/version: {{ .Chart.AppVersion | quote }}
+app.kubernetes.io/managed-by: {{ .Release.Service }}
+{{- end }}
+```
+
+**Why Helpers?**
+- DRY principle
+- Consistent naming
+- Reusable logic
+- Easier maintenance
+
+</details>
+
+**Test Your Chart:**
+```bash
+helm lint k8s/mychart
+helm template mychart k8s/mychart
+helm install --dry-run --debug test-release k8s/mychart
+helm install myrelease k8s/mychart
+```
+
+---
+
+### Task 3 — Multi-Environment Support (2 pts)
+
+**Objective:** Configure chart for different environments using values files.
+
+**Requirements:**
+
+1. **Create Environment-Specific Values**
+   - `values-dev.yaml` for development
+   - `values-prod.yaml` for production
+   - Different configurations per environment
+
+2. **Environment Differences**
+   - Dev: 1 replica, relaxed resources, NodePort
+   - Prod: 3+ replicas, proper resources, LoadBalancer ready
+   - Different image tags or configurations
+
+3. **Test Both Environments**
+   - Install with dev values
+   - Verify configuration
+   - Upgrade to prod values
+   - Verify changes applied
+
+<details>
+<summary>💡 Values Override Pattern</summary>
+
+**values-dev.yaml:**
+```yaml
+replicaCount: 1
+
+image:
+  tag: "latest"
+
+resources:
+  limits:
+    cpu: 100m
+    memory: 128Mi
+  requests:
+    cpu: 50m
+    memory: 64Mi
+
+service:
+  type: NodePort
+
+livenessProbe:
+  initialDelaySeconds: 5
+  periodSeconds: 10
+```
+
+**values-prod.yaml:**
+```yaml
+replicaCount: 5
+
+image:
+  tag: "1.0.0"  # Specific version
+
+resources:
+  limits:
+    cpu: 500m
+    memory: 512Mi
+  requests:
+    cpu: 200m
+    memory: 256Mi
+
+service:
+  type: LoadBalancer
+
+livenessProbe:
+  initialDelaySeconds: 30
+  periodSeconds: 5
+
+readinessProbe:
+  initialDelaySeconds: 10
+  periodSeconds: 3
+```
+
+**Using Values Files:**
+```bash
+# Development
+helm install myapp-dev k8s/mychart -f k8s/mychart/values-dev.yaml
+
+# Production
+helm install myapp-prod k8s/mychart -f k8s/mychart/values-prod.yaml
+
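+# Upgrade an existing release to different values (e.g. dev -> prod)
+helm upgrade myapp-dev k8s/mychart -f k8s/mychart/values-prod.yaml
+
+# Override specific value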
+helm install myapp k8s/mychart --set replicaCount=10
+```
+
+</details>
+
+---
+
+### Task 4 — Chart Hooks (3 pts)
+
+**Objective:** Implement Helm hooks for lifecycle management.
+
+**Requirements:**
+
+1. **Learn Hook Concepts**
+   - Understand hook weights and execution order
+   - Learn hook deletion policies
+
+2. **Implement Hooks**
+   - **Pre-install hook**: Job that runs before installation (e.g., database migration, validation)
+   - **Post-install hook**: Job that runs after installation (e.g., smoke test, notification)
+
+3. **Hook Configuration**
+   - Proper annotations for hook type
+   - Hook weight for execution order
+   - Deletion policy (hook-succeeded)
+
+4. **Verify Hooks**
+   - Lint chart
+   - Dry-run to see hook rendering
+   - Install and verify hook execution
+   - Confirm hooks are deleted per policy
+
+<details>
+<summary>💡 Helm Hooks Concept</summary>
+
+**What Are Hooks?**
+Special Kubernetes resources that execute at specific points in the release lifecycle.
+
+**Hook Types:**
+- `pre-install`: Before resources are installed
+- `post-install`: After all resources are loaded into Kubernetes (Helm waits for them to be ready first only when `--wait` is set)
+- `pre-delete`: Before deletion
+- `post-delete`: After deletion
+- `pre-upgrade`: Before upgrade
+- `post-upgrade`: After upgrade
+- `pre-rollback`: Before rollback
+- `post-rollback`: After rollback
+
+**Hook Weights:**
+- Control execution order
+- Lower weight runs first
+- Default weight: 0
+
+**Hook Deletion Policies:**
+- `before-hook-creation`: Delete the previous hook resource before a new hook is launched (default)
+- `hook-succeeded`: Delete after successful execution
+- `hook-failed`: Delete after failed execution
+
+**Resources:**
+- [Chart Hooks](https://helm.sh/docs/topics/charts_hooks/)
+
+</details>
+
+<details>
+<summary>💡 Hook Implementation Pattern</summary>
+
+**templates/hooks/pre-install-job.yaml:**
+```yaml
+apiVersion: batch/v1
+kind: Job
+metadata:
+  name: "{{ include "mychart.fullname" . }}-pre-install"
+  labels:
+    {{- include "mychart.labels" . | nindent 4 }}
+  annotations:
+    "helm.sh/hook": pre-install
+    "helm.sh/hook-weight": "-5"
+    "helm.sh/hook-delete-policy": hook-succeeded
+spec:
+  template:
+    metadata:
+      name: "{{ include "mychart.fullname" . }}-pre-install"
+    spec:
+      restartPolicy: Never
+      containers:
+      - name: pre-install-job
+        image: busybox
+        command: ['sh', '-c', 'echo Pre-install task running && sleep 10 && echo Pre-install completed']
+```
+
+**templates/hooks/post-install-job.yaml:**
+```yaml
+apiVersion: batch/v1
+kind: Job
+metadata:
+  name: "{{ include "mychart.fullname" . }}-post-install"
+  labels:
+    {{- include "mychart.labels" . | nindent 4 }}
+  annotations:
+    "helm.sh/hook": post-install
+    "helm.sh/hook-weight": "5"
+    "helm.sh/hook-delete-policy": hook-succeeded
+spec:
+  template:
+    metadata:
+      name: "{{ include "mychart.fullname" . }}-post-install"
+    spec:
+      restartPolicy: Never
+      containers:
+      - name: post-install-job
+        image: busybox
+        command: ['sh', '-c', 'echo Post-install validation && sleep 10 && echo Validation passed']
+```
+
+**Real-World Hook Examples:**
+- Pre-install: Database schema migration
+- Post-install: Smoke tests, send notification
+- Pre-upgrade: Backup database
+- Post-upgrade: Run integration tests
+- Pre-delete: Backup data before cleanup
+
+</details>
+
+<details>
+<summary>💡 Testing Hooks</summary>
+
+**Validation Commands:**
+```bash
+# Lint chart
+helm lint k8s/mychart
+
+# Dry run to see hooks
+helm install --dry-run --debug test-release k8s/mychart | grep -A 20 "hook"
+
+# Install and watch hooks
+helm install myrelease k8s/mychart
+kubectl get jobs -w
+kubectl get pods -w
+
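+# Check hook execution (run while the Job still exists: `hook-succeeded` deletes it after success)
+# Job name is "<fullname>-pre-install", i.e. <release>-<chart>-pre-install with the default helpers
+kubectl describe job myrelease-mychart-pre-install
+kubectl logs job/myrelease-mychart-pre-install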
+
+# Verify deletion policy worked
+kubectl get jobs
+```
+
+**Hook Troubleshooting:**
+- Check annotations are correct
+- Verify hook weight if order matters
+- Check pod logs for hook failures
+- Ensure deletion policy is appropriate
+
+</details>
+
+---
+
+### Task 5 — Documentation (2 pts)
+
+**Objective:** Document your Helm chart implementation.
+
+Create `k8s/HELM.md` with these sections:
+
+**Required Sections:**
+
+1. **Chart Overview**
+   - Chart structure explanation
+   - Key template files and their purpose
+   - Values organization strategy
+
+2. **Configuration Guide**
+   - Important values and their purpose
+   - How to customize for different environments
+   - Example installations with different configurations
+
+3. **Hook Implementation**
+   - What hooks you implemented and why
+   - Hook execution order and weights
+   - Deletion policies explanation
+
+4. **Installation Evidence**
+   - `helm list` output
+   - `kubectl get all` showing deployed resources
+   - Hook execution output (`kubectl get jobs`, `kubectl describe job`)
+   - Different environment deployments (dev vs prod)
+
+5. **Operations**
+   - Installation commands used
+   - How to upgrade a release
+   - How to rollback
+   - How to uninstall
+
+6. **Testing & Validation**
+   - `helm lint` output
+   - `helm template` verification
+   - Dry-run output
+   - Application accessibility verification
+
+---
+
+## Bonus Task — Library Charts (2.5 pts)
+
+**Objective:** Create a library chart for shared templates across multiple applications.
+
+**Requirements:**
+
+1. **Deploy Second Application**
+   - Create Helm chart for second app
+   - Notice template duplication (labels, helpers, etc.)
+
+2. **Create Library Chart**
+   - Create library chart in `k8s/common-lib/`
+   - Extract shared templates (labels, names, etc.)
+   - Set chart type to `library` in Chart.yaml
+
+3. **Use Library Chart**
+   - Add library as dependency in both app charts
+   - Reference library templates
+   - Eliminate duplication
+
+4. **Verify**
+   - Both charts install successfully
+   - Templates render correctly using library
+
+<details>
+<summary>💡 Library Chart Concepts</summary>
+
+**What Are Library Charts?**
+Charts that contain only named template definitions (helpers) and render no Kubernetes resources of their own. Used to share common template logic.
+
+**Type: Library**
+- Cannot be installed directly
+- Used as dependencies
+- Share templates across charts
+
+**Common Use Cases:**
+- Standard labels
+- Name generation
+- Security contexts
+- Resource definitions
+- Common configuration patterns
+
+**Resources:**
+- [Library Charts](https://helm.sh/docs/topics/library_charts/)
+
+</details>
+
+<details>
+<summary>💡 Library Chart Implementation</summary>
+
+**k8s/common-lib/Chart.yaml:**
+```yaml
+apiVersion: v2
+name: common-lib
+description: Common templates for all applications
+type: library
+version: 0.1.0
+```
+
+**k8s/common-lib/templates/_labels.tpl:**
+```yaml
+{{/*
+Common labels
+*/}}
+{{- define "common.labels" -}}
+app.kubernetes.io/name: {{ include "common.name" . }}
+app.kubernetes.io/instance: {{ .Release.Name }}
+app.kubernetes.io/version: {{ .Chart.AppVersion | quote }}
+app.kubernetes.io/managed-by: {{ .Release.Service }}
+helm.sh/chart: {{ include "common.chart" . }}
+{{- end }}
+
+{{/*
+Selector labels
+*/}}
+{{- define "common.selectorLabels" -}}
+app.kubernetes.io/name: {{ include "common.name" . }}
+app.kubernetes.io/instance: {{ .Release.Name }}
+{{- end }}
+```
+
+**Using Library Chart:**
+
+**app1/Chart.yaml:**
+```yaml
+apiVersion: v2
+name: app1
+version: 0.1.0
+dependencies:
+  - name: common-lib
+    version: 0.1.0
+    repository: "file://../common-lib"
+```
+
+**app1/templates/deployment.yaml:**
+```yaml
+apiVersion: apps/v1
+kind: Deployment
+metadata:
+  name: {{ include "common.fullname" . }}
+  labels:
+    {{- include "common.labels" . | nindent 4 }}
+spec:
+  selector:
+    matchLabels:
+      {{- include "common.selectorLabels" . | nindent 6 }}
+  # ... rest of deployment
+```
+
+**Install with Dependencies:**
+```bash
+helm dependency update k8s/app1
+helm install app1-release k8s/app1
+```
+
+</details>
+
+**Documentation Required:**
+- Library chart structure
+- Shared templates implemented
+- How both apps use the library
+- Benefits of this approach (DRY, consistency, maintainability)
+- Terminal output showing successful deployment of both apps
+
+---
+
+## Checklist
+
+### Task 1 — Helm Fundamentals (2 pts)
+- [ ] Helm installed and verified
+- [ ] Chart repositories explored
+- [ ] Helm concepts understood
+- [ ] Documentation of setup
+
+### Task 2 — Create Your Helm Chart (3 pts)
+- [ ] Chart created in `k8s/` directory
+- [ ] `Chart.yaml` properly configured
+- [ ] Manifests converted to templates
+- [ ] Values properly extracted
+- [ ] Helper templates implemented
+- [ ] Health checks remain functional (not commented out!)
+- [ ] Chart installs successfully
+
+### Task 3 — Multi-Environment Support (2 pts)
+- [ ] `values-dev.yaml` created
+- [ ] `values-prod.yaml` created
+- [ ] Environment-specific configurations
+- [ ] Both environments tested
+- [ ] Documentation of differences
+
+### Task 4 — Chart Hooks (3 pts)
+- [ ] Pre-install hook implemented
+- [ ] Post-install hook implemented
+- [ ] Proper hook annotations
+- [ ] Hook weights configured
+- [ ] Deletion policies applied
+- [ ] Hooks execute successfully
+- [ ] Hooks deleted per policy
+
+### Task 5 — Documentation (2 pts)
+- [ ] `k8s/HELM.md` complete
+- [ ] Chart structure explained
+- [ ] Configuration guide provided
+- [ ] Hook implementation documented
+- [ ] Installation evidence included
+- [ ] Operations documented
+
+### Bonus — Library Charts (2.5 pts)
+- [ ] Library chart created
+- [ ] Shared templates extracted
+- [ ] Two app charts using library
+- [ ] Dependencies configured
+- [ ] Both apps deploy successfully
+- [ ] Documentation complete
+
+---
+
+## Rubric
+
+| Criteria | Points | Description |
+|----------|--------|-------------|
+| **Fundamentals** | 2 pts | Helm installed, concepts understood |
+| **Chart Creation** | 3 pts | Proper templating, values, helpers |
+| **Multi-Environment** | 2 pts | Different configs, tested |
+| **Hooks** | 3 pts | Pre/post install hooks working |
+| **Documentation** | 2 pts | Complete HELM.md |
+| **Bonus** | 2.5 pts | Library chart implementation |
+| **Total** | 14.5 pts | 12 pts required + 2.5 pts bonus |
+
+**Grading:**
+- **12/12:** Excellent templating, working hooks, multi-env, great docs
+- **10-11/12:** Working chart, hooks function, good documentation
+- **8-9/12:** Basic chart works, missing best practices or hooks
+- **<8/12:** Chart doesn't install, commented out probes, poor templating
+
+---
+
+## Resources
+
+<details>
+<summary>📚 Official Helm Documentation</summary>
+
+- [Helm Documentation](https://helm.sh/docs/)
+- [Chart Best Practices](https://helm.sh/docs/chart_best_practices/)
+- [Chart Template Guide](https://helm.sh/docs/chart_template_guide/)
+- [Helm Commands](https://helm.sh/docs/helm/)
+
+</details>
+
+<details>
+<summary>🎓 Learning Resources</summary>
+
+- [Quickstart Guide](https://helm.sh/docs/intro/quickstart/)
+- [Using Helm](https://helm.sh/docs/intro/using_helm/)
+- [Built-in Objects (Chart Template Guide)](https://helm.sh/docs/chart_template_guide/builtin_objects/)
+- [Chart Development Tips](https://helm.sh/docs/howto/charts_tips_and_tricks/)
+
+</details>
+
+<details>
+<summary>🛠️ Tools</summary>
+
+- [Helm](https://helm.sh/) - Official site
+- [Artifact Hub](https://artifacthub.io/) - Public chart repository
+- [helm-docs](https://github.com/norwoodj/helm-docs) - Generate docs from values
+- [chart-testing](https://github.com/helm/chart-testing) - Lint and test charts
+
+</details>
+
+<details>
+<summary>📦 Public Chart Repositories</summary>
+
+- [Bitnami Charts](https://github.com/bitnami/charts)
+- [Prometheus Community](https://github.com/prometheus-community/helm-charts)
+- [Grafana Charts](https://github.com/grafana/helm-charts)
+
+</details>
+
+---
+
+## Looking Ahead
+
+- **Lab 11:** Secrets management with Vault (integrate with Helm)
+- **Lab 12:** ConfigMaps and persistent volumes
+- **Lab 13:** ArgoCD deploys Helm charts via GitOps
+- **Lab 14:** Progressive delivery with Argo Rollouts
+- **Lab 15:** StatefulSets for stateful applications
+
+---
+
+**Good luck!** ⛵
+
+> **Remember:** Helm makes your deployments reusable and configurable. Never comment out health checks - configure them properly. Template everything, hardcode nothing (except defaults).
diff --git a/labs/lab11.md b/labs/lab11.md
new file mode 100644
index 0000000000..e69ab67618
--- /dev/null
+++ b/labs/lab11.md
@@ -0,0 +1,447 @@
+# Lab 11 — Kubernetes Secrets & HashiCorp Vault
+
+![difficulty](https://img.shields.io/badge/difficulty-intermediate-yellow)
+![topic](https://img.shields.io/badge/topic-Secret%20Management-blue)
+![points](https://img.shields.io/badge/points-10%2B2.5-orange)
+![tech](https://img.shields.io/badge/tech-Vault%20%7C%20K8s%20Secrets-informational)
+
+> Secure your Kubernetes applications by implementing proper secret management with native Secrets and HashiCorp Vault integration.
+
+## Overview
+
+Secret management is critical for production Kubernetes deployments. Hardcoded credentials in code or config files are a security nightmare. This lab teaches you how to properly manage sensitive data using Kubernetes native Secrets and enterprise-grade HashiCorp Vault.
+
+**What You'll Learn:**
+- Kubernetes Secrets creation and consumption
+- Base64 encoding vs actual encryption
+- Helm-based secret management
+- HashiCorp Vault installation and configuration
+- Kubernetes authentication with Vault
+- Sidecar injection pattern for secrets
+
+**Building On:** Your Helm chart from Lab 10 will be extended with secret management capabilities.
+
+**Tech Stack:** Kubernetes Secrets | HashiCorp Vault 1.18+ | Vault Helm 0.28+ | Vault Agent Injector
+
+---
+
+## Tasks
+
+### Task 1 — Kubernetes Secrets Fundamentals (2 pts)
+
+**Objective:** Understand how Kubernetes Secrets work and their security model.
+
+**Requirements:**
+
+1. **Create a Secret Using kubectl**
+   - Create a secret named `app-credentials` with:
+     - `username` key
+     - `password` key
+   - Use the imperative `kubectl create secret` command
+
+2. **Examine the Secret**
+   - View the secret in YAML format
+   - Decode the base64-encoded values
+   - Understand what "encoding" vs "encryption" means
+
+3. **Understand Security Implications**
+   - Research: Are Kubernetes Secrets encrypted at rest by default?
+   - What is etcd encryption and when should you enable it?
+
+<details>
+<summary>💡 Hints</summary>
+
+**Creating Secrets:**
+There are multiple ways to create secrets:
+- `kubectl create secret generic` - from literals or files
+- `kubectl create secret docker-registry` - for image pull secrets
+- `kubectl create secret tls` - for TLS certificates
+
+**Useful Commands:**
+```bash
+# Create from literals
+kubectl create secret generic <name> --from-literal=key=value
+
+# View secret
+kubectl get secret <name> -o yaml
+
+# Decode base64 (Linux/Mac)
+echo "<base64-string>" | base64 -d
+```
+
+**Security Model:**
+Kubernetes Secrets are base64-encoded, NOT encrypted by default. Anyone with API access can decode them. For production:
+- Enable etcd encryption at rest
+- Use RBAC to limit secret access
+- Consider external secret managers (Vault, AWS Secrets Manager, etc.)
+
+**Resources:**
+- [Kubernetes Secrets Concepts](https://kubernetes.io/docs/concepts/configuration/secret/)
+- [Encrypting Secret Data at Rest](https://kubernetes.io/docs/tasks/administer-cluster/encrypt-data/)
+
+</details>
+
+---
+
+### Task 2 — Helm-Managed Secrets (3 pts)
+
+**Objective:** Integrate secrets into your Helm chart and inject them into your application.
+
+**Requirements:**
+
+1. **Create Secret Template**
+   - Add `templates/secrets.yaml` to your Helm chart
+   - Define secret values in `values.yaml` (with placeholder defaults)
+   - Use proper templating for secret name and labels
+
+2. **Inject Secrets as Environment Variables**
+   - Update your deployment to consume the secret
+   - Use `envFrom` with `secretRef` for all keys
+   - OR use individual `env` entries with `secretKeyRef`
+
+3. **Verify Secret Injection**
+   - Deploy the updated chart
+   - Exec into the pod and verify environment variables
+   - Ensure secrets are not visible in `kubectl describe pod`
+
+4. **Add Resource Limits**
+   - Configure CPU and memory requests/limits in your deployment
+   - Use values.yaml for configurability
+   - Apply Kubernetes resource management best practices
+
+<details>
+<summary>💡 Hints</summary>
+
+**Secret Template Structure:**
+Your `templates/secrets.yaml` should:
+- Use the standard `v1` API and `Secret` kind
+- Include proper metadata with templated name and labels
+- Reference values from `values.yaml`
+- Use `stringData` for plain text (auto-encoded) or `data` for pre-encoded
+
+**Consuming Secrets in Deployment:**
+There are two patterns for environment variables:
+
+Pattern 1 - All keys from secret:
+```yaml
+envFrom:
+  - secretRef:
+      name: {{ include "mychart.fullname" . }}-secret
+```
+
+Pattern 2 - Specific keys:
+```yaml
+env:
+  - name: DATABASE_PASSWORD
+    valueFrom:
+      secretKeyRef:
+        name: secret-name
+        key: password
+```
+
+**Resource Limits:**
+```yaml
+resources:
+  requests:
+    memory: "64Mi"
+    cpu: "100m"
+  limits:
+    memory: "128Mi"
+    cpu: "200m"
+```
+
+**Security Note:**
+Never commit real secrets to Git! Use:
+- Placeholder values in `values.yaml`
+- `--set` flag during install
+- External secret management (next task)
+
+**Resources:**
+- [Managing Secrets with kubectl](https://kubernetes.io/docs/tasks/configmap-secret/managing-secret-using-kubectl/)
+- [Resource Management](https://kubernetes.io/docs/concepts/configuration/manage-resources-containers/)
+
+</details>
+
+---
+
+### Task 3 — HashiCorp Vault Integration (3 pts)
+
+**Objective:** Deploy HashiCorp Vault and configure it to inject secrets into your application.
+
+**Requirements:**
+
+1. **Install Vault via Helm**
+   - Add HashiCorp Helm repository
+   - Install Vault in dev mode (for learning purposes)
+   - Verify all Vault pods are running
+
+2. **Configure Vault**
+   - Enable KV secrets engine (v2)
+   - Create a secret path for your application
+   - Store at least two key-value pairs
+
+3. **Configure Kubernetes Authentication**
+   - Enable Kubernetes auth method in Vault
+   - Create a policy that grants read access to your secret path
+   - Create a role bound to your application's service account
+
+4. **Enable Vault Agent Injection**
+   - Add Vault annotations to your deployment
+   - Configure the agent to inject secrets as files
+   - Verify secrets are available inside the pod at the expected path
+
+<details>
+<summary>💡 Hints</summary>
+
+**Installing Vault:**
+```bash
+# Add repo
+helm repo add hashicorp https://helm.releases.hashicorp.com
+helm repo update
+
+# Install in dev mode (NOT for production!)
+helm install vault hashicorp/vault \
+  --set "server.dev.enabled=true" \
+  --set "injector.enabled=true"
+```
+
+**Vault Configuration Steps:**
+1. Exec into Vault pod: `kubectl exec -it vault-0 -- /bin/sh`
+2. Vault is auto-initialized in dev mode
+3. Use `vault` CLI inside the pod
+
+**Key Vault Commands:**
+```bash
+# Enable KV v2 (dev mode already mounts KV v2 at secret/ — skip this if you get "path is already in use")
+vault secrets enable -path=secret kv-v2
+
+# Create secret
+vault kv put secret/myapp/config username="admin" password="secret123"
+
+# Enable K8s auth
+vault auth enable kubernetes
+
+# Configure K8s auth (get values from your cluster)
+vault write auth/kubernetes/config \
+  kubernetes_host="https://$KUBERNETES_PORT_443_TCP_ADDR:443"
+```
+
+**Policy and Role:**
+You need to:
+1. Create a policy that allows reading from your secret path
+2. Create a role that binds the policy to your service account
+
+**Vault Agent Annotations:**
+Add these to your deployment's pod template:
+```yaml
+annotations:
+  vault.hashicorp.com/agent-inject: "true"
+  vault.hashicorp.com/role: "your-role"
+  vault.hashicorp.com/agent-inject-secret-config: "secret/data/myapp/config"
+```
+
+**Resources:**
+- [Vault Helm Chart](https://developer.hashicorp.com/vault/docs/platform/k8s/helm)
+- [Vault K8s Sidecar Tutorial](https://developer.hashicorp.com/vault/tutorials/kubernetes/kubernetes-sidecar)
+- [Agent Annotations](https://developer.hashicorp.com/vault/docs/platform/k8s/injector/annotations)
+
+</details>
+
+---
+
+### Task 4 — Documentation (2 pts)
+
+**Objective:** Document your secret management implementation.
+
+**Create `k8s/SECRETS.md` with:**
+
+1. **Kubernetes Secrets**
+   - Output of creating and viewing your secret
+   - Decoded secret values demonstration
+   - Explanation of base64 encoding vs encryption
+
+2. **Helm Secret Integration**
+   - Chart structure showing secrets.yaml
+   - How secrets are consumed in deployment
+   - Verification output (env vars in pod, excluding actual values)
+
+3. **Resource Management**
+   - Resource limits configuration
+   - Explanation of requests vs limits
+   - How to choose appropriate values
+
+4. **Vault Integration**
+   - Vault installation verification (`kubectl get pods`)
+   - Policy and role configuration (sanitized)
+   - Proof of secret injection (show file exists, path structure)
+   - Explanation of the sidecar injection pattern
+
+5. **Security Analysis**
+   - Comparison: K8s Secrets vs Vault
+   - When to use each approach
+   - Production recommendations
+
+---
+
+## Bonus Task — Vault Agent Templates (2.5 pts)
+
+**Objective:** Use Vault Agent templating to render secrets in custom formats.
+
+**Requirements:**
+
+1. **Implement Template Annotation**
+   - Use `vault.hashicorp.com/agent-inject-template-*` annotation
+   - Render secrets as a configuration file (e.g., `.env` format or JSON)
+   - Include multiple secrets in a single rendered file
+
+2. **Dynamic Secret Rotation**
+   - Research how Vault Agent handles secret updates
+   - Document the refresh mechanism
+   - Explain `vault.hashicorp.com/agent-inject-command` annotation
+
+3. **Named Templates for Environment Variables**
+   - Create a named template in `_helpers.tpl` for common environment variables
+   - Use `include` to reference it in your deployment
+   - Demonstrate DRY principle in Helm charts
+
+<details>
+<summary>💡 Hints</summary>
+
+**Template Annotation Example:**
+```yaml
+vault.hashicorp.com/agent-inject-template-config: |
+  {{- with secret "secret/data/myapp/config" -}}
+  DATABASE_URL={{ .Data.data.db_url }}
+  API_KEY={{ .Data.data.api_key }}
+  {{- end -}}
+```
+
+**Named Template Pattern:**
+In `_helpers.tpl`:
+```yaml
+{{- define "mychart.envVars" -}}
+- name: APP_ENV
+  value: {{ .Values.environment | quote }}
+- name: LOG_LEVEL
+  value: {{ .Values.logLevel | quote }}
+{{- end -}}
+```
+
+In deployment:
+```yaml
+env:
+  {{- include "mychart.envVars" . | nindent 12 }}
+```
+
+**Resources:**
+- [Vault Agent Templates](https://developer.hashicorp.com/vault/docs/platform/k8s/injector/annotations#vault-hashicorp-com-agent-inject-template)
+- [Helm Named Templates](https://helm.sh/docs/chart_template_guide/named_templates/)
+
+</details>
+
+**Bonus Documentation:**
+- Template annotation configuration
+- Rendered secret file content
+- Named template implementation
+- Benefits of templating approach
+
+---
+
+## Checklist
+
+### Task 1 — Kubernetes Secrets Fundamentals (2 pts)
+- [ ] Secret created via kubectl
+- [ ] Secret viewed and decoded
+- [ ] Security implications understood and documented
+
+### Task 2 — Helm-Managed Secrets (3 pts)
+- [ ] `templates/secrets.yaml` created
+- [ ] Secrets defined in `values.yaml`
+- [ ] Deployment updated to consume secrets
+- [ ] Environment variables verified in pod
+- [ ] Resource limits configured
+
+### Task 3 — HashiCorp Vault Integration (3 pts)
+- [ ] Vault installed via Helm
+- [ ] KV secrets engine configured
+- [ ] Kubernetes auth method enabled
+- [ ] Policy and role created
+- [ ] Vault Agent injection working
+- [ ] Secrets accessible in pod
+
+### Task 4 — Documentation (2 pts)
+- [ ] `k8s/SECRETS.md` complete
+- [ ] All sections documented with evidence
+- [ ] Security analysis included
+
+### Bonus — Vault Agent Templates (2.5 pts)
+- [ ] Template annotation implemented
+- [ ] Custom format rendering working
+- [ ] Named templates in `_helpers.tpl`
+- [ ] Documentation complete
+
+---
+
+## Rubric
+
+| Criteria | Points | Description |
+|----------|--------|-------------|
+| **K8s Secrets** | 2 pts | Create, view, decode, understand security |
+| **Helm Secrets** | 3 pts | Template, inject, verify, resource limits |
+| **Vault Integration** | 3 pts | Install, configure, auth, inject |
+| **Documentation** | 2 pts | Complete SECRETS.md with evidence |
+| **Bonus** | 2.5 pts | Templates, named templates, rotation |
+| **Total** | 12.5 pts | 10 pts required + 2.5 pts bonus |
+
+**Grading:**
+- **10/10:** Working Vault injection, proper Helm secrets, good documentation
+- **8-9/10:** Vault working, minor issues with docs or config
+- **6-7/10:** K8s secrets work, Vault partially configured
+- **<6/10:** Secrets not properly implemented, missing Vault setup
+
+---
+
+## Resources
+
+<details>
+<summary>📚 Official Documentation</summary>
+
+- [Kubernetes Secrets](https://kubernetes.io/docs/concepts/configuration/secret/)
+- [HashiCorp Vault](https://developer.hashicorp.com/vault/docs)
+- [Vault Helm Chart](https://developer.hashicorp.com/vault/docs/platform/k8s/helm)
+- [Vault K8s Injector](https://developer.hashicorp.com/vault/docs/platform/k8s/injector)
+
+</details>
+
+<details>
+<summary>🎓 Tutorials</summary>
+
+- [Vault on Kubernetes Deployment Guide](https://developer.hashicorp.com/vault/tutorials/kubernetes/kubernetes-raft-deployment-guide)
+- [Injecting Secrets into Kubernetes Pods](https://developer.hashicorp.com/vault/tutorials/kubernetes/kubernetes-sidecar)
+- [Kubernetes Auth Method](https://developer.hashicorp.com/vault/docs/auth/kubernetes)
+
+</details>
+
+<details>
+<summary>🔐 Security Best Practices</summary>
+
+- [Kubernetes Secrets Best Practices](https://kubernetes.io/docs/concepts/security/secrets-good-practices/)
+- [Encrypting Data at Rest](https://kubernetes.io/docs/tasks/administer-cluster/encrypt-data/)
+- [External Secrets Operator](https://external-secrets.io/) - Alternative approach
+
+</details>
+
+---
+
+## Looking Ahead
+
+- **Lab 12:** ConfigMaps for non-sensitive configuration and persistent storage
+- **Lab 13:** ArgoCD will deploy your secured Helm charts via GitOps
+- **Lab 14:** Progressive delivery with Argo Rollouts
+- **Lab 15:** StatefulSets with persistent storage
+
+---
+
+**Good luck!** 🔐
+
+> **Remember:** Never commit real secrets to version control. Use placeholder values and inject real secrets at deployment time. In production, always use an external secret manager like Vault.
diff --git a/labs/lab12.md b/labs/lab12.md
new file mode 100644
index 0000000000..76fffacf8f
--- /dev/null
+++ b/labs/lab12.md
@@ -0,0 +1,466 @@
+# Lab 12 — ConfigMaps & Persistent Volumes
+
+![difficulty](https://img.shields.io/badge/difficulty-intermediate-yellow)
+![topic](https://img.shields.io/badge/topic-Configuration%20%26%20Storage-blue)
+![points](https://img.shields.io/badge/points-10%2B2.5-orange)
+![tech](https://img.shields.io/badge/tech-ConfigMaps%20%7C%20PVC-informational)
+
+> Externalize application configuration with ConfigMaps and ensure data persistence with Persistent Volumes.
+
+## Overview
+
+Production applications need externalized configuration and persistent storage. ConfigMaps decouple configuration from container images, enabling the same image to run in different environments. Persistent Volumes ensure your application data survives pod restarts and rescheduling.
+
+**What You'll Learn:**
+- ConfigMap creation and mounting strategies
+- File-based vs environment variable configuration
+- Persistent Volume Claims (PVC) in Kubernetes
+- Volume mounting and data persistence
+- Configuration best practices
+
+**Building On:** Your Helm chart from Lab 11 will be extended with ConfigMaps and persistent storage.
+
+**Tech Stack:** Kubernetes ConfigMaps | PersistentVolumeClaim | Helm | Volume Mounts
+
+---
+
+## Tasks
+
+### Task 1 — Application Persistence Upgrade (2 pts)
+
+**Objective:** Modify your application to track and persist visit counts.
+
+**Requirements:**
+
+1. **Add Visits Counter Logic**
+   - Implement a counter that increments on each request to the root endpoint
+   - Store the counter value in a file (e.g., `/data/visits`)
+   - Create a new `/visits` endpoint that returns the current count
+
+2. **Update Application Code**
+   - Read counter from file on startup (default to 0 if file doesn't exist)
+   - Increment and save on each root endpoint access
+   - Handle concurrent access appropriately
+
+3. **Test Locally with Docker**
+   - Update `docker-compose.yml` to mount a volume for the visits file
+   - Verify the counter persists across container restarts
+   - Update your application's `README.md`
+
+<details>
+<summary>💡 Hints</summary>
+
+**Implementation Pattern:**
+```
+Request to / → Read counter from file → Increment → Write back → Return response
+Request to /visits → Read counter from file → Return count
+```
+
+**File-Based Counter:**
+- Use a simple text file or JSON
+- Handle file not found gracefully
+- Consider atomic write operations
+
+**Docker Compose Volume:**
+```yaml
+volumes:
+  - ./data:/data
+```
+
+**Testing:**
+1. Start container
+2. Access root endpoint multiple times
+3. Check file on host: `cat ./data/visits`
+4. Restart container
+5. Verify counter continues from last value
+
+**Thread Safety:**
+For a simple counter, file locking or atomic operations help prevent race conditions. For this lab, basic file read/write is acceptable.
+
+</details>
+
+---
+
+### Task 2 — ConfigMaps (3 pts)
+
+**Objective:** Externalize application configuration using Kubernetes ConfigMaps.
+
+**Requirements:**
+
+1. **Create Configuration File**
+   - Create a `files/` directory in your Helm chart
+   - Add `config.json` with application configuration:
+     - Application name
+     - Environment (dev/prod)
+     - Feature flags or settings
+
+2. **Create ConfigMap Template**
+   - Add `templates/configmap.yaml` to your Helm chart
+   - Use `.Files.Get` to load the config file content
+   - Include proper metadata and labels
+
+3. **Mount ConfigMap as File**
+   - Update deployment to mount ConfigMap as a volume
+   - Mount at a specific path (e.g., `/config/config.json`)
+   - Verify the file is accessible inside the pod
+
+4. **Use ConfigMap as Environment Variables**
+   - Create a second ConfigMap with key-value pairs
+   - Use `envFrom` with `configMapRef` to inject all keys
+   - Verify environment variables in the pod
+
+<details>
+<summary>💡 Hints</summary>
+
+**ConfigMap from File:**
+```yaml
+apiVersion: v1
+kind: ConfigMap
+metadata:
+  name: {{ include "mychart.fullname" . }}-config
+data:
+  config.json: |-
+{{ .Files.Get "files/config.json" | indent 4 }}
+```
+
+**ConfigMap for Env Vars:**
+```yaml
+apiVersion: v1
+kind: ConfigMap
+metadata:
+  name: {{ include "mychart.fullname" . }}-env
+data:
+  APP_ENV: {{ .Values.environment | quote }}
+  LOG_LEVEL: {{ .Values.logLevel | quote }}
+```
+
+**Volume Mount Pattern:**
+In deployment spec:
+```yaml
+volumes:
+  - name: config-volume
+    configMap:
+      name: config-name
+containers:
+  - volumeMounts:
+      - name: config-volume
+        mountPath: /config
+```
+
+**Environment Variables:**
+```yaml
+envFrom:
+  - configMapRef:
+      name: {{ include "mychart.fullname" . }}-env
+```
+
+**Verification:**
+```bash
+kubectl exec <pod> -- cat /config/config.json
+kubectl exec <pod> -- printenv | grep APP_
+```
+
+**Resources:**
+- [ConfigMaps](https://kubernetes.io/docs/concepts/configuration/configmap/)
+- [Configure Pod with ConfigMap](https://kubernetes.io/docs/tasks/configure-pod-container/configure-pod-configmap/)
+
+</details>
+
+---
+
+### Task 3 — Persistent Volumes (3 pts)
+
+**Objective:** Implement persistent storage for your application's visit counter.
+
+**Requirements:**
+
+1. **Create PersistentVolumeClaim**
+   - Add `templates/pvc.yaml` to your Helm chart
+   - Request appropriate storage size (e.g., 100Mi)
+   - Use `ReadWriteOnce` access mode
+   - Make storage class configurable via values
+
+2. **Mount PVC to Deployment**
+   - Add volume referencing the PVC
+   - Mount at your data directory (e.g., `/data`)
+   - Ensure your application writes visits file there
+
+3. **Verify Persistence**
+   - Deploy the application
+   - Access root endpoint multiple times
+   - Delete the pod (not the deployment)
+   - Verify the new pod has the same counter value
+
+4. **Test Data Survival**
+   - Check visits count before pod deletion
+   - Delete pod: `kubectl delete pod <pod-name>`
+   - Wait for new pod to start
+   - Verify visits count is preserved
+
+<details>
+<summary>💡 Hints</summary>
+
+**PVC Template:**
+```yaml
+apiVersion: v1
+kind: PersistentVolumeClaim
+metadata:
+  name: {{ include "mychart.fullname" . }}-data
+  labels:
+    {{- include "mychart.labels" . | nindent 4 }}
+spec:
+  accessModes:
+    - ReadWriteOnce
+  resources:
+    requests:
+      storage: {{ .Values.persistence.size }}
+  {{- if .Values.persistence.storageClass }}
+  storageClassName: {{ .Values.persistence.storageClass }}
+  {{- end }}
+```
+
+**Values.yaml:**
+```yaml
+persistence:
+  enabled: true
+  size: 100Mi
+  storageClass: ""  # Use default
+```
+
+**Mounting PVC:**
+```yaml
+volumes:
+  - name: data-volume
+    persistentVolumeClaim:
+      claimName: {{ include "mychart.fullname" . }}-data
+containers:
+  - volumeMounts:
+      - name: data-volume
+        mountPath: /data
+```
+
+**Minikube Storage:**
+Minikube provides a default storage class that provisions hostPath volumes automatically.
+
+**Verification Commands:**
+```bash
+kubectl get pvc
+kubectl describe pvc <pvc-name>
+kubectl exec <pod> -- cat /data/visits
+```
+
+**Resources:**
+- [Persistent Volumes](https://kubernetes.io/docs/concepts/storage/persistent-volumes/)
+- [Configure Pod with PVC](https://kubernetes.io/docs/tasks/configure-pod-container/configure-persistent-volume-storage/)
+
+</details>
+
+---
+
+### Task 4 — Documentation (2 pts)
+
+**Objective:** Document your ConfigMap and persistence implementation.
+
+**Create `k8s/CONFIGMAPS.md` with:**
+
+1. **Application Changes**
+   - Description of visits counter implementation
+   - New endpoint documentation
+   - Local testing evidence with Docker
+
+2. **ConfigMap Implementation**
+   - ConfigMap template structure
+   - `config.json` content
+   - How ConfigMap is mounted as file
+   - How ConfigMap provides environment variables
+   - Verification outputs
+
+3. **Persistent Volume**
+   - PVC configuration explanation
+   - Access modes and storage class discussion
+   - Volume mount configuration
+   - Persistence test evidence:
+     - Counter value before pod deletion
+     - Pod deletion command
+     - Counter value after new pod starts
+
+4. **ConfigMap vs Secret**
+   - When to use ConfigMap
+   - When to use Secret
+   - Key differences
+
+**Required Screenshots/Outputs:**
+- `kubectl get configmap,pvc` output
+- File content inside pod (`cat /config/config.json`)
+- Environment variables in pod
+- Persistence test (before/after pod restart)
+
+---
+
+## Bonus Task — ConfigMap Hot Reload (2.5 pts)
+
+**Objective:** Understand ConfigMap update behavior and implement configuration reloading.
+
+**Requirements:**
+
+1. **Test Default Update Behavior**
+   - Update ConfigMap content (e.g., via `kubectl edit configmap`)
+   - Observe when changes appear in the mounted file
+   - Document the delay (kubelet sync period)
+
+2. **Understand subPath Limitation**
+   - Research why `subPath` mounts don't receive updates
+   - Document when to use and avoid `subPath`
+
+3. **Implement Application Reload**
+   - Research approaches for configuration hot reload:
+     - Sidecar pattern (config reloader)
+     - Application file watching
+     - Pod restart via annotations
+   - Implement one approach and document it
+
+4. **Helm Upgrade Pattern**
+   - Use `helm.sh/resource-policy` or checksum annotations
+   - Trigger pod restart when ConfigMap changes
+   - Demonstrate the pattern
+
+<details>
+<summary>💡 Hints</summary>
+
+**Checksum Annotation Pattern:**
+```yaml
+spec:
+  template:
+    metadata:
+      annotations:
+        checksum/config: {{ include (print $.Template.BasePath "/configmap.yaml") . | sha256sum }}
+```
+
+This causes the deployment to update (and pods to restart) whenever the ConfigMap changes.
+
+**Config Reloader Sidecar:**
+Projects like `stakater/Reloader` automatically restart pods when ConfigMaps change.
+
+**Kubelet Sync Period:**
+By default, kubelet syncs ConfigMap changes every 60 seconds + cache TTL. Total delay can be up to a few minutes.
+
+**subPath Behavior:**
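+When using `subPath`, the file is bind-mounted directly into the container instead of going through the symlinked directory that kubelet swaps on update, so it never receives ConfigMap changes. Use full directory mounts for auto-updates.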
+
+**Resources:**
+- [ConfigMap Auto-Updates](https://kubernetes.io/docs/concepts/configuration/configmap/#mounted-configmaps-are-updated-automatically)
+- [Reloader](https://github.com/stakater/Reloader)
+
+</details>
+
+**Bonus Documentation:**
+- Update delay measurement
+- subPath limitation explanation
+- Chosen reload approach implementation
+- Evidence of configuration reload working
+
+---
+
+## Checklist
+
+### Task 1 — Application Persistence Upgrade (2 pts)
+- [ ] Visits counter implemented
+- [ ] `/visits` endpoint created
+- [ ] Counter persists in file
+- [ ] Docker Compose volume configured
+- [ ] Local testing successful
+- [ ] README updated
+
+### Task 2 — ConfigMaps (3 pts)
+- [ ] `files/config.json` created
+- [ ] ConfigMap template for file mounting
+- [ ] ConfigMap template for env vars
+- [ ] ConfigMap mounted as file in pod
+- [ ] Environment variables injected
+- [ ] Verification outputs collected
+
+### Task 3 — Persistent Volumes (3 pts)
+- [ ] PVC template created
+- [ ] PVC mounted to deployment
+- [ ] Visits file stored on PVC
+- [ ] Persistence tested (pod deletion)
+- [ ] Data survives pod restart
+
+### Task 4 — Documentation (2 pts)
+- [ ] `k8s/CONFIGMAPS.md` complete
+- [ ] Application changes documented
+- [ ] ConfigMap implementation documented
+- [ ] PVC implementation documented
+- [ ] All verification outputs included
+
+### Bonus — ConfigMap Hot Reload (2.5 pts)
+- [ ] Update delay tested
+- [ ] subPath limitation documented
+- [ ] Reload mechanism implemented
+- [ ] Documentation complete
+
+---
+
+## Rubric
+
+| Criteria | Points | Description |
+|----------|--------|-------------|
+| **App Upgrade** | 2 pts | Visits counter, persistence, /visits endpoint |
+| **ConfigMaps** | 3 pts | File mount, env vars, proper templating |
+| **Persistent Volumes** | 3 pts | PVC, mount, verified persistence |
+| **Documentation** | 2 pts | Complete CONFIGMAPS.md |
+| **Bonus** | 2.5 pts | Hot reload understanding and implementation |
+| **Total** | 12.5 pts | 10 pts required + 2.5 pts bonus |
+
+**Grading:**
+- **10/10:** Working persistence, proper ConfigMaps, verified data survival
+- **8-9/10:** ConfigMaps work, persistence mostly working
+- **6-7/10:** Basic ConfigMap mounting, persistence issues
+- **<6/10:** ConfigMaps not properly mounted, no persistence
+
+---
+
+## Resources
+
+<details>
+<summary>📚 Official Documentation</summary>
+
+- [ConfigMaps](https://kubernetes.io/docs/concepts/configuration/configmap/)
+- [Persistent Volumes](https://kubernetes.io/docs/concepts/storage/persistent-volumes/)
+- [Persistent Volume Claims](https://kubernetes.io/docs/concepts/storage/persistent-volumes/#persistentvolumeclaims)
+- [Storage Classes](https://kubernetes.io/docs/concepts/storage/storage-classes/)
+
+</details>
+
+<details>
+<summary>🎓 Tutorials</summary>
+
+- [Configure Pod with ConfigMap](https://kubernetes.io/docs/tasks/configure-pod-container/configure-pod-configmap/)
+- [Configure Pod with PVC](https://kubernetes.io/docs/tasks/configure-pod-container/configure-persistent-volume-storage/)
+- [Mounting ConfigMaps as Files](https://kubernetes.io/docs/concepts/configuration/configmap/#using-configmaps-as-files-from-a-pod)
+
+</details>
+
+<details>
+<summary>🛠️ Tools & Patterns</summary>
+
+- [Helm Files Function](https://helm.sh/docs/chart_template_guide/accessing_files/)
+- [Stakater Reloader](https://github.com/stakater/Reloader)
+- [Minikube Storage](https://minikube.sigs.k8s.io/docs/handbook/persistent_volumes/)
+
+</details>
+
+---
+
+## Looking Ahead
+
+- **Lab 13:** ArgoCD will deploy your configured Helm charts via GitOps
+- **Lab 14:** Progressive delivery with Argo Rollouts
+- **Lab 15:** StatefulSets for per-pod persistent storage
+- **Lab 16:** Monitoring your application configuration and storage
+
+---
+
+**Good luck!** 📦
+
+> **Remember:** ConfigMaps are for non-sensitive configuration data. Use Secrets (Lab 11) for sensitive data. Persistent Volumes ensure your data survives the ephemeral nature of pods.
diff --git a/labs/lab13.md b/labs/lab13.md
new file mode 100644
index 0000000000..21c6321d21
--- /dev/null
+++ b/labs/lab13.md
@@ -0,0 +1,594 @@
+# Lab 13 — GitOps with ArgoCD
+
+![difficulty](https://img.shields.io/badge/difficulty-intermediate-yellow)
+![topic](https://img.shields.io/badge/topic-GitOps-blue)
+![points](https://img.shields.io/badge/points-10%2B2.5-orange)
+![tech](https://img.shields.io/badge/tech-ArgoCD%202.13-informational)
+
+> Implement GitOps continuous deployment using ArgoCD for declarative, version-controlled Kubernetes deployments.
+
+## Overview
+
+GitOps is the practice of using Git as the single source of truth for declarative infrastructure and applications. ArgoCD is a declarative, GitOps continuous delivery tool for Kubernetes that automatically syncs your cluster state with your Git repository.
+
+**What You'll Learn:**
+- GitOps principles and benefits
+- ArgoCD installation and configuration
+- Application deployment via ArgoCD
+- Multi-environment deployment patterns
+- Auto-sync and self-healing mechanisms
+- Sync policies and strategies
+
+**Building On:** Your Helm chart from Labs 10-12 will be deployed and managed by ArgoCD.
+
+**Tech Stack:** ArgoCD 2.13+ | Kubernetes | Helm | GitOps
+
+---
+
+## Tasks
+
+### Task 1 — ArgoCD Installation & Setup (2 pts)
+
+**Objective:** Install ArgoCD and access the management interface.
+
+**Requirements:**
+
+1. **Install ArgoCD via Helm**
+   - Add the ArgoCD Helm repository
+   - Create a dedicated namespace for ArgoCD
+   - Install ArgoCD with appropriate configuration
+   - Wait for all components to be ready
+
+2. **Access ArgoCD UI**
+   - Set up port forwarding to the ArgoCD server
+   - Retrieve the initial admin password
+   - Log in to the ArgoCD web interface
+   - Explore the UI layout and features
+
+3. **Install ArgoCD CLI**
+   - Install the `argocd` CLI tool for your platform
+   - Log in via CLI
+   - Verify connection with basic commands
+
+<details>
+<summary>💡 Hints</summary>
+
+**Installation Commands:**
+```bash
+# Add Helm repo
+helm repo add argo https://argoproj.github.io/argo-helm
+helm repo update
+
+# Create namespace and install
+kubectl create namespace argocd
+helm install argocd argo/argo-cd --namespace argocd
+
+# Wait for pods
+kubectl wait --for=condition=ready pod -l app.kubernetes.io/name=argocd-server -n argocd --timeout=120s
+```
+
+**Accessing UI:**
+```bash
+# Port forward (keep running)
+kubectl port-forward svc/argocd-server -n argocd 8080:443
+
+# Get initial password
+kubectl -n argocd get secret argocd-initial-admin-secret -o jsonpath="{.data.password}" | base64 -d
+
+# Access at https://localhost:8080
+# Username: admin
+```
+
+**CLI Installation:**
+- **macOS:** `brew install argocd`
+- **Linux:** Download from GitHub releases
+- Check [ArgoCD CLI Installation](https://argo-cd.readthedocs.io/en/stable/cli_installation/)
+
+**CLI Login:**
+```bash
+argocd login localhost:8080 --insecure
+# Use admin and the password retrieved above
+```
+
+**Resources:**
+- [ArgoCD Getting Started](https://argo-cd.readthedocs.io/en/stable/getting_started/)
+- [ArgoCD Helm Chart](https://github.com/argoproj/argo-helm/tree/main/charts/argo-cd)
+
+</details>
+
+---
+
+### Task 2 — Application Deployment (3 pts)
+
+**Objective:** Deploy your application using ArgoCD's declarative Application resource.
+
+**Requirements:**
+
+1. **Create ArgoCD Application Manifest**
+   - Create `k8s/argocd/` directory
+   - Create `application.yaml` defining your app
+   - Specify:
+     - Source: Your Git repository and path to Helm chart
+     - Destination: Target cluster and namespace
+     - Sync policy: Manual initially
+
+2. **Deploy the Application**
+   - Apply the Application manifest
+   - Observe the application in ArgoCD UI
+   - Understand the sync status indicators
+
+3. **Perform Initial Sync**
+   - Trigger manual sync via UI or CLI
+   - Watch the deployment progress
+   - Verify all resources are created
+   - Access your application
+
+4. **Test GitOps Workflow**
+   - Make a change to your Helm chart (e.g., replica count)
+   - Commit and push to your repository
+   - Observe ArgoCD detecting the drift
+   - Sync the changes
+
+<details>
+<summary>💡 Hints</summary>
+
+**Application Manifest Structure:**
+```yaml
+apiVersion: argoproj.io/v1alpha1
+kind: Application
+metadata:
+  name: python-app
+  namespace: argocd
+spec:
+  project: default
+  source:
+    repoURL: https://github.com/<username>/<repo>.git
+    targetRevision: <branch>
+    path: <path-to-helm-chart>
+    helm:
+      valueFiles:
+        - values.yaml
+  destination:
+    server: https://kubernetes.default.svc
+    namespace: default
+  syncPolicy:
+    syncOptions:
+      - CreateNamespace=true
+```
+
+**Key Fields:**
+- `repoURL`: Your GitHub repository URL
+- `targetRevision`: Branch name (e.g., `main`, `lab13`)
+- `path`: Path to Helm chart within repo (e.g., `k8s/app-python`)
+- `destination.namespace`: Where to deploy
+
+**Apply and Sync:**
+```bash
+kubectl apply -f k8s/argocd/application.yaml
+
+# CLI sync
+argocd app sync python-app
+
+# Check status
+argocd app get python-app
+```
+
+**Sync Status:**
+- **Synced:** Cluster matches Git
+- **OutOfSync:** Cluster state differs from Git (unapplied commits or manual changes in the cluster)
+- **Unknown:** Unable to determine state
+- **Healthy/Degraded/Progressing:** Application health status (reported separately from sync status)
+
+**Resources:**
+- [ArgoCD Application Specification](https://argo-cd.readthedocs.io/en/stable/operator-manual/declarative-setup/)
+- [Sync Options](https://argo-cd.readthedocs.io/en/stable/user-guide/sync-options/)
+
+</details>
+
+---
+
+### Task 3 — Multi-Environment Deployment (3 pts)
+
+**Objective:** Deploy your application to multiple environments (dev/prod) with different configurations.
+
+**Requirements:**
+
+1. **Create Namespaces**
+   - Create `dev` and `prod` namespaces
+   - These will host separate instances of your app
+
+2. **Create Environment-Specific Applications**
+   - Create `application-dev.yaml` using `values-dev.yaml`
+   - Create `application-prod.yaml` using `values-prod.yaml`
+   - Different replica counts, resource limits per environment
+
+3. **Enable Auto-Sync for Dev**
+   - Configure automatic sync for the dev environment
+   - Add `automated` sync policy
+   - Enable `selfHeal` and `prune` options
+
+4. **Keep Prod Manual**
+   - Production remains manual sync
+   - Understand why this is a best practice
+   - Document the deployment workflow difference
+
+5. **Verify Both Environments**
+   - Both apps visible in ArgoCD UI
+   - Different configurations applied
+   - Resources deployed to correct namespaces
+
+<details>
+<summary>💡 Hints</summary>
+
+**Create Namespaces:**
+```bash
+kubectl create namespace dev
+kubectl create namespace prod
+```
+
+**Dev Application with Auto-Sync:**
+```yaml
+apiVersion: argoproj.io/v1alpha1
+kind: Application
+metadata:
+  name: python-app-dev
+  namespace: argocd
+spec:
+  project: default
+  source:
+    repoURL: https://github.com/<username>/<repo>.git
+    targetRevision: <branch>
+    path: <path-to-helm-chart>
+    helm:
+      valueFiles:
+        - values-dev.yaml
+  destination:
+    server: https://kubernetes.default.svc
+    namespace: dev
+  syncPolicy:
+    automated:
+      prune: true
+      selfHeal: true
+    syncOptions:
+      - CreateNamespace=true
+```
+
+**Prod Application (Manual):**
+```yaml
+# Similar but without automated sync policy
+syncPolicy:
+  syncOptions:
+    - CreateNamespace=true
+  # No automated block = manual sync
+```
+
+**Sync Policy Options:**
+- `automated`: Enable auto-sync
+- `prune`: Delete resources removed from Git
+- `selfHeal`: Revert manual cluster changes
+- Without `automated`: Manual sync required
+
+**Why Manual for Prod?**
+- Change review before deployment
+- Controlled release timing
+- Compliance requirements
+- Rollback planning
+
+**Verification:**
+```bash
+kubectl get pods -n dev
+kubectl get pods -n prod
+argocd app list
+```
+
+</details>
+
+---
+
+### Task 4 — Self-Healing & Sync Policies (2 pts)
+
+**Objective:** Test and understand ArgoCD's self-healing and drift detection capabilities.
+
+**Requirements:**
+
+1. **Test Self-Healing (Dev Environment)**
+   - Manually scale the deployment:
+     ```bash
+     kubectl scale deployment <name> -n dev --replicas=5
+     ```
+   - Observe ArgoCD detecting the drift
+   - Watch it automatically revert to Git-defined state
+   - Document the behavior with timestamps
+
+2. **Test Pod Deletion**
+   - Delete a pod in dev namespace
+   - Observe Kubernetes recreating the pod
+   - Note: This is Kubernetes behavior, not ArgoCD
+   - Understand the difference between:
+     - Kubernetes self-healing (pod recreation)
+     - ArgoCD self-healing (configuration drift)
+
+3. **Test Configuration Drift**
+   - Manually edit a resource (e.g., add a label)
+   - Observe ArgoCD diff view
+   - Watch self-heal revert the change
+
+4. **Document Sync Behavior**
+   - Explain when ArgoCD syncs vs when Kubernetes heals
+   - What triggers ArgoCD sync?
+   - What is the sync interval?
+
+<details>
+<summary>💡 Hints</summary>
+
+**Self-Healing Test:**
+```bash
+# Scale manually
+kubectl scale deployment python-app-dev -n dev --replicas=5
+
+# Watch ArgoCD revert (if selfHeal enabled)
+kubectl get pods -n dev -w
+
+# Check ArgoCD status
+argocd app get python-app-dev
+```
+
+**View Drift:**
+```bash
+argocd app diff python-app-dev
+```
+
+**Pod Deletion Test:**
+```bash
+# Delete the app's pods (the label selector matches all of them; use a pod name to delete just one)
+kubectl delete pod -n dev -l app.kubernetes.io/name=python-app
+
+# Kubernetes recreates it immediately (ReplicaSet controller)
+kubectl get pods -n dev -w
+```
+
+**Key Difference:**
+- **Kubernetes Self-Healing:** ReplicaSet/Deployment ensures desired pod count
+- **ArgoCD Self-Healing:** Reverts cluster state to match Git state
+
+**Sync Interval:**
+ArgoCD polls Git every 3 minutes by default. You can also:
+- Use webhooks for immediate sync
+- Manually trigger sync
+- Configure different intervals
+
+**Resources:**
+- [Automated Sync Policy](https://argo-cd.readthedocs.io/en/stable/user-guide/auto_sync/)
+- [Self Heal](https://argo-cd.readthedocs.io/en/stable/user-guide/auto_sync/#automatic-self-healing)
+
+</details>
+
+**Documentation Required in `k8s/ARGOCD.md`:**
+
+1. **ArgoCD Setup**
+   - Installation verification
+   - UI access method
+   - CLI configuration
+
+2. **Application Configuration**
+   - Application manifests
+   - Source and destination configuration
+   - Values file selection
+
+3. **Multi-Environment**
+   - Dev vs Prod configuration differences
+   - Sync policy differences and rationale
+   - Namespace separation
+
+4. **Self-Healing Evidence**
+   - Manual scale test with before/after
+   - Pod deletion test
+   - Configuration drift test
+   - Explanation of behaviors
+
+5. **Screenshots**
+   - ArgoCD UI showing both applications
+   - Sync status
+   - Application details view
+
+---
+
+## Bonus Task — ApplicationSet (2.5 pts)
+
+**Objective:** Use ApplicationSet to generate multiple applications from a single template.
+
+**Requirements:**
+
+1. **Understand ApplicationSet**
+   - Research ApplicationSet generators
+   - Understand use cases (multi-cluster, multi-tenant, mono-repo)
+
+2. **Implement List Generator**
+   - Create an ApplicationSet that generates both dev and prod apps
+   - Use the List generator to define environment-specific parameters
+   - Replace individual Application manifests
+
+3. **Implement Git Directory Generator (Optional)**
+   - If you have multiple apps in your repo
+   - Use Git directory generator to auto-discover apps
+
+4. **Document the Pattern**
+   - Benefits of ApplicationSet over individual Applications
+   - When to use which generator type
+   - Scaling considerations
+
+<details>
+<summary>💡 Hints</summary>
+
+**ApplicationSet with List Generator:**
+```yaml
+apiVersion: argoproj.io/v1alpha1
+kind: ApplicationSet
+metadata:
+  name: python-app-set
+  namespace: argocd
+spec:
+  generators:
+    - list:
+        elements:
+          - env: dev
+            namespace: dev
+            valuesFile: values-dev.yaml
+            autoSync: true
+          - env: prod
+            namespace: prod
+            valuesFile: values-prod.yaml
+            autoSync: false
+  template:
+    metadata:
+      name: 'python-app-{{env}}'
+    spec:
+      project: default
+      source:
+        repoURL: https://github.com/<username>/<repo>.git
+        targetRevision: <branch>
+        path: <path-to-helm-chart>
+        helm:
+          valueFiles:
+            - '{{valuesFile}}'
+      destination:
+        server: https://kubernetes.default.svc
+        namespace: '{{namespace}}'
+      syncPolicy:
+        # Conditional sync policy based on env
+        # Note: This requires templating tricks or separate ApplicationSets
+```
+
+**Git Directory Generator:**
+```yaml
+generators:
+  - git:
+      repoURL: https://github.com/<username>/<repo>.git
+      revision: HEAD
+      directories:
+        - path: k8s/*
+```
+
+**Generators Available:**
+- List: Explicit list of parameters
+- Cluster: Multi-cluster deployments
+- Git: Based on Git files/directories
+- Matrix: Combine multiple generators
+- Merge: Merge generator outputs
+
+**Resources:**
+- [ApplicationSet Documentation](https://argo-cd.readthedocs.io/en/stable/user-guide/application-set/)
+- [Generators](https://argo-cd.readthedocs.io/en/stable/operator-manual/applicationset/Generators/)
+
+</details>
+
+**Bonus Documentation:**
+- ApplicationSet manifest
+- Generator configuration explanation
+- Generated Applications screenshot
+- Comparison with individual Applications
+
+---
+
+## Checklist
+
+### Task 1 — ArgoCD Installation & Setup (2 pts)
+- [ ] ArgoCD installed via Helm
+- [ ] All pods running in argocd namespace
+- [ ] UI accessible via port-forward
+- [ ] Admin password retrieved
+- [ ] CLI installed and logged in
+
+### Task 2 — Application Deployment (3 pts)
+- [ ] `k8s/argocd/` directory created
+- [ ] Application manifest created
+- [ ] Application visible in ArgoCD UI
+- [ ] Initial sync completed
+- [ ] App accessible and working
+- [ ] GitOps workflow tested
+
+### Task 3 — Multi-Environment Deployment (3 pts)
+- [ ] Dev and prod namespaces created
+- [ ] Dev application with auto-sync
+- [ ] Prod application with manual sync
+- [ ] Different configurations per environment
+- [ ] Both apps deployed and verified
+
+### Task 4 — Self-Healing & Sync Policies (2 pts)
+- [ ] Manual scale test performed
+- [ ] Self-healing observed
+- [ ] Pod deletion test performed
+- [ ] Configuration drift test done
+- [ ] `k8s/ARGOCD.md` complete
+
+### Bonus — ApplicationSet (2.5 pts)
+- [ ] ApplicationSet manifest created
+- [ ] Multiple apps generated from template
+- [ ] Generator configuration documented
+- [ ] Benefits documented
+
+---
+
+## Rubric
+
+| Criteria | Points | Description |
+|----------|--------|-------------|
+| **Installation** | 2 pts | ArgoCD running, UI/CLI accessible |
+| **App Deployment** | 3 pts | Application manifest, sync working |
+| **Multi-Environment** | 3 pts | Dev/prod with different configs |
+| **Self-Healing** | 2 pts | Tests performed, documented |
+| **Bonus** | 2.5 pts | ApplicationSet implementation |
+| **Total** | 12.5 pts | 10 pts required + 2.5 pts bonus |
+
+**Grading:**
+- **10/10:** Full GitOps workflow, multi-env, self-healing documented
+- **8-9/10:** ArgoCD works, minor issues with multi-env or docs
+- **6-7/10:** Basic app deployment, missing multi-env or self-healing
+- **<6/10:** ArgoCD not properly configured, apps not syncing
+
+---
+
+## Resources
+
+<details>
+<summary>📚 Official Documentation</summary>
+
+- [ArgoCD Documentation](https://argo-cd.readthedocs.io/)
+- [ArgoCD Operator Manual](https://argo-cd.readthedocs.io/en/stable/operator-manual/)
+- [Application CRD](https://argo-cd.readthedocs.io/en/stable/operator-manual/declarative-setup/)
+- [Sync Policies](https://argo-cd.readthedocs.io/en/stable/user-guide/auto_sync/)
+
+</details>
+
+<details>
+<summary>🎓 GitOps Concepts</summary>
+
+- [GitOps Principles](https://opengitops.dev/)
+- [GitOps Working Group](https://github.com/gitops-working-group/gitops-working-group)
+- [ArgoCD Best Practices](https://argo-cd.readthedocs.io/en/stable/user-guide/best_practices/)
+
+</details>
+
+<details>
+<summary>🛠️ Advanced Topics</summary>
+
+- [ApplicationSet](https://argo-cd.readthedocs.io/en/stable/user-guide/application-set/)
+- [Sync Waves](https://argo-cd.readthedocs.io/en/stable/user-guide/sync-waves/)
+- [Resource Hooks](https://argo-cd.readthedocs.io/en/stable/user-guide/resource_hooks/)
+- [Notifications](https://argo-cd.readthedocs.io/en/stable/operator-manual/notifications/)
+
+</details>
+
+---
+
+## Looking Ahead
+
+- **Lab 14:** Progressive delivery with Argo Rollouts
+- **Lab 15:** StatefulSets for stateful applications
+- **Lab 16:** Monitoring your GitOps deployments
+
+---
+
+**Good luck!** 🔄
+
+> **Remember:** GitOps means Git is the source of truth. Any changes should go through Git, not direct `kubectl` commands. ArgoCD ensures your cluster always matches what's in Git.
diff --git a/labs/lab14.md b/labs/lab14.md
new file mode 100644
index 0000000000..6cc6eaa347
--- /dev/null
+++ b/labs/lab14.md
@@ -0,0 +1,453 @@
+# Lab 14 — Progressive Delivery with Argo Rollouts
+
+![difficulty](https://img.shields.io/badge/difficulty-intermediate-yellow)
+![topic](https://img.shields.io/badge/topic-Progressive%20Delivery-blue)
+![points](https://img.shields.io/badge/points-10%2B2.5-orange)
+![tech](https://img.shields.io/badge/tech-Argo%20Rollouts-informational)
+
+> Implement canary and blue-green deployment strategies for safe, automated releases with traffic shifting and automatic rollback.
+
+## Overview
+
+Progressive delivery extends continuous delivery by gradually rolling out changes to a subset of users before full deployment. Argo Rollouts provides advanced deployment capabilities including canary releases, blue-green deployments, and automated rollbacks based on metrics.
+
+**What You'll Learn:**
+- Canary deployment strategy with traffic shifting
+- Blue-green deployment with instant rollback
+- Argo Rollouts Dashboard for visualization
+- Metrics-based automated promotion/rollback
+- Integration with existing Kubernetes services
+
+**Building On:** The Deployment in your Helm chart (deployed via ArgoCD in Lab 13) will be converted to a Rollout.
+
+**Tech Stack:** Argo Rollouts 1.7+ | Kubernetes | Prometheus (optional for analysis)
+
+---
+
+## Tasks
+
+### Task 1 — Argo Rollouts Fundamentals (2 pts)
+
+**Objective:** Install Argo Rollouts and understand the Rollout CRD.
+
+**Requirements:**
+
+1. **Install Argo Rollouts Controller**
+   - Install via kubectl or Helm
+   - Verify controller is running
+   - Install kubectl plugin for CLI management
+
+2. **Install Argo Rollouts Dashboard**
+   - Deploy the dashboard for visualization
+   - Access via port-forward
+   - Explore the UI
+
+3. **Understand Rollout vs Deployment**
+   - Compare Rollout CRD with Deployment
+   - Identify additional fields for progressive delivery
+   - Document key differences
+
+<details>
+<summary>💡 Hints</summary>
+
+**Installation:**
+```bash
+# Install controller
+kubectl create namespace argo-rollouts
+kubectl apply -n argo-rollouts -f https://github.com/argoproj/argo-rollouts/releases/latest/download/install.yaml
+
+# Install kubectl plugin
+# macOS
+brew install argoproj/tap/kubectl-argo-rollouts
+
+# Linux
+curl -LO https://github.com/argoproj/argo-rollouts/releases/latest/download/kubectl-argo-rollouts-linux-amd64
+chmod +x kubectl-argo-rollouts-linux-amd64
+sudo mv kubectl-argo-rollouts-linux-amd64 /usr/local/bin/kubectl-argo-rollouts
+
+# Verify
+kubectl argo rollouts version
+```
+
+**Dashboard:**
+```bash
+# Install dashboard
+kubectl apply -n argo-rollouts -f https://github.com/argoproj/argo-rollouts/releases/latest/download/dashboard-install.yaml
+
+# Access
+kubectl port-forward svc/argo-rollouts-dashboard -n argo-rollouts 3100:3100
+# Open http://localhost:3100
+```
+
+**Rollout vs Deployment:**
+- Rollout has `strategy` field with `canary` or `blueGreen` options
+- Supports traffic management, analysis, and automated rollback
+- Otherwise identical structure to Deployment
+
+**Resources:**
+- [Argo Rollouts Installation](https://argoproj.github.io/argo-rollouts/installation/)
+- [Rollout Specification](https://argoproj.github.io/argo-rollouts/features/specification/)
+
+</details>
+
+---
+
+### Task 2 — Canary Deployment (3 pts)
+
+**Objective:** Implement canary deployment strategy with gradual traffic shifting.
+
+**Requirements:**
+
+1. **Convert Deployment to Rollout**
+   - Create `templates/rollout.yaml` in your Helm chart
+   - Change `kind: Deployment` to `kind: Rollout`
+   - Add canary strategy configuration
+
+2. **Configure Canary Steps**
+   - Implement progressive traffic shifting:
+     - 20% → pause (manual promotion)
+     - 40% → pause 30 seconds
+     - 60% → pause 30 seconds
+     - 80% → pause 30 seconds
+     - 100%
+
+3. **Deploy and Test**
+   - Install the Rollout
+   - Make a change (e.g., update image tag or env var)
+   - Watch traffic shifting in dashboard
+   - Manually promote through first step
+   - Observe automatic progression
+
+4. **Test Rollback**
+   - During a rollout, abort it
+   - Observe traffic shifting back to stable version
+   - Verify instant rollback capability
+
+<details>
+<summary>💡 Hints</summary>
+
+**Rollout with Canary Strategy:**
+```yaml
+apiVersion: argoproj.io/v1alpha1
+kind: Rollout
+metadata:
+  name: {{ include "mychart.fullname" . }}
+spec:
+  replicas: {{ .Values.replicaCount }}
+  selector:
+    matchLabels:
+      {{- include "mychart.selectorLabels" . | nindent 6 }}
+  template:
+    # Same as Deployment pod template
+    metadata:
+      labels:
+        {{- include "mychart.selectorLabels" . | nindent 8 }}
+    spec:
+      containers:
+        - name: {{ .Chart.Name }}
+          image: "{{ .Values.image.repository }}:{{ .Values.image.tag }}"
+          # ... rest of container spec
+  strategy:
+    canary:
+      steps:
+        - setWeight: 20
+        - pause: {}  # Manual promotion required
+        - setWeight: 40
+        - pause: { duration: 30s }
+        - setWeight: 60
+        - pause: { duration: 30s }
+        - setWeight: 80
+        - pause: { duration: 30s }
+        - setWeight: 100
+```
+
+**CLI Commands:**
+```bash
+# Watch rollout status
+kubectl argo rollouts get rollout <name> -w
+
+# Promote to next step
+kubectl argo rollouts promote <name>
+
+# Abort rollout
+kubectl argo rollouts abort <name>
+
+# Retry aborted rollout
+kubectl argo rollouts retry rollout <name>
+```
+
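+**Important:** Your existing Service still works - it selects both stable and canary pods. Without a traffic router (e.g., NGINX Ingress or Istio), Argo Rollouts approximates each `setWeight` percentage by adjusting the ratio of canary to stable pods behind that Service.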
+
+</details>
+
+---
+
+### Task 3 — Blue-Green Deployment (3 pts)
+
+**Objective:** Implement blue-green deployment with preview environment.
+
+**Requirements:**
+
+1. **Create Blue-Green Rollout**
+   - Create a separate values file or modify existing
+   - Configure `blueGreen` strategy instead of `canary`
+   - Set up active and preview services
+
+2. **Configure Services**
+   - Active service: serves production traffic
+   - Preview service: serves new version for testing
+   - Understand `autoPromotionEnabled` setting
+
+3. **Test Blue-Green Flow**
+   - Deploy initial version (blue)
+   - Update image/config (triggers green deployment)
+   - Access preview service to test new version
+   - Promote green to active
+   - Verify instant switch
+
+4. **Test Instant Rollback**
+   - After promotion, trigger rollback
+   - Observe instant traffic switch back
+   - Document the speed difference vs canary
+
+<details>
+<summary>💡 Hints</summary>
+
+**Blue-Green Strategy:**
+```yaml
+spec:
+  strategy:
+    blueGreen:
+      activeService: {{ include "mychart.fullname" . }}
+      previewService: {{ include "mychart.fullname" . }}-preview
+      autoPromotionEnabled: false  # Manual promotion
+      # autoPromotionSeconds: 30  # Or auto-promote after 30s
+```
+
+**Preview Service:**
+```yaml
+apiVersion: v1
+kind: Service
+metadata:
+  name: {{ include "mychart.fullname" . }}-preview
+spec:
+  selector:
+    {{- include "mychart.selectorLabels" . | nindent 4 }}
+  ports:
+    - port: {{ .Values.service.port }}
+      targetPort: {{ .Values.service.targetPort }}
+```
+
+**Testing:**
+```bash
+# Access active (production)
+kubectl port-forward svc/myapp 8080:80
+
+# Access preview (new version)
+kubectl port-forward svc/myapp-preview 8081:80
+
+# Compare both, then promote
+kubectl argo rollouts promote myapp
+```
+
+**Blue-Green vs Canary:**
+- Blue-Green: Instant switch, all-or-nothing
+- Canary: Gradual traffic shift, percentage-based
+- Blue-Green: Need 2x resources during deployment
+- Canary: Shared resources, mixed traffic
+
+</details>
+
+---
+
+### Task 4 — Documentation (2 pts)
+
+**Objective:** Document your progressive delivery implementation.
+
+**Create `k8s/ROLLOUTS.md` with:**
+
+1. **Argo Rollouts Setup**
+   - Installation verification
+   - Dashboard access
+
+2. **Canary Deployment**
+   - Strategy configuration explained
+   - Step-by-step rollout progression (screenshots from dashboard)
+   - Promotion and abort demonstration
+
+3. **Blue-Green Deployment**
+   - Strategy configuration explained
+   - Preview vs active service
+   - Promotion process
+
+4. **Strategy Comparison**
+   - When to use canary vs blue-green
+   - Pros and cons of each
+   - Your recommendation for different scenarios
+
+5. **CLI Commands Reference**
+   - Useful commands you used
+   - Monitoring and troubleshooting
+
+---
+
+## Bonus Task — Automated Analysis (2.5 pts)
+
+**Objective:** Integrate metrics-based analysis for automated promotion/rollback.
+
+**Requirements:**
+
+1. **Create AnalysisTemplate**
+   - Define success criteria based on metrics
+   - Use Prometheus or web analysis provider
+   - Set failure thresholds
+
+2. **Integrate with Canary**
+   - Add analysis step to canary strategy
+   - Configure automatic rollback on failure
+   - Test with intentional failure
+
+3. **Document Analysis**
+   - AnalysisTemplate configuration
+   - How metrics determine success/failure
+   - Demonstration of auto-rollback
+
+<details>
+<summary>💡 Hints</summary>
+
+**Simple Web Analysis (no Prometheus):**
+```yaml
+apiVersion: argoproj.io/v1alpha1
+kind: AnalysisTemplate
+metadata:
+  name: success-rate
+spec:
+  metrics:
+    - name: webcheck
+      provider:
+        web:
+          url: http://{{ include "mychart.fullname" . }}.default.svc/health
+          jsonPath: "{$.status}"
+      successCondition: result == "ok"
+      interval: 10s
+      count: 3
+      failureLimit: 1
+```
+
+**Canary with Analysis:**
+```yaml
+strategy:
+  canary:
+    steps:
+      - setWeight: 20
+      - analysis:
+          templates:
+            - templateName: success-rate
+      - setWeight: 50
+      - pause: { duration: 30s }
+      - setWeight: 100
+```
+
+**Prometheus Analysis (if Lab 16 monitoring is set up):**
+```yaml
+metrics:
+  - name: error-rate
+    provider:
+      prometheus:
+        address: http://prometheus.monitoring:9090
+        query: |
+          sum(rate(http_requests_total{status=~"5.*"}[1m])) /
+          sum(rate(http_requests_total[1m]))
+    successCondition: result[0] < 0.05
+    interval: 30s
+```
+
+**Resources:**
+- [Analysis & Progressive Delivery](https://argoproj.github.io/argo-rollouts/features/analysis/)
+- [AnalysisTemplate Specification](https://argoproj.github.io/argo-rollouts/analysis/overview/)
+
+</details>
+
+---
+
+## Checklist
+
+### Task 1 — Argo Rollouts Fundamentals (2 pts)
+- [ ] Controller installed and running
+- [ ] kubectl plugin installed
+- [ ] Dashboard accessible
+- [ ] Rollout vs Deployment differences documented
+
+### Task 2 — Canary Deployment (3 pts)
+- [ ] Deployment converted to Rollout
+- [ ] Canary steps configured
+- [ ] Traffic shifting observed in dashboard
+- [ ] Manual promotion tested
+- [ ] Rollback tested
+
+### Task 3 — Blue-Green Deployment (3 pts)
+- [ ] Blue-green strategy configured
+- [ ] Preview service created
+- [ ] Preview environment tested
+- [ ] Promotion to active tested
+- [ ] Instant rollback verified
+
+### Task 4 — Documentation (2 pts)
+- [ ] `k8s/ROLLOUTS.md` complete
+- [ ] Both strategies documented
+- [ ] Screenshots included
+- [ ] Comparison analysis provided
+
+### Bonus — Automated Analysis (2.5 pts)
+- [ ] AnalysisTemplate created
+- [ ] Integrated with canary strategy
+- [ ] Auto-rollback demonstrated
+- [ ] Documentation complete
+
+---
+
+## Rubric
+
+| Criteria | Points | Description |
+|----------|--------|-------------|
+| **Fundamentals** | 2 pts | Installation, dashboard, concepts |
+| **Canary** | 3 pts | Working canary with traffic shifting |
+| **Blue-Green** | 3 pts | Working blue-green with preview |
+| **Documentation** | 2 pts | Complete ROLLOUTS.md |
+| **Bonus** | 2.5 pts | Automated analysis integration |
+| **Total** | 12.5 pts | 10 pts required + 2.5 pts bonus |
+
+---
+
+## Resources
+
+<details>
+<summary>📚 Official Documentation</summary>
+
+- [Argo Rollouts Documentation](https://argoproj.github.io/argo-rollouts/)
+- [Canary Strategy](https://argoproj.github.io/argo-rollouts/features/canary/)
+- [Blue-Green Strategy](https://argoproj.github.io/argo-rollouts/features/bluegreen/)
+- [Analysis & Progressive Delivery](https://argoproj.github.io/argo-rollouts/features/analysis/)
+
+</details>
+
+<details>
+<summary>🎓 Tutorials</summary>
+
+- [Getting Started Guide](https://argoproj.github.io/argo-rollouts/getting-started/)
+- [Canary with Traffic Management](https://argoproj.github.io/argo-rollouts/getting-started/nginx/)
+
+</details>
+
+---
+
+## Looking Ahead
+
+- **Lab 15:** StatefulSets for stateful applications (different use case than Rollouts)
+- **Lab 16:** Monitoring your rollouts with Prometheus/Grafana
+
+---
+
+**Good luck!** 🚀
+
+> **Remember:** Rollouts replace Deployments when you need progressive delivery. For stateful applications (Lab 15), you'll still use StatefulSets - they serve different purposes.
diff --git a/labs/lab15.md b/labs/lab15.md
new file mode 100644
index 0000000000..cbc416b25e
--- /dev/null
+++ b/labs/lab15.md
@@ -0,0 +1,304 @@
+# Lab 15 — StatefulSets & Persistent Storage
+
+![difficulty](https://img.shields.io/badge/difficulty-advanced-red)
+![topic](https://img.shields.io/badge/topic-StatefulSets-blue)
+![points](https://img.shields.io/badge/points-10%2B2.5-orange)
+![tech](https://img.shields.io/badge/tech-StatefulSet%20%7C%20PVC-informational)
+
+> Manage stateful applications in Kubernetes with stable network identities and persistent per-pod storage.
+
+## Overview
+
+While Deployments and Rollouts are perfect for stateless applications, many real-world applications need stable identities and persistent storage per instance. StatefulSets provide guarantees about ordering, uniqueness, and storage that other controllers cannot offer.
+
+**What You'll Learn:**
+- StatefulSet vs Deployment: when to use which
+- Stable network identities and pod naming
+- VolumeClaimTemplates for per-pod storage
+- Headless Services for direct pod access
+- Ordered vs parallel pod management
+
+**Building On:** Your Helm chart with visits counter from Lab 12. Note: StatefulSets serve a different purpose than Rollouts (Lab 14) - use Rollouts for progressive delivery of stateless apps, StatefulSets for stateful apps.
+
+**Tech Stack:** StatefulSets | Headless Services | VolumeClaimTemplates | Persistent Volumes
+
+---
+
+## Tasks
+
+### Task 1 — StatefulSet Concepts (2 pts)
+
+**Objective:** Understand when and why to use StatefulSets.
+
+**Requirements:**
+
+1. **Study StatefulSet Guarantees**
+   - Stable, unique network identifiers
+   - Stable, persistent storage
+   - Ordered, graceful deployment and scaling
+
+2. **Compare with Deployments**
+   - Document key differences
+   - When to use Deployment vs StatefulSet
+   - Examples of stateful workloads
+
+3. **Understand Headless Services**
+   - What is a headless service (`clusterIP: None`)?
+   - How DNS works with StatefulSets
+
+<details>
+<summary>💡 Hints</summary>
+
+**StatefulSet Use Cases:**
+- Databases (MySQL, PostgreSQL, MongoDB)
+- Message queues (Kafka, RabbitMQ)
+- Distributed systems (Elasticsearch, Cassandra)
+
+**Key Differences:**
+
+| Feature | Deployment | StatefulSet |
+|---------|------------|-------------|
+| Pod Names | Random suffix | Ordered index (pod-0, pod-1) |
+| Storage | Shared PVC | Per-pod PVC via templates |
+| Scaling | Any order | Ordered (0→1→2) |
+| Network ID | Random | Stable DNS name |
+
+**Headless Service:**
+A Service with `clusterIP: None` creates DNS records for each pod:
+- `pod-0.service-name.namespace.svc.cluster.local`
+
+**Resources:**
+- [StatefulSet Basics](https://kubernetes.io/docs/tutorials/stateful-application/basic-stateful-set/)
+- [StatefulSet Concepts](https://kubernetes.io/docs/concepts/workloads/controllers/statefulset/)
+
+</details>
+
+---
+
+### Task 2 — Convert Deployment to StatefulSet (3 pts)
+
+**Objective:** Transform your Helm chart to use a StatefulSet with per-pod storage.
+
+**Requirements:**
+
+1. **Create StatefulSet Template**
+   - Create `statefulset.yaml` (keep `rollout.yaml` for reference)
+   - Add `serviceName` field pointing to headless service
+   - Configure `volumeClaimTemplates` for per-pod storage
+
+2. **Create Headless Service**
+   - Create a new service with `clusterIP: None`
+   - Keep your existing service for external access
+
+3. **Configure VolumeClaimTemplates**
+   - Each pod gets its own PVC automatically
+   - Configure storage class and size via values
+
+4. **Deploy and Verify**
+   - Pods named with ordinal suffixes (app-0, app-1, app-2)
+   - Each pod has its own PVC
+
+<details>
+<summary>💡 Hints</summary>
+
+**StatefulSet Structure:**
+```yaml
+apiVersion: apps/v1
+kind: StatefulSet
+metadata:
+  name: {{ include "mychart.fullname" . }}
+spec:
+  serviceName: {{ include "mychart.fullname" . }}-headless
+  replicas: {{ .Values.replicaCount }}
+  selector:
+    matchLabels:
+      {{- include "mychart.selectorLabels" . | nindent 6 }}
+  template:
+    # Same as Deployment pod template
+  volumeClaimTemplates:
+    - metadata:
+        name: data
+      spec:
+        accessModes: [ "ReadWriteOnce" ]
+        resources:
+          requests:
+            storage: {{ .Values.persistence.size }}
+```
+
+**Headless Service:**
+```yaml
+apiVersion: v1
+kind: Service
+metadata:
+  name: {{ include "mychart.fullname" . }}-headless
+spec:
+  clusterIP: None
+  selector:
+    {{- include "mychart.selectorLabels" . | nindent 4 }}
+  ports:
+    - port: {{ .Values.service.port }}
+```
+
+**Verification:**
+```bash
+kubectl get statefulset
+kubectl get pods
+kubectl get pvc
+```
+
+</details>
+
+---
+
+### Task 3 — Headless Service & Pod Identity (3 pts)
+
+**Objective:** Verify stable network identities and per-pod storage isolation.
+
+**Requirements:**
+
+1. **Test DNS Resolution**
+   - Exec into a pod
+   - Resolve other pods via DNS
+   - Document the DNS naming pattern
+
+2. **Test Per-Pod Storage**
+   - Access your app through each pod
+   - Verify each pod maintains its own visit count
+   - Demonstrate isolation between pods
+
+3. **Test Persistence**
+   - Note visit counts for each pod
+   - Delete one pod (not the StatefulSet)
+   - Verify the visit count is preserved after restart
+
+<details>
+<summary>💡 Hints</summary>
+
+**DNS Resolution Test:**
+```bash
+kubectl exec -it <statefulset>-0 -- /bin/sh
+nslookup <statefulset>-1.<headless-service>
+```
+
+**Per-Pod Visit Count Test:**
+```bash
+kubectl port-forward pod/<statefulset>-0 8080:8000 &
+kubectl port-forward pod/<statefulset>-1 8081:8000 &
+curl localhost:8080/visits
+curl localhost:8081/visits
+```
+
+**Persistence Test:**
+```bash
+kubectl exec <statefulset>-0 -- cat /data/visits
+kubectl delete pod <statefulset>-0
+# Wait for restart
+kubectl exec <statefulset>-0 -- cat /data/visits
+```
+
+</details>
+
+---
+
+### Task 4 — Documentation (2 pts)
+
+**Objective:** Document your StatefulSet implementation.
+
+**Create `k8s/STATEFULSET.md` with:**
+
+1. **StatefulSet Overview** - Why StatefulSet, differences from Deployment
+2. **Resource Verification** - Output of `kubectl get po,sts,svc,pvc`
+3. **Network Identity** - DNS resolution outputs
+4. **Per-Pod Storage Evidence** - Different visit counts per pod
+5. **Persistence Test** - Data survives pod deletion
+
+---
+
+## Bonus Task — Update Strategies (2.5 pts)
+
+**Objective:** Explore StatefulSet update strategies.
+
+**Requirements:**
+
+1. **Implement Partitioned Rolling Update**
+   - Configure `updateStrategy` with `partition`
+   - Update only pods with ordinal >= partition value
+
+2. **Test OnDelete Strategy**
+   - Pods only update when manually deleted
+   - Document use cases
+
+<details>
+<summary>💡 Hints</summary>
+
+**Rolling Update with Partition:**
+```yaml
+spec:
+  updateStrategy:
+    type: RollingUpdate
+    rollingUpdate:
+      partition: 2
+```
+
+**OnDelete Strategy:**
+```yaml
+spec:
+  updateStrategy:
+    type: OnDelete
+```
+
+**Resources:**
+- [StatefulSet Update Strategies](https://kubernetes.io/docs/concepts/workloads/controllers/statefulset/#update-strategies)
+
+</details>
+
+---
+
+## Checklist
+
+- [ ] StatefulSet guarantees documented
+- [ ] `statefulset.yaml` created with volumeClaimTemplates
+- [ ] Headless service created
+- [ ] Per-pod PVCs verified
+- [ ] DNS resolution tested
+- [ ] Per-pod storage isolation proven
+- [ ] Persistence test passed
+- [ ] `k8s/STATEFULSET.md` complete
+
+---
+
+## Rubric
+
+| Criteria | Points |
+|----------|--------|
+| **Concepts** | 2 pts |
+| **Implementation** | 3 pts |
+| **Identity & Storage** | 3 pts |
+| **Documentation** | 2 pts |
+| **Bonus** | 2.5 pts |
+| **Total** | 12.5 pts |
+
+---
+
+## Resources
+
+<details>
+<summary>📚 Documentation</summary>
+
+- [StatefulSets](https://kubernetes.io/docs/concepts/workloads/controllers/statefulset/)
+- [Headless Services](https://kubernetes.io/docs/concepts/services-networking/service/#headless-services)
+- [VolumeClaimTemplates](https://kubernetes.io/docs/concepts/workloads/controllers/statefulset/#volume-claim-templates)
+
+</details>
+
+---
+
+## Looking Ahead
+
+- **Lab 16:** Monitoring your StatefulSet with Prometheus/Grafana
+
+---
+
+**Good luck!** 💾
+
+> **Remember:** StatefulSets are for applications needing stable identity and storage. For progressive delivery of stateless apps, use Rollouts (Lab 14).
diff --git a/labs/lab16.md b/labs/lab16.md
new file mode 100644
index 0000000000..6fa7220f36
--- /dev/null
+++ b/labs/lab16.md
@@ -0,0 +1,261 @@
+# Lab 16 — Kubernetes Monitoring & Init Containers
+
+![difficulty](https://img.shields.io/badge/difficulty-advanced-red)
+![topic](https://img.shields.io/badge/topic-Observability-blue)
+![points](https://img.shields.io/badge/points-10%2B2.5-orange)
+![tech](https://img.shields.io/badge/tech-Prometheus%20%7C%20Grafana-informational)
+
+> Implement comprehensive cluster monitoring with Kube-Prometheus stack and learn init container patterns.
+
+## Overview
+
+Production Kubernetes clusters require robust monitoring. The Kube-Prometheus stack provides a complete solution with Prometheus, Grafana, and Alertmanager. Init containers enable setup tasks before your main application starts.
+
+**What You'll Learn:**
+- Kube-Prometheus stack components
+- Grafana dashboard exploration
+- Prometheus metrics and queries
+- Init container patterns
+
+**Tech Stack:** Prometheus | Grafana | Alertmanager | node-exporter | Init Containers
+
+**Tested Versions:** Minikube v1.34+ | Kubernetes v1.32+ | kube-prometheus-stack 65.x
+
+---
+
+## Tasks
+
+### Task 1 — Kube-Prometheus Stack (2 pts)
+
+**Objective:** Install and understand the monitoring stack.
+
+**Requirements:**
+
+1. **Understand Components** - Document roles of:
+   - Prometheus Operator
+   - Prometheus
+   - Alertmanager
+   - Grafana
+   - kube-state-metrics
+   - node-exporter
+
+2. **Install via Helm**
+   - Add prometheus-community repository
+   - Install in monitoring namespace
+   - Verify all pods are running
+
+<details>
+<summary>💡 Hints</summary>
+
+**Installation:**
+```bash
+helm repo add prometheus-community https://prometheus-community.github.io/helm-charts
+helm repo update
+
+helm install monitoring prometheus-community/kube-prometheus-stack \
+  --namespace monitoring \
+  --create-namespace
+
+kubectl get pods -n monitoring
+```
+
+**Resources:**
+- [kube-prometheus-stack](https://github.com/prometheus-community/helm-charts/tree/main/charts/kube-prometheus-stack)
+
+</details>
+
+---
+
+### Task 2 — Grafana Dashboard Exploration (3 pts)
+
+**Objective:** Use Grafana dashboards to answer questions about your cluster.
+
+**Access Grafana:**
+```bash
+kubectl port-forward svc/monitoring-grafana -n monitoring 3000:80
+# Default: admin / prom-operator
+```
+
+**Answer these questions using dashboards:**
+
+1. **Pod Resources:** CPU/memory usage of your StatefulSet
+2. **Namespace Analysis:** Which pods use most/least CPU in default namespace?
+3. **Node Metrics:** Memory usage (% and MB), CPU cores
+4. **Kubelet:** How many pods/containers managed?
+5. **Network:** Traffic for pods in default namespace
+6. **Alerts:** How many active alerts? Check Alertmanager UI
+
+<details>
+<summary>💡 Hints</summary>
+
+**Useful Dashboards:**
+- "Kubernetes / Compute Resources / Namespace (Pods)"
+- "Kubernetes / Compute Resources / Pod"
+- "Node Exporter / Nodes"
+- "Kubernetes / Kubelet"
+
+**Alertmanager:**
+```bash
+kubectl port-forward svc/monitoring-kube-prometheus-alertmanager -n monitoring 9093:9093
+```
+
+</details>
+
+---
+
+### Task 3 — Init Containers (3 pts)
+
+**Objective:** Implement init containers for pod initialization.
+
+**Requirements:**
+
+1. **Implement Basic Init Container**
+   - Download a file using `wget`
+   - Save to shared volume
+   - Verify main container can access it
+
+2. **Wait-for-Service Pattern**
+   - Create init container that waits for a service
+   - Only start main container when dependency ready
+
+<details>
+<summary>💡 Hints</summary>
+
+**Download Init Container:**
+```yaml
+spec:
+  initContainers:
+    - name: init-download
+      image: busybox:1.36
+      command: ['sh', '-c', 'wget -O /work-dir/index.html https://example.com']
+      volumeMounts:
+        - name: workdir
+          mountPath: /work-dir
+  containers:
+    - name: main-app
+      volumeMounts:
+        - name: workdir
+          mountPath: /data
+  volumes:
+    - name: workdir
+      emptyDir: {}
+```
+
+**Wait Pattern:**
+```yaml
+initContainers:
+  - name: wait-for-service
+    image: busybox:1.36
+    command: ['sh', '-c', 'until nslookup myservice; do sleep 2; done']
+```
+
+**Verification:**
+```bash
+kubectl get pods -w  # Watch Init:0/1 → Running
+kubectl logs <pod> -c init-download
+kubectl exec <pod> -- cat /data/index.html
+```
+
+</details>
+
+---
+
+### Task 4 — Documentation (2 pts)
+
+**Create `k8s/MONITORING.md` with:**
+
+1. **Stack Components** - Descriptions in your own words
+2. **Installation Evidence** - `kubectl get po,svc -n monitoring`
+3. **Dashboard Answers** - All 6 questions with screenshots
+4. **Init Containers** - Implementation and proof of success
+
+---
+
+## Bonus Task — Custom Metrics & ServiceMonitor (2.5 pts)
+
+**Objective:** Expose application metrics and configure Prometheus scraping.
+
+**Requirements:**
+
+1. **Add `/metrics` endpoint** to your app using Prometheus client library
+2. **Create ServiceMonitor** CRD for Prometheus to scrape your app
+3. **Verify metrics in Prometheus UI**
+
+<details>
+<summary>💡 Hints</summary>
+
+**ServiceMonitor:**
+```yaml
+apiVersion: monitoring.coreos.com/v1
+kind: ServiceMonitor
+metadata:
+  name: myapp-monitor
+  labels:
+    release: monitoring
+spec:
+  selector:
+    matchLabels:
+      app.kubernetes.io/name: myapp
+  endpoints:
+    - port: http
+      path: /metrics
+```
+
+**Prometheus UI:**
+```bash
+kubectl port-forward svc/monitoring-kube-prometheus-prometheus -n monitoring 9090:9090
+```
+
+</details>
+
+---
+
+## Checklist
+
+- [ ] Prometheus stack installed
+- [ ] All 6 dashboard questions answered
+- [ ] Screenshots included
+- [ ] Init container downloading file
+- [ ] Wait-for-service pattern implemented
+- [ ] `k8s/MONITORING.md` complete
+
+---
+
+## Rubric
+
+| Criteria | Points |
+|----------|--------|
+| **Prometheus Stack** | 2 pts |
+| **Grafana Exploration** | 3 pts |
+| **Init Containers** | 3 pts |
+| **Documentation** | 2 pts |
+| **Bonus** | 2.5 pts |
+| **Total** | 12.5 pts |
+
+---
+
+## Resources
+
+<details>
+<summary>📚 Documentation</summary>
+
+- [Prometheus](https://prometheus.io/docs/)
+- [Grafana](https://grafana.com/docs/)
+- [Init Containers](https://kubernetes.io/docs/concepts/workloads/pods/init-containers/)
+- [ServiceMonitor](https://prometheus-operator.dev/docs/user-guides/getting-started/)
+
+</details>
+
+---
+
+## Course Completion
+
+Congratulations on completing the core Kubernetes labs! You now have experience with the complete DevOps lifecycle from development to production monitoring.
+
+**Optional:** Labs 17-18 are exam alternatives covering Fly.io and 4EVERLAND.
+
+---
+
+**Good luck!** 📊
+
+> **Remember:** Monitoring is not optional in production. If you can't measure it, you can't improve it.
diff --git a/labs/lab17.md b/labs/lab17.md
new file mode 100644
index 0000000000..c0ca8ed79d
--- /dev/null
+++ b/labs/lab17.md
@@ -0,0 +1,447 @@
+# Lab 17 — Fly.io Edge Deployment
+
+![difficulty](https://img.shields.io/badge/difficulty-intermediate-yellow)
+![topic](https://img.shields.io/badge/topic-Edge%20Computing-blue)
+![points](https://img.shields.io/badge/points-20-orange)
+![type](https://img.shields.io/badge/type-Exam%20Alternative-purple)
+
+> Deploy your application globally on Fly.io's edge infrastructure and experience simplified cloud deployment.
+
+## Overview
+
+Fly.io is a platform for running applications close to users worldwide. Unlike Kubernetes which requires cluster management, Fly.io abstracts infrastructure away while still giving you control over deployment, scaling, and observability.
+
+**This is an Exam Alternative Lab** — Complete both Lab 17 and Lab 18 to replace the final exam.
+
+**What You'll Learn:**
+- Edge computing concepts
+- Platform-as-a-Service deployment
+- Global application distribution
+- Kubernetes vs PaaS trade-offs
+- Modern deployment workflows
+
+**Prerequisites:** Working Docker image from Lab 2
+
+**Tech Stack:** Fly.io | flyctl CLI | Docker | Multi-region deployment
+
+---
+
+## Exam Alternative Requirements
+
+| Requirement | Details |
+|-------------|---------|
+| **Deadline** | 1 week before exam date |
+| **Minimum Score** | 16/20 points |
+| **Must Complete** | Both Lab 17 AND Lab 18 |
+| **Total Points** | 40 pts (replaces 40 pt exam) |
+
+---
+
+## Tasks
+
+### Task 1 — Fly.io Setup (3 pts)
+
+**Objective:** Set up Fly.io account and CLI.
+
+**Requirements:**
+
+1. **Create Account**
+   - Sign up at [fly.io](https://fly.io)
+   - No credit card required for free tier
+   - Verify email
+
+2. **Install flyctl CLI**
+   - Install for your operating system
+   - Authenticate with `fly auth login`
+   - Verify with `fly version`
+
+3. **Explore Platform Concepts**
+   - Understand Fly Machines (VMs)
+   - Understand Fly Volumes (persistent storage)
+   - Understand Regions and edge deployment
+
+<details>
+<summary>💡 Hints</summary>
+
+**Installation:**
+```bash
+# macOS
+brew install flyctl
+
+# Linux
+curl -L https://fly.io/install.sh | sh
+
+# Windows (PowerShell)
+pwsh -Command "iwr https://fly.io/install.ps1 -useb | iex"
+```
+
+**Authentication:**
+```bash
+fly auth login
+# Opens browser for authentication
+
+fly auth whoami
+# Verify logged in
+```
+
+**Free Tier Includes:**
+- 3 shared-cpu-1x VMs (256MB RAM)
+- 3GB persistent storage
+- 160GB outbound bandwidth
+
+**Resources:**
+- [Fly.io Docs](https://fly.io/docs/)
+- [Getting Started](https://fly.io/docs/getting-started/)
+
+</details>
+
+---
+
+### Task 2 — Deploy Application (4 pts)
+
+**Objective:** Deploy your application to Fly.io.
+
+**Requirements:**
+
+1. **Prepare Application**
+   - Ensure Dockerfile works locally
+   - Application should listen on port 8080 (or configure in fly.toml)
+
+2. **Launch Application**
+   - Run `fly launch` in your app directory
+   - Configure app name and region
+   - Review generated `fly.toml`
+
+3. **Deploy**
+   - Run `fly deploy`
+   - Wait for deployment to complete
+   - Access your application via provided URL
+
+4. **Verify**
+   - Test all endpoints work
+   - Check application logs
+   - Verify health checks pass
+
+<details>
+<summary>💡 Hints</summary>
+
+**Launch Process:**
+```bash
+cd app_python  # or app_go
+
+fly launch
+# Follow prompts:
+# - App name: your-unique-name
+# - Region: select closest
+# - Postgres/Redis: No (for now)
+# - Deploy now: Yes
+```
+
+**fly.toml Configuration:**
+```toml
+app = "your-app-name"
+primary_region = "ams"  # Amsterdam, or your choice
+
+[build]
+  dockerfile = "Dockerfile"
+
+[http_service]
+  internal_port = 8080
+  force_https = true
+  auto_stop_machines = true
+  auto_start_machines = true
+  min_machines_running = 0
+
+[checks]
+  [checks.health]
+    type = "http"
+    port = 8080
+    path = "/health"
+    interval = "10s"
+    timeout = "2s"
+```
+
+**Useful Commands:**
+```bash
+fly status          # App status
+fly logs            # View logs
+fly open            # Open in browser
+fly ssh console     # SSH into machine
+```
+
+</details>
+
+---
+
+### Task 3 — Multi-Region Deployment (4 pts)
+
+**Objective:** Deploy your application to multiple regions worldwide.
+
+**Requirements:**
+
+1. **Add Regions**
+   - Deploy to at least 3 regions (e.g., ams, iad, sin)
+   - Understand region codes
+
+2. **Verify Global Distribution**
+   - Check machines in each region
+   - Access from different regions if possible
+
+3. **Test Latency**
+   - Document response times from different regions
+   - Understand how Fly routes requests to nearest region
+
+4. **Scale Machines**
+   - Scale to 2 machines in primary region
+   - Understand scaling commands
+
+<details>
+<summary>💡 Hints</summary>
+
+**Region Codes:**
+- `ams` - Amsterdam
+- `iad` - Virginia, USA
+- `sin` - Singapore
+- `syd` - Sydney
+- `lhr` - London
+
+**Adding Regions:**
+```bash
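+# Add regions (`fly regions add` is a legacy Apps V1 command; if flyctl rejects it, use `fly machine clone <machine-id> --region iad` for each new region)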
+fly regions add iad sin
+
+# List regions
+fly regions list
+
+# Check machines
+fly machines list
+```
+
+**Scaling:**
+```bash
+# Scale in specific region
+fly scale count 2 --region ams
+
+# Or modify fly.toml and deploy
+```
+
+**Verify Distribution:**
+```bash
+fly status
+# Shows machines in each region
+
+fly ping
+# Test connectivity to regions
+```
+
+</details>
+
+---
+
+### Task 4 — Secrets & Persistence (3 pts)
+
+**Objective:** Configure secrets and persistent storage.
+
+**Requirements:**
+
+1. **Configure Secrets**
+   - Set at least 2 secrets using `fly secrets`
+   - Verify secrets are available in application
+   - Understand secret management on Fly
+
+2. **Attach Volume** (if app needs persistence)
+   - Create Fly Volume
+   - Attach to application
+   - Verify data persists across deployments
+
+<details>
+<summary>💡 Hints</summary>
+
+**Secrets:**
+```bash
+# Set secrets
+fly secrets set DATABASE_URL="postgres://..." API_KEY="secret123"
+
+# List secrets (names only)
+fly secrets list
+
+# Secrets available as env vars in app
+```
+
+**Volumes:**
+```bash
+# Create volume
+fly volumes create myapp_data --size 1 --region ams
+
+# Update fly.toml — add this TOML section to the file (it is not a shell command):
+#   [mounts]
+#     source = "myapp_data"
+#     destination = "/data"
+
+# Deploy
+fly deploy
+```
+
+**Verify Persistence:**
+```bash
+fly ssh console
+# Inside machine
+cat /data/visits
+```
+
+</details>
+
+---
+
+### Task 5 — Monitoring & Operations (3 pts)
+
+**Objective:** Monitor and manage your deployed application.
+
+**Requirements:**
+
+1. **View Metrics**
+   - Access Fly.io dashboard
+   - View CPU, memory, network metrics
+   - Understand machine states
+
+2. **Manage Deployments**
+   - Deploy a new version
+   - View deployment history
+   - Understand rollback capability
+
+3. **Health Checks**
+   - Configure HTTP health checks
+   - Verify health check execution
+   - Understand failure behavior
+
+<details>
+<summary>💡 Hints</summary>
+
+**Dashboard:**
+- Visit https://fly.io/dashboard
+- Select your app
+- View Metrics, Machines, Volumes tabs
+
+**Deployments:**
+```bash
+fly releases
+# Shows deployment history
+
+fly deploy --strategy rolling
+# Rolling deployment
+
+fly deploy --strategy immediate
+# Immediate replacement
+```
+
+**Health Checks in fly.toml:**
+```toml
+[checks]
+  [checks.health]
+    type = "http"
+    port = 8080
+    path = "/health"
+    interval = "10s"
+    timeout = "2s"
+    grace_period = "30s"
+```
+
+</details>
+
+---
+
+### Task 6 — Documentation & Comparison (3 pts)
+
+**Objective:** Document deployment and compare with Kubernetes.
+
+**Create `FLYIO.md` with:**
+
+1. **Deployment Summary**
+   - App URL
+   - Regions deployed
+   - Configuration used
+
+2. **Screenshots**
+   - Fly.io dashboard
+   - Multi-region machines
+   - Metrics view
+
+3. **Kubernetes vs Fly.io Comparison**
+
+| Aspect | Kubernetes | Fly.io |
+|--------|------------|--------|
+| Setup complexity | | |
+| Deployment speed | | |
+| Global distribution | | |
+| Cost (for small apps) | | |
+| Learning curve | | |
+| Control/flexibility | | |
+| Best use case | | |
+
+4. **When to Use Each**
+   - Scenarios favoring Kubernetes
+   - Scenarios favoring Fly.io
+   - Your recommendation
+
+---
+
+## Checklist
+
+- [ ] Fly.io account created
+- [ ] flyctl CLI installed and authenticated
+- [ ] Application deployed successfully
+- [ ] Multiple regions configured (3+)
+- [ ] Secrets configured
+- [ ] Persistence tested (if applicable)
+- [ ] Health checks working
+- [ ] Metrics accessible
+- [ ] `FLYIO.md` documentation complete
+- [ ] Kubernetes comparison documented
+
+---
+
+## Rubric
+
+| Criteria | Points |
+|----------|--------|
+| **Setup** | 3 pts |
+| **Deployment** | 4 pts |
+| **Multi-Region** | 4 pts |
+| **Secrets & Persistence** | 3 pts |
+| **Monitoring** | 3 pts |
+| **Documentation** | 3 pts |
+| **Total** | **20 pts** |
+
+**Grading:**
+- **18-20:** Excellent global deployment, thorough comparison
+- **16-17:** Working deployment, good documentation
+- **14-15:** Basic deployment, missing regions or docs
+- **<14:** Incomplete deployment
+
+---
+
+## Resources
+
+<details>
+<summary>📚 Fly.io Documentation</summary>
+
+- [Fly.io Docs](https://fly.io/docs/)
+- [flyctl Reference](https://fly.io/docs/flyctl/)
+- [Fly Machines](https://fly.io/docs/machines/)
+- [Fly Volumes](https://fly.io/docs/volumes/)
+
+</details>
+
+<details>
+<summary>🌍 Regions</summary>
+
+- [Available Regions](https://fly.io/docs/reference/regions/)
+- [Region Selection](https://fly.io/docs/reference/scaling/#regions)
+
+</details>
+
+---
+
+**Good luck!** ✈️
+
+> **Remember:** Fly.io is great for global, low-latency applications. Kubernetes gives more control but requires more management. Choose the right tool for your use case.
diff --git a/labs/lab18.md b/labs/lab18.md
new file mode 100644
index 0000000000..3491394659
--- /dev/null
+++ b/labs/lab18.md
@@ -0,0 +1,430 @@
+# Lab 18 — Decentralized Hosting with 4EVERLAND & IPFS
+
+![difficulty](https://img.shields.io/badge/difficulty-intermediate-yellow)
+![topic](https://img.shields.io/badge/topic-Web3%20Infrastructure-blue)
+![points](https://img.shields.io/badge/points-20-orange)
+![type](https://img.shields.io/badge/type-Exam%20Alternative-purple)
+
+> Deploy content to the decentralized web using IPFS and 4EVERLAND for permanent, censorship-resistant hosting.
+
+## Overview
+
+The decentralized web (Web3) offers an alternative to traditional hosting where content is stored across a distributed network rather than centralized servers. IPFS (InterPlanetary File System) is the foundation, and 4EVERLAND provides a user-friendly gateway to this ecosystem.
+
+**This is an Exam Alternative Lab** — Complete both Lab 17 and Lab 18 to replace the final exam.
+
+**What You'll Learn:**
+- IPFS fundamentals and content addressing
+- Decentralized storage concepts
+- Pinning services and persistence
+- 4EVERLAND hosting platform
+- Centralized vs decentralized trade-offs
+
+**Prerequisites:** Basic understanding of web hosting, completed Docker lab
+
+**Tech Stack:** IPFS | 4EVERLAND | Docker | Content Addressing
+
+**Provided Files:**
+- `labs/lab18/index.html` — A beautiful course landing page ready to deploy
+
+---
+
+## Exam Alternative Requirements
+
+| Requirement | Details |
+|-------------|---------|
+| **Deadline** | 1 week before exam date |
+| **Minimum Score** | 16/20 points |
+| **Must Complete** | Both Lab 17 AND Lab 18 |
+| **Total Points** | 40 pts (replaces 40 pt exam) |
+
+---
+
+## Tasks
+
+### Task 1 — IPFS Fundamentals (3 pts)
+
+**Objective:** Understand IPFS concepts and run a local node.
+
+**Requirements:**
+
+1. **Study IPFS Concepts**
+   - Content addressing vs location addressing
+   - CIDs (Content Identifiers)
+   - Pinning and garbage collection
+   - IPFS gateways
+
+2. **Run Local IPFS Node**
+   - Use Docker to run IPFS node
+   - Access the Web UI
+   - Understand node configuration
+
+3. **Add Content Locally**
+   - Add a file to your local IPFS node
+   - Retrieve the CID
+   - Access via local gateway
+
+<details>
+<summary>💡 Hints</summary>
+
+**IPFS Concepts:**
+- **Content Addressing:** Files identified by hash of content, not location
+- **CID:** Unique identifier derived from content hash (e.g., `QmXxx...` or `bafyxxx...`)
+- **Pinning:** Marking content to keep it (prevent garbage collection)
+- **Gateway:** HTTP interface to IPFS network
+
+**Run IPFS with Docker:**
+```bash
+docker run -d --name ipfs \
+  -p 4001:4001 \
+  -p 8080:8080 \
+  -p 5001:5001 \
+  ipfs/kubo:latest
+
+# Web UI at http://localhost:5001/webui
+# Gateway at http://localhost:8080
+```
+
+**Add Content:**
+```bash
+# Create test file
+echo "Hello IPFS from DevOps course!" > hello.txt
+
+# Copy the file into the container, then add it to IPFS
+docker cp hello.txt ipfs:/hello.txt && docker exec ipfs ipfs add /hello.txt
+# Returns: added QmXxx... hello.txt
+
+# Access via gateway
+curl http://localhost:8080/ipfs/QmXxx...
+```
+
+**Resources:**
+- [IPFS Docs](https://docs.ipfs.tech/)
+- [IPFS Concepts](https://docs.ipfs.tech/concepts/)
+
+</details>
+
+---
+
+### Task 2 — 4EVERLAND Setup (3 pts)
+
+**Objective:** Set up 4EVERLAND account and explore the platform.
+
+**Requirements:**
+
+1. **Create Account**
+   - Sign up at [4everland.org](https://www.4everland.org/)
+   - Connect with GitHub or wallet
+   - Explore dashboard
+
+2. **Understand Services**
+   - Hosting: Deploy websites/apps
+   - Storage: IPFS pinning
+   - Gateway: Access IPFS content
+
+3. **Explore Free Tier**
+   - Understand limits and capabilities
+   - Review pricing for reference
+
+<details>
+<summary>💡 Hints</summary>
+
+**4EVERLAND Services:**
+- **Hosting:** Deploy from Git repos, automatic builds
+- **Bucket (Storage):** Upload files, get IPFS CIDs
+- **Gateway:** Access content via 4everland.link
+
+**Dashboard:**
+- Projects: Your deployed sites
+- Bucket: File storage
+- Domains: Custom domain setup
+
+**Free Tier Includes:**
+- 100 deployments/month
+- 5GB storage
+- 100GB bandwidth
+
+**Resources:**
+- [4EVERLAND Docs](https://docs.4everland.org/)
+
+</details>
+
+---
+
+### Task 3 — Deploy Static Content (4 pts)
+
+**Objective:** Deploy a static site to 4EVERLAND.
+
+**Requirements:**
+
+1. **Use the Provided Static Site**
+   - A course landing page is provided at `labs/lab18/index.html`
+   - Review the HTML/CSS to understand the structure
+   - You may customize it or create your own
+
+2. **Deploy via 4EVERLAND**
+   - Connect your GitHub repository
+   - Configure build settings
+   - Deploy to IPFS via 4EVERLAND
+
+3. **Verify Deployment**
+   - Access via 4EVERLAND URL
+   - Access via IPFS gateway
+   - Note the CID
+
+4. **Test Permanence**
+   - Understand that identical content always produces the same CID
+   - Make a change, redeploy, observe new CID
+
+<details>
+<summary>💡 Hints</summary>
+
+**Provided Static Site:**
+The course provides a beautiful landing page at `labs/lab18/index.html` that you can deploy. It includes:
+- Modern responsive design
+- Course curriculum overview
+- Learning roadmap
+- "Deployed on IPFS" badge
+
+**Deployment Steps:**
+1. Go to 4EVERLAND Dashboard → Hosting
+2. Click "New Project"
+3. Import from GitHub
+4. Select your repository and branch
+5. Configure:
+   - Framework: None (static)
+   - Build command: (leave empty for static)
+   - Output directory: `labs/lab18` (or root if you moved the file)
+6. Deploy
+
+**Alternative: Create Your Own**
+You can also create your own static site. Keep it simple:
+```html
+<!DOCTYPE html>
+<html>
+<head>
+    <title>My DevOps Portfolio</title>
+</head>
+<body>
+    <h1>Welcome to My DevOps Journey</h1>
+    <p>Deployed on IPFS via 4EVERLAND</p>
+</body>
+</html>
+```
+
+**Access URLs:**
+- 4EVERLAND: `https://your-project.4everland.app`
+- IPFS Gateway: `https://ipfs.4everland.link/ipfs/CID`
+
+</details>
+
+---
+
+### Task 4 — IPFS Pinning (4 pts)
+
+**Objective:** Use 4EVERLAND's storage (Bucket) for IPFS pinning.
+
+**Requirements:**
+
+1. **Upload Files to Bucket**
+   - Upload multiple files (images, documents, etc.)
+   - Get CIDs for each file
+
+2. **Create a Directory Structure**
+   - Upload a folder with multiple files
+   - Understand directory CIDs
+
+3. **Access via Multiple Gateways**
+   - Access your content via:
+     - 4EVERLAND gateway
+     - Public IPFS gateways (ipfs.io, dweb.link)
+   - Understand gateway differences
+
+4. **Verify Pinning**
+   - Confirm content is pinned
+   - Understand pinning vs local storage
+
+<details>
+<summary>💡 Hints</summary>
+
+**Bucket Upload:**
+1. Dashboard → Bucket
+2. Create new bucket
+3. Upload files or folders
+4. Get CID from file details
+
+**Multiple Gateways:**
+```bash
+# 4EVERLAND
+https://ipfs.4everland.link/ipfs/QmXxx...
+
+# IPFS.io
+https://ipfs.io/ipfs/QmXxx...
+
+# Cloudflare (public gateway retired in 2024 - may redirect or fail; prefer ipfs.io / dweb.link)
+https://cloudflare-ipfs.com/ipfs/QmXxx...
+
+# DWeb.link
+https://dweb.link/ipfs/QmXxx...
+```
+
+**Directory Upload:**
+- Upload entire folder
+- Get directory CID
+- Access files: `https://<gateway>/ipfs/<DirCID>/<filename>`
+
+**Pinning Importance:**
+- Unpinned content may be garbage collected
+- Pinning services keep content available
+- Multiple pins = more redundancy
+
+</details>
+
+---
+
+### Task 5 — IPNS & Updates (3 pts)
+
+**Objective:** Understand mutable content with IPNS.
+
+**Requirements:**
+
+1. **Understand IPNS**
+   - IPFS = immutable (content changes = new CID)
+   - IPNS = mutable pointer to IPFS content
+   - IPNS name stays same, content can change
+
+2. **Explore 4EVERLAND Domains**
+   - Custom domains for your deployment
+   - How 4EVERLAND handles updates
+
+3. **Update Deployment**
+   - Make changes to your static site
+   - Redeploy
+   - Observe: same URL, new CID
+
+<details>
+<summary>💡 Hints</summary>
+
+**IPFS vs IPNS:**
+- **IPFS CID:** `QmXxx...` - changes when content changes
+- **IPNS Name:** `/ipns/k51xxx...` - stays same, points to current CID
+
+**4EVERLAND Handles This:**
+- Your project URL stays constant
+- Behind the scenes, 4EVERLAND updates the IPNS pointer
+- Users always get latest version
+
+**Domain Configuration:**
+1. Dashboard → Hosting → Your Project
+2. Settings → Domains
+3. Add custom domain or use provided subdomain
+
+</details>
+
+---
+
+### Task 6 — Documentation & Analysis (3 pts)
+
+**Objective:** Document your work and analyze decentralized hosting.
+
+**Create `4EVERLAND.md` with:**
+
+1. **Deployment Summary**
+   - What you deployed
+   - URLs (4EVERLAND and IPFS gateways)
+   - CIDs obtained
+
+2. **Screenshots**
+   - 4EVERLAND dashboard
+   - Deployed site
+   - Bucket storage
+   - Multiple gateway access
+
+3. **Centralized vs Decentralized Comparison**
+
+| Aspect | Traditional Hosting | IPFS/4EVERLAND |
+|--------|---------------------|----------------|
+| Content addressing | | |
+| Single point of failure | | |
+| Censorship resistance | | |
+| Update mechanism | | |
+| Cost model | | |
+| Speed/latency | | |
+| Best use cases | | |
+
+4. **Use Case Analysis**
+   - When decentralized hosting makes sense
+   - When traditional hosting is better
+   - Your recommendations
+
+---
+
+## Checklist
+
+- [ ] IPFS concepts understood
+- [ ] Local IPFS node running
+- [ ] Content added to local IPFS
+- [ ] 4EVERLAND account created
+- [ ] Static site deployed via 4EVERLAND
+- [ ] Files uploaded to Bucket
+- [ ] Content accessed via multiple gateways
+- [ ] IPNS/updates understood
+- [ ] `4EVERLAND.md` documentation complete
+- [ ] Comparison analysis complete
+
+---
+
+## Rubric
+
+| Criteria | Points |
+|----------|--------|
+| **IPFS Fundamentals** | 3 pts |
+| **4EVERLAND Setup** | 3 pts |
+| **Static Deployment** | 4 pts |
+| **IPFS Pinning** | 4 pts |
+| **IPNS & Updates** | 3 pts |
+| **Documentation** | 3 pts |
+| **Total** | **20 pts** |
+
+**Grading:**
+- **18-20:** Excellent understanding, thorough deployment, insightful analysis
+- **16-17:** Working deployment, good documentation
+- **14-15:** Basic deployment, incomplete analysis
+- **<14:** Incomplete deployment
+
+---
+
+## Resources
+
+<details>
+<summary>📚 IPFS Documentation</summary>
+
+- [IPFS Docs](https://docs.ipfs.tech/)
+- [IPFS Concepts](https://docs.ipfs.tech/concepts/)
+- [Content Addressing](https://docs.ipfs.tech/concepts/content-addressing/)
+- [IPNS](https://docs.ipfs.tech/concepts/ipns/)
+
+</details>
+
+<details>
+<summary>🌐 4EVERLAND</summary>
+
+- [4EVERLAND Docs](https://docs.4everland.org/)
+- [Hosting Guide](https://docs.4everland.org/hosting/overview)
+- [Bucket (Storage)](https://docs.4everland.org/storage/bucket)
+
+</details>
+
+<details>
+<summary>🔗 Public Gateways</summary>
+
+- [IPFS Gateway Checker](https://ipfs.github.io/public-gateway-checker/)
+- [Gateway List](https://docs.ipfs.tech/concepts/ipfs-gateway/#gateway-providers)
+
+</details>
+
+---
+
+**Good luck!** 🌐
+
+> **Remember:** Decentralized hosting trades some convenience for resilience and censorship resistance. Content-addressed storage ensures integrity - the same content always has the same identifier.
diff --git a/labs/lab18/app_python/freeze1.txt b/labs/lab18/app_python/freeze1.txt
new file mode 100644
index 0000000000..af266d21cd
--- /dev/null
+++ b/labs/lab18/app_python/freeze1.txt
@@ -0,0 +1 @@
+Flask==3.1.3
diff --git a/labs/lab18/app_python/freeze2.txt b/labs/lab18/app_python/freeze2.txt
new file mode 100644
index 0000000000..af266d21cd
--- /dev/null
+++ b/labs/lab18/app_python/freeze2.txt
@@ -0,0 +1 @@
+Flask==3.1.3
diff --git a/labs/lab18/index.html b/labs/lab18/index.html
new file mode 100644
index 0000000000..b3de65bc8b
--- /dev/null
+++ b/labs/lab18/index.html
@@ -0,0 +1,927 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+    <meta charset="UTF-8">
+    <meta name="viewport" content="width=device-width, initial-scale=1.0">
+    <title>DevOps Core Course | Production-Grade Practices</title>
+    <meta name="description" content="Master production-grade DevOps practices through 16 hands-on labs. Build, containerize, deploy, monitor, and scale applications using industry-standard tools.">
+    <link rel="preconnect" href="https://fonts.googleapis.com">
+    <link rel="preconnect" href="https://fonts.gstatic.com" crossorigin>
+    <link href="https://fonts.googleapis.com/css2?family=Inter:wght@300;400;500;600;700&family=JetBrains+Mono:wght@400;500&display=swap" rel="stylesheet">
+    <style>
+        :root {
+            --bg-primary: #0a0a0f;
+            --bg-secondary: #12121a;
+            --bg-card: #1a1a24;
+            --accent-primary: #6366f1;
+            --accent-secondary: #8b5cf6;
+            --accent-tertiary: #06b6d4;
+            --accent-success: #10b981;
+            --accent-warning: #f59e0b;
+            --accent-danger: #ef4444;
+            --text-primary: #f8fafc;
+            --text-secondary: #94a3b8;
+            --text-muted: #64748b;
+            --border-color: #2d2d3a;
+            --gradient-1: linear-gradient(135deg, #6366f1 0%, #8b5cf6 50%, #06b6d4 100%);
+            --gradient-2: linear-gradient(135deg, #1a1a24 0%, #0a0a0f 100%);
+        }
+
+        * {
+            box-sizing: border-box;
+            margin: 0;
+            padding: 0;
+        }
+
+        html {
+            scroll-behavior: smooth;
+        }
+
+        body {
+            font-family: 'Inter', -apple-system, BlinkMacSystemFont, sans-serif;
+            background: var(--bg-primary);
+            color: var(--text-primary);
+            line-height: 1.7;
+            overflow-x: hidden;
+        }
+
+        .container {
+            max-width: 1200px;
+            margin: 0 auto;
+            padding: 0 2rem;
+        }
+
+        /* Navigation */
+        header {
+            position: fixed;
+            top: 0;
+            left: 0;
+            right: 0;
+            z-index: 1000;
+            background: rgba(10, 10, 15, 0.8);
+            backdrop-filter: blur(20px);
+            border-bottom: 1px solid var(--border-color);
+        }
+
+        nav {
+            display: flex;
+            justify-content: space-between;
+            align-items: center;
+            padding: 1rem 2rem;
+            max-width: 1200px;
+            margin: 0 auto;
+        }
+
+        .logo {
+            font-size: 1.25rem;
+            font-weight: 700;
+            background: var(--gradient-1);
+            -webkit-background-clip: text;
+            -webkit-text-fill-color: transparent;
+            background-clip: text;
+        }
+
+        .nav-links {
+            display: flex;
+            gap: 2rem;
+            list-style: none;
+        }
+
+        .nav-links a {
+            color: var(--text-secondary);
+            text-decoration: none;
+            font-size: 0.9rem;
+            font-weight: 500;
+            transition: color 0.3s ease;
+        }
+
+        .nav-links a:hover {
+            color: var(--text-primary);
+        }
+
+        /* Hero Section */
+        .hero {
+            min-height: 100vh;
+            display: flex;
+            align-items: center;
+            position: relative;
+            padding-top: 80px;
+            overflow: hidden;
+        }
+
+        .hero::before {
+            content: '';
+            position: absolute;
+            top: 0;
+            left: 0;
+            right: 0;
+            bottom: 0;
+            background:
+                radial-gradient(ellipse at 20% 20%, rgba(99, 102, 241, 0.15) 0%, transparent 50%),
+                radial-gradient(ellipse at 80% 80%, rgba(6, 182, 212, 0.1) 0%, transparent 50%),
+                radial-gradient(ellipse at 50% 50%, rgba(139, 92, 246, 0.05) 0%, transparent 70%);
+            pointer-events: none;
+        }
+
+        .hero-content {
+            position: relative;
+            z-index: 1;
+            text-align: center;
+            max-width: 900px;
+            margin: 0 auto;
+        }
+
+        .hero-badge {
+            display: inline-flex;
+            align-items: center;
+            gap: 0.5rem;
+            background: var(--bg-card);
+            border: 1px solid var(--border-color);
+            padding: 0.5rem 1rem;
+            border-radius: 50px;
+            font-size: 0.85rem;
+            color: var(--text-secondary);
+            margin-bottom: 2rem;
+        }
+
+        .hero-badge span {
+            color: var(--accent-success);
+        }
+
+        .hero h1 {
+            font-size: clamp(2.5rem, 6vw, 4.5rem);
+            font-weight: 700;
+            line-height: 1.1;
+            margin-bottom: 1.5rem;
+            background: linear-gradient(135deg, var(--text-primary) 0%, var(--text-secondary) 100%);
+            -webkit-background-clip: text;
+            -webkit-text-fill-color: transparent;
+            background-clip: text;
+        }
+
+        .hero h1 .highlight {
+            background: var(--gradient-1);
+            -webkit-background-clip: text;
+            -webkit-text-fill-color: transparent;
+            background-clip: text;
+        }
+
+        .hero p {
+            font-size: 1.25rem;
+            color: var(--text-secondary);
+            max-width: 600px;
+            margin: 0 auto 2.5rem;
+        }
+
+        .hero-buttons {
+            display: flex;
+            gap: 1rem;
+            justify-content: center;
+            flex-wrap: wrap;
+        }
+
+        .btn {
+            display: inline-flex;
+            align-items: center;
+            gap: 0.5rem;
+            padding: 0.875rem 1.75rem;
+            border-radius: 12px;
+            font-size: 1rem;
+            font-weight: 600;
+            text-decoration: none;
+            transition: all 0.3s ease;
+            cursor: pointer;
+            border: none;
+        }
+
+        .btn-primary {
+            background: var(--gradient-1);
+            color: white;
+            box-shadow: 0 4px 20px rgba(99, 102, 241, 0.3);
+        }
+
+        .btn-primary:hover {
+            transform: translateY(-2px);
+            box-shadow: 0 6px 30px rgba(99, 102, 241, 0.4);
+        }
+
+        .btn-secondary {
+            background: var(--bg-card);
+            color: var(--text-primary);
+            border: 1px solid var(--border-color);
+        }
+
+        .btn-secondary:hover {
+            background: var(--bg-secondary);
+            border-color: var(--accent-primary);
+        }
+
+        /* Stats Section */
+        .stats {
+            display: grid;
+            grid-template-columns: repeat(4, 1fr);
+            gap: 2rem;
+            padding: 4rem 0;
+            border-top: 1px solid var(--border-color);
+            border-bottom: 1px solid var(--border-color);
+            margin: 4rem 0;
+        }
+
+        .stat-item {
+            text-align: center;
+        }
+
+        .stat-value {
+            font-size: 2.5rem;
+            font-weight: 700;
+            background: var(--gradient-1);
+            -webkit-background-clip: text;
+            -webkit-text-fill-color: transparent;
+            background-clip: text;
+        }
+
+        .stat-label {
+            color: var(--text-secondary);
+            font-size: 0.9rem;
+            margin-top: 0.5rem;
+        }
+
+        /* Section Styles */
+        section {
+            padding: 6rem 0;
+        }
+
+        .section-header {
+            text-align: center;
+            max-width: 700px;
+            margin: 0 auto 4rem;
+        }
+
+        .section-header h2 {
+            font-size: 2.5rem;
+            font-weight: 700;
+            margin-bottom: 1rem;
+        }
+
+        .section-header p {
+            color: var(--text-secondary);
+            font-size: 1.1rem;
+        }
+
+        /* Features Grid */
+        .features-grid {
+            display: grid;
+            grid-template-columns: repeat(auto-fit, minmax(300px, 1fr));
+            gap: 2rem;
+        }
+
+        .feature-card {
+            background: var(--bg-card);
+            border: 1px solid var(--border-color);
+            border-radius: 16px;
+            padding: 2rem;
+            transition: all 0.3s ease;
+        }
+
+        .feature-card:hover {
+            border-color: var(--accent-primary);
+            transform: translateY(-4px);
+        }
+
+        .feature-icon {
+            width: 48px;
+            height: 48px;
+            background: var(--gradient-1);
+            border-radius: 12px;
+            display: flex;
+            align-items: center;
+            justify-content: center;
+            font-size: 1.5rem;
+            margin-bottom: 1.5rem;
+        }
+
+        .feature-card h3 {
+            font-size: 1.25rem;
+            margin-bottom: 0.75rem;
+        }
+
+        .feature-card p {
+            color: var(--text-secondary);
+            font-size: 0.95rem;
+        }
+
+        /* Labs Section */
+        .labs-grid {
+            display: grid;
+            grid-template-columns: repeat(auto-fill, minmax(280px, 1fr));
+            gap: 1.5rem;
+        }
+
+        .lab-card {
+            background: var(--bg-card);
+            border: 1px solid var(--border-color);
+            border-radius: 12px;
+            padding: 1.5rem;
+            display: flex;
+            gap: 1rem;
+            align-items: flex-start;
+            transition: all 0.3s ease;
+        }
+
+        .lab-card:hover {
+            border-color: var(--accent-primary);
+        }
+
+        .lab-number {
+            width: 40px;
+            height: 40px;
+            background: var(--bg-secondary);
+            border-radius: 10px;
+            display: flex;
+            align-items: center;
+            justify-content: center;
+            font-weight: 700;
+            font-size: 0.9rem;
+            color: var(--accent-primary);
+            flex-shrink: 0;
+        }
+
+        .lab-card.bonus .lab-number {
+            background: linear-gradient(135deg, var(--accent-warning) 0%, var(--accent-danger) 100%);
+            color: white;
+        }
+
+        .lab-content h4 {
+            font-size: 1rem;
+            margin-bottom: 0.25rem;
+        }
+
+        .lab-content p {
+            color: var(--text-muted);
+            font-size: 0.85rem;
+        }
+
+        .lab-tag {
+            display: inline-block;
+            font-size: 0.7rem;
+            padding: 0.2rem 0.5rem;
+            border-radius: 4px;
+            background: var(--bg-secondary);
+            color: var(--text-secondary);
+            margin-top: 0.5rem;
+        }
+
+        .lab-tag.exam-alt {
+            background: rgba(245, 158, 11, 0.2);
+            color: var(--accent-warning);
+        }
+
+        /* Roadmap */
+        .roadmap {
+            display: grid;
+            gap: 2rem;
+        }
+
+        .phase {
+            background: var(--bg-card);
+            border: 1px solid var(--border-color);
+            border-radius: 16px;
+            padding: 2rem;
+            display: grid;
+            grid-template-columns: auto 1fr;
+            gap: 2rem;
+            align-items: center;
+        }
+
+        .phase-number {
+            width: 80px;
+            height: 80px;
+            background: var(--gradient-1);
+            border-radius: 16px;
+            display: flex;
+            flex-direction: column;
+            align-items: center;
+            justify-content: center;
+            color: white;
+        }
+
+        .phase-number span {
+            font-size: 0.7rem;
+            text-transform: uppercase;
+            letter-spacing: 1px;
+            opacity: 0.8;
+        }
+
+        .phase-number strong {
+            font-size: 1.75rem;
+        }
+
+        .phase-content h3 {
+            font-size: 1.25rem;
+            margin-bottom: 0.5rem;
+        }
+
+        .phase-content p {
+            color: var(--text-secondary);
+        }
+
+        .phase-topics {
+            display: flex;
+            flex-wrap: wrap;
+            gap: 0.5rem;
+            margin-top: 1rem;
+        }
+
+        .topic-tag {
+            background: var(--bg-secondary);
+            border: 1px solid var(--border-color);
+            padding: 0.25rem 0.75rem;
+            border-radius: 6px;
+            font-size: 0.8rem;
+            color: var(--text-secondary);
+        }
+
+        /* CTA Section */
+        .cta {
+            background: var(--bg-card);
+            border: 1px solid var(--border-color);
+            border-radius: 24px;
+            padding: 4rem;
+            text-align: center;
+            position: relative;
+            overflow: hidden;
+        }
+
+        .cta::before {
+            content: '';
+            position: absolute;
+            top: 0;
+            left: 0;
+            right: 0;
+            bottom: 0;
+            background:
+                radial-gradient(ellipse at 30% 0%, rgba(99, 102, 241, 0.1) 0%, transparent 50%),
+                radial-gradient(ellipse at 70% 100%, rgba(6, 182, 212, 0.1) 0%, transparent 50%);
+            pointer-events: none;
+        }
+
+        .cta h2 {
+            font-size: 2rem;
+            margin-bottom: 1rem;
+            position: relative;
+        }
+
+        .cta p {
+            color: var(--text-secondary);
+            margin-bottom: 2rem;
+            position: relative;
+        }
+
+        /* Footer */
+        footer {
+            padding: 3rem 0;
+            border-top: 1px solid var(--border-color);
+            text-align: center;
+        }
+
+        footer p {
+            color: var(--text-muted);
+            font-size: 0.9rem;
+        }
+
+        footer a {
+            color: var(--accent-primary);
+            text-decoration: none;
+        }
+
+        footer a:hover {
+            text-decoration: underline;
+        }
+
+        .footer-links {
+            display: flex;
+            justify-content: center;
+            gap: 2rem;
+            margin-top: 1rem;
+        }
+
+        /* Deployed Badge */
+        .deployed-badge {
+            position: fixed;
+            bottom: 2rem;
+            right: 2rem;
+            background: var(--bg-card);
+            border: 1px solid var(--border-color);
+            border-radius: 12px;
+            padding: 1rem 1.5rem;
+            display: flex;
+            align-items: center;
+            gap: 0.75rem;
+            font-size: 0.85rem;
+            z-index: 100;
+            box-shadow: 0 10px 40px rgba(0, 0, 0, 0.3);
+        }
+
+        .deployed-badge .icon {
+            width: 32px;
+            height: 32px;
+            background: var(--gradient-1);
+            border-radius: 8px;
+            display: flex;
+            align-items: center;
+            justify-content: center;
+        }
+
+        .deployed-badge span {
+            color: var(--text-secondary);
+        }
+
+        .deployed-badge strong {
+            color: var(--accent-tertiary);
+        }
+
+        /* Responsive */
+        @media (max-width: 768px) {
+            .nav-links {
+                display: none;
+            }
+
+            .stats {
+                grid-template-columns: repeat(2, 1fr);
+            }
+
+            .phase {
+                grid-template-columns: 1fr;
+                text-align: center;
+            }
+
+            .phase-number {
+                margin: 0 auto;
+            }
+
+            .phase-topics {
+                justify-content: center;
+            }
+
+            .cta {
+                padding: 2rem;
+            }
+
+            .deployed-badge {
+                bottom: 1rem;
+                right: 1rem;
+                left: 1rem;
+            }
+        }
+    </style>
+</head>
+<body>
+    <header>
+        <nav>
+            <div class="logo">DevOps Core</div>
+            <ul class="nav-links">
+                <li><a href="#features">Features</a></li>
+                <li><a href="#labs">Labs</a></li>
+                <li><a href="#roadmap">Roadmap</a></li>
+                <li><a href="https://github.com/inno-devops-labs/S25-core-course-labs">GitHub</a></li>
+            </ul>
+        </nav>
+    </header>
+
+    <main>
+        <section class="hero">
+            <div class="container">
+                <div class="hero-content">
+                    <div class="hero-badge">
+                        <span>&#x2713;</span> 2026 Edition &mdash; 7th Year &mdash; Evolved every semester
+                    </div>
+                    <h1>Master <span class="highlight">Production-Grade</span> DevOps Practices</h1>
+                    <p>16 lectures and hands-on labs covering Kubernetes, GitOps, CI/CD, Monitoring, and beyond. 18 weeks of learning to build real-world skills.</p>
+                    <div class="hero-buttons">
+                        <a href="https://github.com/inno-devops-labs/S25-core-course-labs" class="btn btn-primary">
+                            Start Learning &rarr;
+                        </a>
+                        <a href="#labs" class="btn btn-secondary">
+                            View Curriculum
+                        </a>
+                    </div>
+                </div>
+            </div>
+        </section>
+
+        <section class="container">
+            <div class="stats">
+                <div class="stat-item">
+                    <div class="stat-value">7</div>
+                    <div class="stat-label">Years Running</div>
+                </div>
+                <div class="stat-item">
+                    <div class="stat-value">1000+</div>
+                    <div class="stat-label">Students Trained</div>
+                </div>
+                <div class="stat-item">
+                    <div class="stat-value">16</div>
+                    <div class="stat-label">Lectures & Labs</div>
+                </div>
+                <div class="stat-item">
+                    <div class="stat-value">18</div>
+                    <div class="stat-label">Weeks of Learning</div>
+                </div>
+            </div>
+        </section>
+
+        <section id="features" class="container">
+            <div class="section-header">
+                <h2>Why This Course?</h2>
+                <p>Build production-ready skills through hands-on practice with tools used by top tech companies worldwide.</p>
+            </div>
+            <div class="features-grid">
+                <div class="feature-card">
+                    <div class="feature-icon">&#x2601;</div>
+                    <h3>Cloud-Native Architecture</h3>
+                    <p>Master Kubernetes, Helm, StatefulSets, and container orchestration for scalable deployments.</p>
+                </div>
+                <div class="feature-card">
+                    <div class="feature-icon">&#x21BB;</div>
+                    <h3>GitOps & Automation</h3>
+                    <p>Implement ArgoCD, Argo Rollouts, and progressive delivery for safe, automated deployments.</p>
+                </div>
+                <div class="feature-card">
+                    <div class="feature-icon">&#x1F512;</div>
+                    <h3>Security & Secrets</h3>
+                    <p>Learn HashiCorp Vault, Kubernetes Secrets, and secure configuration management practices.</p>
+                </div>
+                <div class="feature-card">
+                    <div class="feature-icon">&#x1F4CA;</div>
+                    <h3>Observability</h3>
+                    <p>Build monitoring stacks with Prometheus, Grafana, Loki, and implement effective alerting.</p>
+                </div>
+                <div class="feature-card">
+                    <div class="feature-icon">&#x2699;</div>
+                    <h3>Infrastructure as Code</h3>
+                    <p>Automate infrastructure with Terraform and Ansible for reproducible environments.</p>
+                </div>
+                <div class="feature-card">
+                    <div class="feature-icon">&#x1F310;</div>
+                    <h3>Beyond Kubernetes</h3>
+                    <p>Explore edge computing with Fly.io and decentralized hosting with IPFS and 4EVERLAND.</p>
+                </div>
+            </div>
+        </section>
+
+        <section id="labs" class="container">
+            <div class="section-header">
+                <h2>Lectures & Labs</h2>
+                <p>16 lectures with corresponding hands-on labs, plus 2 bonus labs as exam alternatives.</p>
+            </div>
+            <div class="labs-grid">
+                <div class="lab-card">
+                    <div class="lab-number">01</div>
+                    <div class="lab-content">
+                        <h4>Web Application Development</h4>
+                        <p>Python/Go, Best Practices</p>
+                    </div>
+                </div>
+                <div class="lab-card">
+                    <div class="lab-number">02</div>
+                    <div class="lab-content">
+                        <h4>Containerization</h4>
+                        <p>Docker, Multi-stage Builds</p>
+                    </div>
+                </div>
+                <div class="lab-card">
+                    <div class="lab-number">03</div>
+                    <div class="lab-content">
+                        <h4>Continuous Integration</h4>
+                        <p>GitHub Actions, Snyk</p>
+                    </div>
+                </div>
+                <div class="lab-card">
+                    <div class="lab-number">04</div>
+                    <div class="lab-content">
+                        <h4>Infrastructure as Code</h4>
+                        <p>Terraform, Cloud Providers</p>
+                    </div>
+                </div>
+                <div class="lab-card">
+                    <div class="lab-number">05</div>
+                    <div class="lab-content">
+                        <h4>Configuration Management</h4>
+                        <p>Ansible Basics</p>
+                    </div>
+                </div>
+                <div class="lab-card">
+                    <div class="lab-number">06</div>
+                    <div class="lab-content">
+                        <h4>Continuous Deployment</h4>
+                        <p>Ansible Advanced</p>
+                    </div>
+                </div>
+                <div class="lab-card">
+                    <div class="lab-number">07</div>
+                    <div class="lab-content">
+                        <h4>Logging</h4>
+                        <p>Promtail, Loki, Grafana</p>
+                    </div>
+                </div>
+                <div class="lab-card">
+                    <div class="lab-number">08</div>
+                    <div class="lab-content">
+                        <h4>Monitoring</h4>
+                        <p>Prometheus, Grafana</p>
+                    </div>
+                </div>
+                <div class="lab-card">
+                    <div class="lab-number">09</div>
+                    <div class="lab-content">
+                        <h4>Kubernetes Basics</h4>
+                        <p>Minikube, Deployments, Services</p>
+                    </div>
+                </div>
+                <div class="lab-card">
+                    <div class="lab-number">10</div>
+                    <div class="lab-content">
+                        <h4>Helm Charts</h4>
+                        <p>Templating, Hooks</p>
+                    </div>
+                </div>
+                <div class="lab-card">
+                    <div class="lab-number">11</div>
+                    <div class="lab-content">
+                        <h4>Secrets Management</h4>
+                        <p>K8s Secrets, HashiCorp Vault</p>
+                    </div>
+                </div>
+                <div class="lab-card">
+                    <div class="lab-number">12</div>
+                    <div class="lab-content">
+                        <h4>Configuration & Storage</h4>
+                        <p>ConfigMaps, PVCs</p>
+                    </div>
+                </div>
+                <div class="lab-card">
+                    <div class="lab-number">13</div>
+                    <div class="lab-content">
+                        <h4>GitOps</h4>
+                        <p>ArgoCD</p>
+                    </div>
+                </div>
+                <div class="lab-card">
+                    <div class="lab-number">14</div>
+                    <div class="lab-content">
+                        <h4>Progressive Delivery</h4>
+                        <p>Argo Rollouts</p>
+                    </div>
+                </div>
+                <div class="lab-card">
+                    <div class="lab-number">15</div>
+                    <div class="lab-content">
+                        <h4>StatefulSets</h4>
+                        <p>Persistent Storage, Headless Services</p>
+                    </div>
+                </div>
+                <div class="lab-card">
+                    <div class="lab-number">16</div>
+                    <div class="lab-content">
+                        <h4>Cluster Monitoring</h4>
+                        <p>Kube-Prometheus, Init Containers</p>
+                    </div>
+                </div>
+                <div class="lab-card bonus">
+                    <div class="lab-number">17</div>
+                    <div class="lab-content">
+                        <h4>Fly.io Edge Deployment</h4>
+                        <p>Global Distribution, PaaS</p>
+                        <span class="lab-tag exam-alt">Exam Alternative</span>
+                    </div>
+                </div>
+                <div class="lab-card bonus">
+                    <div class="lab-number">18</div>
+                    <div class="lab-content">
+                        <h4>4EVERLAND & IPFS</h4>
+                        <p>Decentralized Hosting</p>
+                        <span class="lab-tag exam-alt">Exam Alternative</span>
+                    </div>
+                </div>
+            </div>
+        </section>
+
+        <section id="roadmap" class="container">
+            <div class="section-header">
+                <h2>Learning Roadmap</h2>
+                <p>A structured 16-week journey from foundations to advanced production patterns, plus 2 weeks for bonus labs or exam preparation.</p>
+            </div>
+            <div class="roadmap">
+                <div class="phase">
+                    <div class="phase-number">
+                        <span>Phase</span>
+                        <strong>1</strong>
+                    </div>
+                    <div class="phase-content">
+                        <h3>Foundations (Weeks 1-6)</h3>
+                        <p>Build core skills in containerization, CI/CD, and infrastructure automation.</p>
+                        <div class="phase-topics">
+                            <span class="topic-tag">Docker</span>
+                            <span class="topic-tag">GitHub Actions</span>
+                            <span class="topic-tag">Terraform</span>
+                            <span class="topic-tag">Ansible</span>
+                        </div>
+                    </div>
+                </div>
+                <div class="phase">
+                    <div class="phase-number">
+                        <span>Phase</span>
+                        <strong>2</strong>
+                    </div>
+                    <div class="phase-content">
+                        <h3>Observability (Weeks 7-8)</h3>
+                        <p>Master logging and monitoring for production visibility.</p>
+                        <div class="phase-topics">
+                            <span class="topic-tag">Prometheus</span>
+                            <span class="topic-tag">Grafana</span>
+                            <span class="topic-tag">Loki</span>
+                            <span class="topic-tag">Alerting</span>
+                        </div>
+                    </div>
+                </div>
+                <div class="phase">
+                    <div class="phase-number">
+                        <span>Phase</span>
+                        <strong>3</strong>
+                    </div>
+                    <div class="phase-content">
+                        <h3>Kubernetes Core (Weeks 9-12)</h3>
+                        <p>Deep dive into Kubernetes orchestration and package management.</p>
+                        <div class="phase-topics">
+                            <span class="topic-tag">Kubernetes</span>
+                            <span class="topic-tag">Helm</span>
+                            <span class="topic-tag">Secrets</span>
+                            <span class="topic-tag">ConfigMaps</span>
+                        </div>
+                    </div>
+                </div>
+                <div class="phase">
+                    <div class="phase-number">
+                        <span>Phase</span>
+                        <strong>4</strong>
+                    </div>
+                    <div class="phase-content">
+                        <h3>Advanced Patterns (Weeks 13-16)</h3>
+                        <p>Implement GitOps, progressive delivery, stateful workloads, and production monitoring.</p>
+                        <div class="phase-topics">
+                            <span class="topic-tag">ArgoCD</span>
+                            <span class="topic-tag">Argo Rollouts</span>
+                            <span class="topic-tag">StatefulSets</span>
+                            <span class="topic-tag">Vault</span>
+                        </div>
+                    </div>
+                </div>
+                <div class="phase">
+                    <div class="phase-number">
+                        <span>Bonus</span>
+                        <strong>+2</strong>
+                    </div>
+                    <div class="phase-content">
+                        <h3>Bonus Labs / Exam Prep (Weeks 17-18)</h3>
+                        <p>Complete exam alternative labs or prepare for the final exam.</p>
+                        <div class="phase-topics">
+                            <span class="topic-tag">Fly.io</span>
+                            <span class="topic-tag">IPFS</span>
+                            <span class="topic-tag">4EVERLAND</span>
+                            <span class="topic-tag">Edge Computing</span>
+                        </div>
+                    </div>
+                </div>
+            </div>
+        </section>
+
+        <section class="container">
+            <div class="cta">
+                <h2>Ready to Start Your DevOps Journey?</h2>
+                <p>Join 1000+ students who have built production-ready skills through this battle-tested curriculum.</p>
+                <a href="https://github.com/inno-devops-labs/S25-core-course-labs" class="btn btn-primary">
+                    Get Started Free &rarr;
+                </a>
+            </div>
+        </section>
+    </main>
+
+    <footer>
+        <div class="container">
+            <p>&copy; 2020&ndash;2026 DevOps Core Course. 7 years of continuous improvement. Open source educational content.</p>
+            <div class="footer-links">
+                <a href="https://github.com/inno-devops-labs/S25-core-course-labs">GitHub</a>
+                <a href="mailto:devops@example.com">Contact</a>
+            </div>
+        </div>
+    </footer>
+
+    <div class="deployed-badge">
+        <div class="icon">&#x1F310;</div>
+        <div>
+            <span>Deployed on</span><br>
+            <strong>IPFS via 4EVERLAND</strong>
+        </div>
+    </div>
+</body>
+</html>
diff --git a/labs/lab8/analysis/ref.txt b/labs/lab8/analysis/ref.txt
new file mode 100644
index 0000000000..3bcabb1889
--- /dev/null
+++ b/labs/lab8/analysis/ref.txt
@@ -0,0 +1 @@
+Using digest ref: localhost:5000/juice-shop@sha256:b029fa83327aa8a3bbcaf161af6269c18c80134942437cb90794233502554e48
diff --git a/labs/monitoring/doc/LAB07.md b/labs/monitoring/doc/LAB07.md
new file mode 100644
index 0000000000..71767a2a65
--- /dev/null
+++ b/labs/monitoring/doc/LAB07.md
@@ -0,0 +1,163 @@
+# Centralized Logging with Loki, Promtail, and Grafana
+
+## Architecture
+
+The monitoring system can be described as:
+```
+Python app (5000) -> Promtail (9080) -> Loki (3100) -> Grafana (3000)
+```
+
+This implements a complete centralized logging pipeline:
+- The web app emits its logs in JSON format
+- Promtail discovers containers via the Docker API, reads their logs, and pushes them to Loki
+- Grafana queries Loki and displays the collected logs
+
+![alt text](./img/chain.png)
+
+
+## Setup Guide
+
+```
+git clone --branch lab7 https://github.com/CacucoH/DevOps-Core-Course.git
+cd DevOps-Core-Course/labs/monitoring
+docker compose up -d
+```
+
+Then, go to `http://localhost:3000` and connect Grafana with Loki:
+**In Grafana:**
+1. Go to **Connections** → **Data sources** → **Add data source** → **Loki**
+2. URL: `http://loki:3100`
+3. Click **Save & Test** (should show "Data source connected")
+4. Navigate to **Explore** → Select **Loki** data source
+5. Query: `{job="docker"}` → You should see logs from all containers
+
+Result:
+
+![alt text](./img/grafana.png)
+
+![alt text](./img/grafana2.png)
+
+
+## Configuration
+### Promtail configuration 
+
+`auth_enabled: false` (this setting and the `common` block below belong to Loki's `config.yml`)
+- This disables authentication, so anyone who can reach Loki can send or read logs.  
+Good for testing or internal networks, but **not secure for production**.
+
+```yml
+common:
+  replication_factor: 1
+  path_prefix: /loki
+  ring:
+    kvstore:
+      store: inmemory
+```
+- replication_factor: Number of data copies. 1 = no replication
+- path_prefix: Base folder for Loki’s internal data
+- ring.kvstore.store: inmemory: Metadata (like which chunk is where) is kept in RAM. Simple but not persistent
+
+
+```yml
+docker_sd_configs:
+  - host: unix:///var/run/docker.sock
+    refresh_interval: 5s
+```
+- Promtail connects directly to Docker socket to discover any running containers and get logs
+
+```logql
+{app="testiks"}
+```
+- Labels are an efficient filtering mechanism for querying logs in Loki
+
+### Loki configuration 
+
+```yml
+server:
+  http_listen_port: 3100
+```
+- Loki listens on port 3100 for HTTP requests
+
+```yml
+common:
+  replication_factor: 1
+  path_prefix: /loki
+```
+- replication_factor: Number of data copies. 1 = no replication
+- path_prefix: Base folder for Loki’s internal data
+
+```yml
+filesystem:
+  directory: /loki/chunks
+
+tsdb_shipper:
+  active_index_directory: /loki/index
+  cache_location: /loki/index_cache
+```
+- filesystem.directory: path for actual log chunks
+- tsdb_shipper.active_index_directory: where index files are stored
+- cache_location: temporary cache for faster queries
+
+The Loki stack: application logs → Docker files → Promtail → Loki stores/indexes → Grafana displays. It provides centralized logging, label-based queries, and interactive dashboards
+
+## Application Logging
+
+I implemented JSON logging using the `logging` module. It outputs JSON messages instead of plain text.
+Each log entry is a JSON object, for example:
+
+![alt text](./img/logging.png)
+
+
+## Dashboard
+
+Several dashboards were created:
+
+For app logs
+![alt text](./img/dash1.png)
+
+```
+{app="testiks"}
+```
+
+For GET queries
+
+![alt text](./img/grafana3.png)
+```
+{app="testiks"} | json | method="GET"
+```
+
+
+Request rate graph
+```
+sum by (app) (rate({app="testiks"}[1m]))
+```
+![alt text](./img/grafana4.png)
+
+
+## Production Practices
+
+Each container has CPU and memory restrictions:
+```yaml
+deploy:
+  resources:
+    limits:
+      cpus: '1.0'
+      memory: 256M
+```
+
+This prevents resource exhaustion
+
+```yml
+- GF_SECURITY_ADMIN_PASSWORD=${GRAFANA_ADMIN_PASSWORD}
+```
+
+This prevents password leakage (it's stored in the `.env` file).
+
+## Testing
+
+![alt text](./img/runnin.png)
+
+Logs are present too:
+
+![alt text](./img/logs.png)
+
diff --git a/labs/monitoring/doc/img/chain.png b/labs/monitoring/doc/img/chain.png
new file mode 100644
index 0000000000..fd4e80714a
Binary files /dev/null and b/labs/monitoring/doc/img/chain.png differ
diff --git a/labs/monitoring/doc/img/dash1.png b/labs/monitoring/doc/img/dash1.png
new file mode 100644
index 0000000000..39c4ed0bc4
Binary files /dev/null and b/labs/monitoring/doc/img/dash1.png differ
diff --git a/labs/monitoring/doc/img/grafana.png b/labs/monitoring/doc/img/grafana.png
new file mode 100644
index 0000000000..b749ddf48c
Binary files /dev/null and b/labs/monitoring/doc/img/grafana.png differ
diff --git a/labs/monitoring/doc/img/grafana2.png b/labs/monitoring/doc/img/grafana2.png
new file mode 100644
index 0000000000..ba2bd95880
Binary files /dev/null and b/labs/monitoring/doc/img/grafana2.png differ
diff --git a/labs/monitoring/doc/img/grafana3.png b/labs/monitoring/doc/img/grafana3.png
new file mode 100644
index 0000000000..e4b6764917
Binary files /dev/null and b/labs/monitoring/doc/img/grafana3.png differ
diff --git a/labs/monitoring/doc/img/grafana4.png b/labs/monitoring/doc/img/grafana4.png
new file mode 100644
index 0000000000..7241fcb42d
Binary files /dev/null and b/labs/monitoring/doc/img/grafana4.png differ
diff --git a/labs/monitoring/doc/img/logging.png b/labs/monitoring/doc/img/logging.png
new file mode 100644
index 0000000000..94515f6354
Binary files /dev/null and b/labs/monitoring/doc/img/logging.png differ
diff --git a/labs/monitoring/doc/img/logs.png b/labs/monitoring/doc/img/logs.png
new file mode 100644
index 0000000000..5282392038
Binary files /dev/null and b/labs/monitoring/doc/img/logs.png differ
diff --git a/labs/monitoring/doc/img/runnin.png b/labs/monitoring/doc/img/runnin.png
new file mode 100644
index 0000000000..11d1f000a5
Binary files /dev/null and b/labs/monitoring/doc/img/runnin.png differ
diff --git a/labs/monitoring/docker-compose.yml b/labs/monitoring/docker-compose.yml
new file mode 100644
index 0000000000..612d0a3ae6
--- /dev/null
+++ b/labs/monitoring/docker-compose.yml
@@ -0,0 +1,107 @@
+services:
+
+  loki:  # Log store: promtail pushes to it on port 3100.
+    image: grafana/loki:3.0.0
+    command: -config.file=/etc/loki/config.yml  # Path matches the bind mount below.
+    networks:
+      - monitoring
+    ports:
+      - "3100:3100"
+    volumes:
+      - ./loki/config.yml:/etc/loki/config.yml
+      - loki-data:/loki  # Named volume declared under top-level `volumes`.
+    deploy:
+      resources:
+        limits:
+          cpus: "1.0"
+          memory: 256M
+
+
+  promtail:  # Log shipper: reads container logs and pushes them to loki.
+    image: grafana/promtail:3.0.0
+    command: -config.file=/etc/promtail/config.yml
+    depends_on:
+      - loki
+    networks:
+      - monitoring
+    ports:
+      - "9080:9080"
+    volumes:
+      - ./promtail/config.yml:/etc/promtail/config.yml
+      - /var/lib/docker/containers:/var/lib/docker/containers:ro
+      - /var/run/docker.sock:/var/run/docker.sock:ro  # Read-only Docker socket.
+    deploy:
+      resources:
+        limits:
+          cpus: "1.0"
+          memory: 256M
+
+
+  grafana:  # Dashboard UI; access requires a login now that anonymous auth is off.
+    image: grafana/grafana:12.3.1
+    ports:
+      - "3000:3000"
+    volumes:
+      - grafana-data:/var/lib/grafana
+    environment:
+      - GF_SECURITY_ADMIN_PASSWORD=${GRAFANA_ADMIN_PASSWORD}  # Interpolated by Compose (e.g. from .env).
+      - GF_AUTH_ANONYMOUS_ENABLED=false  # Anonymous Admin access would bypass the password above.
+      - GF_AUTH_ANONYMOUS_ORG_ROLE=Viewer  # Least privilege if anonymous access is ever re-enabled.
+      - GF_SECURITY_ALLOW_EMBEDDING=true
+    networks:
+      - monitoring
+    deploy:
+      resources:
+        limits:
+          cpus: '1.0'
+          memory: 256M
+
+  
+  testiks-app:
+    build: ../../ansible/app_python
+    container_name: testiks
+    labels:
+      app: "testiks"  # Becomes the `app` log label via promtail relabeling.
+      logging: "promtail"  # Opts this container in to promtail discovery.
+    networks:
+      - monitoring
+    ports:
+      - "5000:5000"
+    healthcheck:
+      test: ["CMD-SHELL", "curl -f http://localhost:5000/health || exit 1"]
+      interval: 10s
+      retries: 5
+      timeout: 5s
+    deploy:
+      resources:
+        limits:
+          cpus: "1.0"
+          memory: 256M
+
+  prometheus:
+    image: prom/prometheus:v3.9.0
+    networks:
+      - monitoring
+    ports:
+      - "9090:9090"
+    volumes:
+      - ./prometheus/prometheus.yml:/etc/prometheus/prometheus.yml
+      - prometheus-data:/prometheus
+    healthcheck:
+      test: ["CMD-SHELL", "wget --no-verbose --tries=1 --spider http://localhost:9090/-/healthy || exit 1"]
+      interval: 10s
+      retries: 5
+      timeout: 5s
+    deploy:
+      resources:
+        limits:
+          cpus: "1.0"
+          memory: 1G
+
+volumes:  # Named volumes, all with default settings.
+  grafana-data: {}
+  loki-data: {}
+  prometheus-data: {}
+
+networks:  # Single network joined by every service above.
+  monitoring: {}
\ No newline at end of file
diff --git a/labs/monitoring/loki/config.yml b/labs/monitoring/loki/config.yml
new file mode 100644
index 0000000000..949f600ae0
--- /dev/null
+++ b/labs/monitoring/loki/config.yml
@@ -0,0 +1,38 @@
+auth_enabled: false  # Authentication is disabled.
+
+server:
+  http_listen_port: 3100  # HTTP listen port.
+
+common:
+  path_prefix: /loki
+  replication_factor: 1
+  ring:
+    kvstore:
+      store: inmemory
+
+schema_config:
+  configs:
+    - from: "2024-01-01"
+      schema: v13
+      store: tsdb
+      object_store: filesystem
+      index:
+        period: 24h
+        prefix: index_
+
+storage_config:
+
+  tsdb_shipper:
+    active_index_directory: /loki/index
+    cache_location: /loki/index_cache
+
+  filesystem:
+    directory: /loki/chunks
+
+limits_config:
+  retention_period: 168h  # 168h = 7 days.
+
+compactor:
+  retention_enabled: true
+  working_directory: /loki/compactor
+  delete_request_store: filesystem
\ No newline at end of file
diff --git a/labs/monitoring/prometheus/prometheus.yml b/labs/monitoring/prometheus/prometheus.yml
new file mode 100644
index 0000000000..390098744b
--- /dev/null
+++ b/labs/monitoring/prometheus/prometheus.yml
@@ -0,0 +1,23 @@
+global:
+  evaluation_interval: 15s
+  scrape_interval: 15s
+
+scrape_configs:
+  - job_name: "prometheus"  # Prometheus scraping its own port.
+    static_configs:
+      - targets: ["localhost:9090"]
+
+  - job_name: "app"
+    metrics_path: "/metrics"
+    static_configs:
+      - targets: ["testiks-app:5000"]
+
+  - job_name: "loki"
+    metrics_path: "/metrics"
+    static_configs:
+      - targets: ["loki:3100"]
+
+  - job_name: "grafana"
+    metrics_path: "/metrics"
+    static_configs:
+      - targets: ["grafana:3000"]
\ No newline at end of file
diff --git a/labs/monitoring/promtail/config.yml b/labs/monitoring/promtail/config.yml
new file mode 100644
index 0000000000..828d1f69fd
--- /dev/null
+++ b/labs/monitoring/promtail/config.yml
@@ -0,0 +1,36 @@
+server:
+  grpc_listen_port: 0
+  http_listen_port: 9080
+
+positions:
+  filename: /tmp/positions.yaml
+
+clients:
+  - url: http://loki:3100/loki/api/v1/push
+
+scrape_configs:
+  - job_name: docker
+
+    docker_sd_configs:
+      - host: unix:///var/run/docker.sock
+        filters:  # Restrict discovery to containers labelled logging=promtail.
+          - name: label
+            values: ['logging=promtail']
+        refresh_interval: 5s
+
+    relabel_configs:
+      - target_label: container
+        source_labels: ["__meta_docker_container_name"]
+        regex: '/(.*)'  # Captures the name without its leading slash.
+
+      - target_label: image
+        source_labels: ["__meta_docker_container_image"]
+
+      - target_label: container_id
+        source_labels: ["__meta_docker_container_id"]
+
+      - target_label: app
+        source_labels: ["__meta_docker_container_label_app"]
+
+    pipeline_stages:
+      - docker: {}
\ No newline at end of file
diff --git a/lectures/lec1.md b/lectures/lec1.md
new file mode 100644
index 0000000000..00ead8aabc
--- /dev/null
+++ b/lectures/lec1.md
@@ -0,0 +1,761 @@
+# 📌 Lecture 1 — Introduction to DevOps: From Chaos to Flow
+
+## 📍 Slide 1 – 🚀 Welcome to DevOps
+
+* 🌍 **Software is eating the world** — but shipping it is hard
+* 😰 Teams struggle with slow releases, broken deploys, finger-pointing
+* 🌉 **DevOps bridges the gap** between **building** and **running** software
+* 🎯 This course: practical skills to transform how you deliver software
+
+```mermaid
+flowchart LR
+  Chaos[😱 Chaos] -->|DevOps| Flow[🌊 Flow]
+  Flow --> Value[💎 Deliver Value Faster]
+```
+
+---
+
+## 📍 Slide 2 – 🎯 What You Will Learn
+
+* ✅ Understand what DevOps is (and isn't)
+* ✅ Identify problems DevOps solves
+* ✅ Apply DevOps thinking to real scenarios
+* ✅ Map DevOps practices to your future workflow
+
+**🎓 Learning Outcomes:**
+| # | Outcome |
+|---|---------|
+| 1 | 🧠 Define DevOps and its core principles |
+| 2 | 🔍 Recognize pre-DevOps problems |
+| 3 | 🛠️ Apply DevOps solutions to scenarios |
+| 4 | 🗺️ Navigate the DevOps lifecycle |
+
+---
+
+## 📍 Slide 3 – 📋 How This Lecture Works
+
+* 📚 **Concepts + Diagrams** — visual learning
+* 🎮 **Real-world scenarios** — you decide!
+* 📝 **3 quiz checkpoints**: PRE / MID / POST
+* 🕹️ **Interactive simulation**: "DevOps as a Game"
+
+**⏱️ Lecture Structure:**
+```
+Section 0: Introduction (now)     → 📝 PRE Quiz
+Section 1: The Problem
+Section 2: What DevOps Is
+Section 3: DevOps as a Game       → 📝 MID Quiz
+Section 4: Lifecycle & Metrics
+Section 5: Real Life
+Section 6: Reflection             → 📝 POST Quiz
+```
+
+---
+
+## 📍 Slide 4 – ❓ The Big Question
+
+* 📊 **70%** of IT projects experience significant delays
+* ⏱️ Average time from code complete to production: **weeks to months**
+* 💥 Most outages caused by **changes** (deploys, configs)
+
+> 💬 *"It worked on my machine"* — Every developer, ever
+
+**🤔 Think about it:**
+* Why is software delivery so hard?
+* Why do teams fear deployments?
+* What would "good" look like?
+
+---
+
+## 📍 Slide 5 – 📝 QUIZ — DEVOPS_L1_PRE
+
+---
+
+## 📍 Slide 6 – 🔥 Section 1: The Problem Before DevOps
+
+* 👨‍💻 **Development** and ⚙️ **Operations** = separate teams, separate goals
+* 🚀 Dev wants: **ship features fast**
+* 🛡️ Ops wants: **keep systems stable**
+* 💥 Result: **conflict, blame, slow delivery**
+
+```mermaid
+flowchart LR
+  Dev[👨‍💻 Dev Team] -->|🎯 New Features| Goal1[Ship Fast]
+  Ops[⚙️ Ops Team] -->|🛡️ Stability| Goal2[Don't Break]
+  Goal1 -.->|❌ Conflict| Goal2
+```
+
+---
+
+## 📍 Slide 7 – 🧱 The Wall of Confusion
+
+* 🧱 **The Wall** = invisible barrier between Dev and Ops
+* 📦 Dev "throws code over the wall"
+* 🔥 Ops catches the blame when it breaks
+* 🔄 Ops rejects changes to avoid risk
+
+```mermaid
+flowchart LR
+  Dev[👨‍💻 Dev Team] -->|📦 Throws code over| Wall[🧱 Wall of Confusion]
+  Wall -->|🔥 Catches blame| Ops[⚙️ Ops Team]
+  Ops -->|❌ Rejects changes| Dev
+```
+
+> 🤔 **Think:** Have you seen this pattern before?
+
+---
+
+## 📍 Slide 8 – 😱 Manual Release Hell
+
+* 📅 Deployments are rare (monthly, quarterly)
+* 🎰 Each release = **high-risk event**
+* 📋 Manual steps, checklists, weekend work
+* 💀 One mistake = hours of rollback
+
+```mermaid
+flowchart TD
+  Code[✅ Code Complete] --> Wait[📅 Wait for Release Window]
+  Wait --> Manual[📋 Manual Deploy Steps]
+  Manual --> Pray[🙏 Pray It Works]
+  Pray -->|💥 Failure| Blame[👉 Blame Game]
+  Pray -->|😮‍💨 Success| Relief[Temporary Relief]
+```
+
+**📊 The Numbers:**
+* 🐢 Average release cycle: **3-6 months**
+* 📉 Success rate: **~60%**
+* ⏱️ Rollback time: **4-8 hours**
+
+---
+
+## 📍 Slide 9 – 😨 Fear and Blame Culture
+
+* 🌙 Incident happens at 2am
+* 👉 First question: *"Who did this?"*
+* 🙈 Engineers hide mistakes
+* 🚫 Nobody wants to deploy on Friday
+* 💀 Innovation stops
+
+> ⚠️ **Fear kills velocity**
+
+**😰 Signs of Blame Culture:**
+* 🔇 People afraid to speak up
+* 📝 Excessive documentation "for protection"
+* 🐌 Slow decision-making
+* 🚪 High turnover
+
+**💬 Discussion:** Why does blame make things worse?
+
+---
+
+## 📍 Slide 10 – 💸 The Cost of Chaos
+
+| 🔥 Problem | 💥 Impact |
+|------------|-----------|
+| 🐢 Slow releases | Lost market opportunity |
+| 📋 Manual processes | Human error, burnout |
+| 👉 Blame culture | Talent leaves |
+| 🙈 No visibility | Firefighting mode |
+
+**📈 Real Numbers:**
+* 🏢 **Amazon pre-DevOps**: deploys took **weeks**
+* 🚀 **Amazon post-DevOps**: deploys every **11.7 seconds**
+
+**💰 Cost of Downtime:**
+* 💵 Small business: **$427/minute**
+* 🏢 Enterprise: **$9,000/minute**
+* 🌐 Amazon: **$220,000/minute**
+
+---
+
+## 📍 Slide 11 – 💡 Section 2: What DevOps Really Is
+
+* 🤝 **DevOps** = Development + Operations working as **one team**
+* 🌱 A **culture** of collaboration and shared responsibility
+* 🔧 A set of **practices** for fast, reliable delivery
+* 🚫 NOT just tools, NOT a job title, NOT a team
+
+```mermaid
+flowchart LR
+  Dev[👨‍💻 Development] -->|🤝 Collaboration| DevOps[🚀 DevOps]
+  Ops[⚙️ Operations] -->|🤝 Collaboration| DevOps
+  DevOps --> Value[💎 Fast, Reliable Value]
+```
+
+**📖 Definition:**
+> *DevOps is a set of practices that combines software development (Dev) and IT operations (Ops) to shorten the development lifecycle while delivering features, fixes, and updates frequently in close alignment with business objectives.*
+
+---
+
+## 📍 Slide 12 – 🚫 What DevOps is NOT
+
+| ❌ Myth | ✅ Reality |
+|---------|-----------|
+| "We hired a DevOps engineer, we're done" | 👥 Everyone participates |
+| "DevOps means using Kubernetes" | 🛠️ Tools support culture |
+| "DevOps replaces developers/ops" | 🤝 It unites them |
+| "DevOps = just automation" | 🧩 Automation + Culture + Measurement |
+| "DevOps is a team" | 🌍 It's a way of working |
+
+> 🔥 **Hot take:** You can't buy DevOps. You build it.
+
+**🎯 DevOps is about:**
+* 🧠 Mindset change
+* 🤝 Breaking silos
+* 🔄 Continuous improvement
+* 📊 Data-driven decisions
+
+---
+
+## 📍 Slide 13 – 🔄 The Three Ways of DevOps
+
+```mermaid
+flowchart LR
+  W1[1️⃣ Flow] --> W2[2️⃣ Feedback]
+  W2 --> W3[3️⃣ Learning]
+  W3 --> W1
+```
+
+| 🛤️ Way | 🎯 Focus | 💡 Example |
+|--------|---------|-----------|
+| 1️⃣ **Flow** | Fast Dev → Prod | 🚀 CI/CD pipelines |
+| 2️⃣ **Feedback** | Fast Prod → Dev | 📊 Monitoring, alerts |
+| 3️⃣ **Learning** | Experiment safely | 📝 Blameless postmortems |
+
+**📚 Source:** *The Phoenix Project* by Gene Kim, Kevin Behr, and George Spafford
+
+---
+
+## 📍 Slide 14 – 🧩 The CAMS Model
+
+```mermaid
+graph TD
+  C[🌱 Culture] --> DevOps[🚀 DevOps]
+  A[🤖 Automation] --> DevOps
+  M[📊 Measurement] --> DevOps
+  S[🔗 Sharing] --> DevOps
+```
+
+* 🌱 **C = Culture** — Trust, collaboration, shared ownership
+* 🤖 **A = Automation** — Eliminate manual, error-prone work
+* 📊 **M = Measurement** — Track metrics, decide with data
+* 🔗 **S = Sharing** — Knowledge flows, blameless postmortems
+
+**🎯 Key Metrics:**
+* ⏱️ **MTTR** = Mean Time to Recovery
+* ❌ **CFR** = Change Failure Rate
+* 📦 **DF** = Deployment Frequency
+* 🚀 **LT** = Lead Time
+
+---
+
+## 📍 Slide 15 – ⚡ Before vs After DevOps
+
+| 😰 Before | 🚀 After |
+|----------|---------|
+| 📅 Releases every few months | 📆 Releases daily/weekly |
+| 📋 Manual deployments | 🤖 Automated pipelines |
+| 👉 Blame when things break | 📝 Blameless postmortems |
+| 🙅 "Not my problem" | 🤝 Shared ownership |
+| 😨 Fear of change | 💪 Embrace change |
+| 🐌 Weeks to deploy | ⚡ Minutes to deploy |
+
+> 🤔 Which column describes your current environment?
+
+---
+
+## 📍 Slide 16 – 🎮 Section 3: DevOps as a Game
+
+## 🕹️ Simulation: You're the CTO
+
+* 🏢 Welcome to **FlowStart Inc.** — a growing startup
+* 👥 You have: 5 developers, 2 ops engineers
+* 🌐 A web application with 10K users
+* 📈 Pressure to ship new features
+
+**❓ What could go wrong?**
+
+> 💀 **Everything.**
+
+🎮 **Let's play.**
+
+---
+
+## 📍 Slide 17 – 💥 Scenario 1: Release Failure
+
+**📅 Friday 5pm:**
+* 👨‍💻 Developer pushes "small fix"
+* 🚫 No tests, no review, straight to production
+* 💥 App crashes, users can't log in
+* 🤷 Nobody knows what changed
+
+```mermaid
+flowchart LR
+  Push[📤 Code Push] --> Prod[🌐 Production]
+  Prod --> Crash[💥 Crash]
+  Crash --> Panic[😱 Weekend Panic]
+```
+
+**📊 Impact:**
+* 👥 10,000 users affected
+* ⏱️ 4 hours downtime
+* 💰 $50,000 lost revenue
+* 😤 Angry customers on Twitter
+
+> ❓ **What would you do?**
+
+---
+
+## 📍 Slide 18 – ✅ Solution: CI/CD
+
+## 🛠️ Fix: Continuous Integration & Delivery
+
+```mermaid
+flowchart LR
+  Push[📤 Push] --> CI[🧪 Tests]
+  CI -->|✅ Pass| Review[👀 Review]
+  Review --> CD[🚀 Deploy]
+  CD --> Monitor[📊 Monitor]
+  CI -->|❌ Fail| Fix[🔧 Fix]
+```
+
+* ✅ Every change triggers **automated tests**
+* ✅ **Code review** required before merge
+* ✅ **Automated deployment** pipeline
+* ✅ **One-click rollback**
+
+**🎯 Result:** Deploy with confidence, not prayers
+
+**📊 CI/CD Benefits:**
+* 🐛 Catch bugs early (80% cheaper to fix)
+* 🚀 Deploy 200x more frequently
+* ⏱️ 24x faster recovery from failures
+
+---
+
+## 📍 Slide 19 – 🐾 Scenario 2: Infrastructure Drift
+
+**😰 Situation:**
+* 🖥️ Production server configured manually over 2 years
+* 👋 Ops engineer who set it up **left the company**
+* 📈 Need to scale — but **can't recreate the setup**
+
+```mermaid
+flowchart TD
+  S1[🖥️ Server 1: Ubuntu 18 + mystery configs]
+  S2[🖥️ Server 2: Ubuntu 20 + different configs]
+  S3[🖥️ Server 3: Who knows? 🤷]
+  S1 --> Drift[😱 Configuration Drift]
+  S2 --> Drift
+  S3 --> Drift
+```
+
+> 🐶🐄 **"Pets vs Cattle"** — Which do you have?
+
+**🐶 Pets:** Unique, irreplaceable, nursed back to health
+**🐄 Cattle:** Identical, replaceable, automated
+
+---
+
+## 📍 Slide 20 – ✅ Solution: Infrastructure as Code
+
+## 🛠️ Fix: IaC
+
+* 📝 Define infrastructure in **version-controlled files**
+* 🔄 Servers are **reproducible**, not unique
+* ⚡ Spin up identical environments in **minutes**
+
+```hcl
+# 🌍 Terraform example
+resource "aws_instance" "web" {
+  ami           = "ami-0c55b159cbfafe1f0"
+  instance_type = "t2.micro"
+  count         = 3  # 🔢 3 identical servers
+}
+```
+
+**🎯 Result:** Cattle, not pets. Replace, don't repair.
+
+**🛠️ IaC Tools:**
+* 🌍 **Terraform** — Multi-cloud
+* 🧩 **Ansible** — Configuration management
+* 📦 **Pulumi** — Code-based IaC
+
+---
+
+## 📍 Slide 21 – 🔓 Scenario 3: Secret Leak
+
+**💀 What happened:**
+* 👨‍💻 Developer commits database password to GitHub
+* 🤖 Bot scrapes it within **minutes**
+* 💥 Attackers access production database
+
+```mermaid
+flowchart LR
+  Commit[📤 Commit + Secret] --> GitHub[🐙 Public Repo]
+  GitHub --> Bot[🤖 Scraper Bot]
+  Bot --> Breach[💀 Database Breach]
+```
+
+> ⏱️ **How fast do bots find secrets?** Under 5 minutes.
+
+**📊 Real Stats:**
+* 🔍 GitHub scans 100M+ repos for secrets
+* ⏱️ Average time to exploit: **<1 hour**
+* 💰 Average breach cost: **$4.45 million**
+
+---
+
+## 📍 Slide 22 – ✅ Solution: Secrets Management
+
+## 🛠️ Fix: Vault & Secret Scanning
+
+* 🚫 **Never** store secrets in code
+* 🔐 Use secret management tools (Vault, AWS Secrets Manager)
+* 🔍 Pre-commit hooks scan for secrets
+* 🔄 Rotate credentials automatically
+
+```yaml
+# ❌ Bad
+password: "super_secret_123"
+
+# ✅ Good
+password: ${VAULT_DB_PASSWORD}
+```
+
+**🎯 Result:** Secrets stay secret
+
+**🛠️ Secret Tools:**
+* 🔐 **HashiCorp Vault**
+* 🔑 **AWS Secrets Manager**
+* 🔒 **Azure Key Vault**
+* 🔍 **git-secrets** (pre-commit)
+
+---
+
+## 📍 Slide 23 – 🙈 Scenario 4: Blind Operations
+
+**👥 Users report:** *"App is slow"*
+
+**🤷 Team asks:**
+* Is it? How slow?
+* Which part is slow?
+* Since when?
+* How many users affected?
+
+**😰 Answer:** No idea. No metrics. No logs. No visibility.
+
+⏱️ **Hours spent guessing.**
+
+---
+
+## 📍 Slide 24 – ✅ Solution: Observability
+
+## 🛠️ Fix: Logs, Metrics, Traces
+
+```mermaid
+graph TD
+  Logs[📋 Logs: What happened] --> Obs[🔍 Observability]
+  Metrics[📊 Metrics: How much/fast] --> Obs
+  Traces[🔗 Traces: Where] --> Obs
+  Obs --> Action[⚡ Fix in minutes, not hours]
+```
+
+| 📊 Pillar | 🛠️ Tools |
+|-----------|----------|
+| 📋 Logs | ELK, Loki, CloudWatch |
+| 📊 Metrics | Prometheus, Grafana, Datadog |
+| 🔗 Traces | Jaeger, Zipkin, X-Ray |
+
+**🎯 Result:** See problems before users report them
+
+---
+
+## 📍 Slide 25 – 📝 QUIZ — DEVOPS_L1_MID
+
+---
+
+## 📍 Slide 26 – ♾️ Section 4: DevOps Lifecycle
+
+## 🔄 The Infinity Loop
+
+* ♾️ DevOps is **continuous** — no "done" state
+* 🔄 Each stage feeds the next
+* 🔁 Forever improving
+
+```mermaid
+flowchart LR
+  Plan[📋 Plan] --> Code[💻 Code]
+  Code --> Build[🔨 Build]
+  Build --> Test[🧪 Test]
+  Test --> Release[📦 Release]
+  Release --> Deploy[🚀 Deploy]
+  Deploy --> Operate[⚙️ Operate]
+  Operate --> Monitor[📊 Monitor]
+  Monitor --> Plan
+```
+
+---
+
+## 📍 Slide 27 – 🔁 Lifecycle Phases
+
+| 📍 Phase | 🎯 Activity | 🛠️ Tools |
+|----------|------------|----------|
+| 📋 Plan | Requirements, design | Jira, GitHub Issues |
+| 💻 Code | Write & review | Git, VS Code |
+| 🔨 Build | Compile, package | Docker, npm, Maven |
+| 🧪 Test | Automated testing | pytest, Jest, Selenium |
+| 📦 Release | Version, approve | GitHub Releases, Tags |
+| 🚀 Deploy | Push to environment | ArgoCD, Ansible, Helm |
+| ⚙️ Operate | Run, scale | Kubernetes, Terraform |
+| 📊 Monitor | Observe, alert | Prometheus, Grafana |
+
+---
+
+## 📍 Slide 28 – 🗺️ Course Map
+
+## 📚 How This Course Covers the Lifecycle
+
+```mermaid
+flowchart TD
+  subgraph PlanCode["📋 Plan & Code"]
+    L1[🔬 Labs 1-3: Git, GitHub]
+  end
+  subgraph BuildTest["🔨 Build & Test"]
+    L2[🐳 Labs 4-6: Docker, CI/CD]
+  end
+  subgraph DeployOperate["🚀 Deploy & Operate"]
+    L3[☸️ Labs 7-10: K8s, Helm]
+  end
+  subgraph SecureMonitor["🔐 Secure & Monitor"]
+    L4[📊 Labs 11-15: Vault, Monitoring]
+  end
+```
+
+✅ **Every lab maps to a real DevOps skill.**
+
+---
+
+## 📍 Slide 29 – 📊 DORA Metrics
+
+## 📈 Measuring DevOps Success
+
+| 📊 Metric | 📏 Measures | 🏆 Elite |
+|-----------|------------|---------|
+| ⏱️ **Lead Time** | Commit → Prod | < 1 hour |
+| 📦 **Deploy Frequency** | How often | Multiple/day |
+| ❌ **Change Failure Rate** | % broken deploys | < 15% |
+| 🔧 **MTTR** | Recovery time | < 1 hour |
+
+> 📚 These 4 metrics predict software delivery performance.
+> *Source: DORA State of DevOps Report*
+
+**🤔 Question:** Where does your team stand?
+
+---
+
+## 📍 Slide 30 – 🌊 From Chaos to Flow
+
+## 🎯 The Goal
+
+```mermaid
+flowchart LR
+  subgraph Chaos["😱 Chaos"]
+    Manual[📋 Manual Work]
+    Silos[🧱 Silos]
+    Fear[😨 Fear]
+  end
+  subgraph Flow["🌊 Flow"]
+    Auto[🤖 Automation]
+    Collab[🤝 Collaboration]
+    Confidence[💪 Confidence]
+  end
+  Chaos -->|🚀 DevOps| Flow
+```
+
+**🎯 Flow State:**
+* ⚡ Changes flow smoothly from idea to production
+* 🔄 Feedback loops are fast
+* 📈 Teams continuously improve
+
+---
+
+## 📍 Slide 31 – 🏢 Section 5: DevOps in Real Life
+
+## 📅 A Day in DevOps
+
+**☀️ Morning:**
+* 📊 Check dashboards — all green ✅
+* 👀 Review pull requests
+* 🔀 Merge → auto-deploy
+
+**🌤️ Afternoon:**
+* 🚨 Alert: latency spike
+* 🔍 Check traces → slow DB query
+* 🔧 Fix, test, deploy — **20 min total**
+
+**🌙 Evening:**
+* 🤖 Systems run themselves
+* 🏠 Go home on time
+
+---
+
+## 📍 Slide 32 – 👥 DevOps Roles
+
+| 👤 Role | 🎯 Focus |
+|---------|---------|
+| 🔧 **DevOps Engineer** | Pipelines, automation, infra |
+| 🛡️ **SRE** | Reliability, SLOs, incidents |
+| 🏗️ **Platform Engineer** | Developer experience, internal tools |
+| ☁️ **Cloud Engineer** | Cloud infra, cost optimization |
+
+**🔗 Common thread:** Collaboration, automation, ownership
+
+**💰 Salary Range (2024):**
+* 🔧 DevOps Engineer: $100K - $180K
+* 🛡️ SRE: $120K - $200K
+* 🏗️ Platform Engineer: $130K - $220K
+
+---
+
+## 📍 Slide 33 – 🤝 Team Collaboration
+
+```mermaid
+flowchart TD
+  Dev[👨‍💻 Developers] --> Shared[🤝 Shared Ownership]
+  Ops[⚙️ Operations] --> Shared
+  QA[🧪 QA] --> Shared
+  Sec[🔐 Security] --> Shared
+  Shared --> Ship[🚀 Ship Better Software]
+```
+
+**🤝 Collaboration Practices:**
+* 📟 Shared on-call rotations
+* 📝 Blameless incident reviews
+* 👥 Cross-functional squads
+* 🔓 Everyone can deploy
+
+---
+
+## 📍 Slide 34 – 📈 Career Path
+
+```mermaid
+flowchart LR
+  Junior[🌱 Junior] --> Mid[💼 Mid-level]
+  Mid --> Senior[⭐ Senior]
+  Senior --> Staff[🏆 Staff/Principal]
+  Senior --> Manager[👔 Manager]
+  Staff --> Architect[🏛️ Architect]
+```
+
+**🛠️ Skills to Build:**
+* 🐧 Linux, networking
+* 📝 Scripting (Bash, Python)
+* 🐳 Containers & K8s
+* 🔄 CI/CD pipelines
+* ☁️ Cloud platforms (AWS, GCP, Azure)
+
+---
+
+## 📍 Slide 35 – 🌍 Real Company Examples
+
+**🎬 Netflix:**
+* 🚀 1000+ deploys/day
+* 🐒 Chaos Monkey breaks things on purpose
+* 🔄 Self-healing infrastructure
+
+**📦 Amazon:**
+* ⚡ Deploy every **11.7 seconds**
+* 🔧 "You build it, you run it"
+* 👥 Two-pizza teams
+
+**🔍 Google:**
+* 🛡️ Invented **SRE**
+* 📊 Error budgets balance speed & reliability
+* 📝 Blameless postmortems
+
+---
+
+## 📍 Slide 36 – 🎯 Section 6: Reflection
+
+## 📝 Key Takeaways
+
+1. 🧩 **DevOps = Culture + Practices + Tools**
+2. 🧱 **Break down silos** between Dev and Ops
+3. 🤖 **Automate everything** repeatable
+4. 📊 **Measure what matters** (DORA metrics)
+5. 📝 **Learn from failures**, don't assign blame
+
+> 💡 DevOps isn't a destination. It's a direction.
+
+---
+
+## 📍 Slide 37 – 🧠 The Mindset Shift
+
+| 😰 Old Mindset | 🚀 DevOps Mindset |
+|---------------|------------------|
+| 🙅 "Not my job" | 🤝 "Our responsibility" |
+| 🚫 "Don't touch prod" | 💪 "Deploy with confidence" |
+| 👉 "Who broke it?" | 🔍 "How do we prevent this?" |
+| 😨 "Change is risky" | ✅ "Small changes = less risk" |
+| 💻 "Works on my machine" | 🌍 "Works everywhere" |
+
+> ❓ Which mindset do you want?
+
+---
+
+## 📍 Slide 38 – ✅ Your Progress
+
+## 🎓 What You Now Understand
+
+* ✅ Why DevOps emerged and what it solves
+* ✅ The Three Ways and CAMS model
+* ✅ How CI/CD, IaC, and observability fit together
+* ✅ The DevOps lifecycle and how to measure it
+* ✅ Real-world application of DevOps
+
+> 🚀 **You're ready for the labs.**
+
+---
+
+## 📍 Slide 39 – 📝 QUIZ — DEVOPS_L1_POST
+
+---
+
+## 📍 Slide 40 – 🚀 What Comes Next
+
+## 📚 Next Lecture: Version Control with Git
+
+* 🐙 Git fundamentals
+* 🌿 Branching strategies
+* 🤝 Collaboration workflows
+* 💻 Hands-on: Your first pull request
+
+**🎉 Your journey has begun.**
+
+> 🌊 From chaos to flow — one commit at a time.
+
+```mermaid
+flowchart LR
+  You[👤 You] --> Skills[🛠️ DevOps Skills]
+  Skills --> Impact[💎 Real Impact]
+  Impact --> Career[🚀 Career Growth]
+```
+
+**👋 See you in the next lecture!**
+
+---
+
+## 📚 Resources & Further Reading
+
+**📕 Books:**
+* 📖 *The Phoenix Project* — Gene Kim, Kevin Behr, George Spafford
+* 📖 *The DevOps Handbook* — Gene Kim et al.
+* 📖 *Accelerate* — Nicole Forsgren, Jez Humble, Gene Kim
+
+**🔗 Links:**
+* 🌐 [DORA State of DevOps](https://dora.dev)
+* 🌐 [DevOps Roadmap](https://roadmap.sh/devops)
+* 🌐 [12 Factor App](https://12factor.net)
+
+---
diff --git a/lectures/lec10.md b/lectures/lec10.md
new file mode 100644
index 0000000000..ff30eefd3e
--- /dev/null
+++ b/lectures/lec10.md
@@ -0,0 +1,840 @@
+# 📌 Lecture 10 — Helm Package Management: Templating Kubernetes
+
+## 📍 Slide 1 – 🚀 Welcome to Helm
+
+* 🌍 **Kubernetes manifests are powerful** — but repetitive
+* 😰 Copy-pasting YAML for different environments is error-prone
+* ⛵ **Helm** = the package manager for Kubernetes
+* 🎯 This lecture: master charts, templating, and values management
+
+```mermaid
+flowchart LR
+  Manifests[📝 Raw YAML] -->|⛵ Helm| Charts[📦 Charts]
+  Charts --> Templating[🔧 Templating]
+  Templating --> Environments[🌍 Any Environment]
+```
+
+---
+
+## 📍 Slide 2 – 🎯 What You Will Learn
+
+* ✅ Understand Helm architecture and concepts
+* ✅ Create production-ready Helm charts
+* ✅ Use templating for multi-environment deployments
+* ✅ Implement lifecycle hooks for advanced scenarios
+
+**🎓 Learning Outcomes:**
+| # | Outcome |
+|---|---------|
+| 1 | 🧠 Explain charts, releases, and repositories |
+| 2 | 🔍 Create charts with proper templating |
+| 3 | 🛠️ Manage values for different environments |
+| 4 | 🗺️ Implement hooks for lifecycle management |
+
+---
+
+## 📍 Slide 3 – 📋 How This Lecture Works
+
+* 📚 **Concepts + Go templates** — hands-on focus
+* 🎮 **Real-world scenarios** — multi-environment challenges
+* 📝 **3 quiz checkpoints**: PRE / MID / POST
+* 🛠️ **Best practices**: DRY, hooks, library charts
+
+**⏱️ Lecture Structure:**
+```
+Section 0: Introduction (now)     → 📝 PRE Quiz
+Section 1: The Manifest Problem
+Section 2: Helm Fundamentals
+Section 3: Templating Deep Dive   → 📝 MID Quiz
+Section 4: Hooks & Advanced
+Section 5: Production Helm
+Section 6: Reflection             → 📝 POST Quiz
+```
+
+---
+
+## 📍 Slide 4 – ❓ The Big Question
+
+* 📊 **89%** of Kubernetes users use Helm
+* ⏱️ Managing 100+ YAML files manually is **chaos**
+* 💥 Different configs per environment = **copy-paste errors**
+
+> 💬 *"Is this the dev or prod manifest? Why are they different?"* — Every DevOps engineer
+
+**🤔 Think about it:**
+* How do you manage configs for dev, staging, and prod?
+* How do you share common patterns across applications?
+* How do you version your Kubernetes deployments?
+
+---
+
+## 📍 Slide 5 – 📝 QUIZ — DEVOPS_L10_PRE
+
+---
+
+## 📍 Slide 6 – 🔥 Section 1: The Manifest Problem
+
+* 📝 **Raw YAML** works for one environment
+* 📋 Need different values for dev, staging, prod
+* 🔧 Copy-paste → divergence → bugs
+* 💥 Result: **manifest sprawl**
+
+```mermaid
+flowchart LR
+  Base[📝 Base YAML] --> Dev[📝 Dev YAML]
+  Base --> Staging[📝 Staging YAML]
+  Base --> Prod[📝 Prod YAML]
+  Dev --> Drift1[😱 Drift]
+  Staging --> Drift2[😱 Drift]
+  Prod --> Drift3[😱 Drift]
+```
+
+---
+
+## 📍 Slide 7 – 😱 YAML Duplication
+
+* 📋 Same deployment, different image tags
+* 📊 Same service, different replicas
+* 🔧 Same ingress, different domains
+* 💀 Changes require updating multiple files
+
+```yaml
+# 😰 dev-deployment.yaml
+replicas: 1
+image: myapp:latest
+
+# 😰 staging-deployment.yaml
+replicas: 2
+image: myapp:v1.2.3
+
+# 😰 prod-deployment.yaml
+replicas: 5
+image: myapp:v1.2.3
+```
+
+**📊 The Problem:**
+* 🔍 Fix a bug? Update 3 files
+* 🆕 New field? Add to all files
+* 😰 Easy to miss one file
+
+---
+
+## 📍 Slide 8 – 🔧 Manual Substitution Problems
+
+* 📝 `sed` and `envsubst` are fragile
+* 🔍 No validation of resulting YAML
+* 📊 No understanding of Kubernetes resources
+* 💀 Silent failures
+
+> ⚠️ **sed is not a package manager**
+
+```bash
+# 😰 This is fragile
+sed -i "s/REPLICAS/3/g" deployment.yaml
+envsubst < deployment.yaml.template > deployment.yaml
+```
+
+**💬 Discussion:** How do you currently manage environment differences?
+
+---
+
+## 📍 Slide 9 – 😨 Version Chaos
+
+* 📅 "Which version is deployed in prod?"
+* 🔧 No rollback mechanism
+* 📋 No deployment history
+* 💀 Can't reproduce past deployments
+
+> ⚠️ **Without versioning, you can't roll back safely**
+
+```mermaid
+flowchart TD
+  Deploy1[📦 Deploy v1] --> Deploy2[📦 Deploy v2]
+  Deploy2 --> Deploy3[📦 Deploy v3]
+  Deploy3 --> Broken[💥 Broken!]
+  Broken --> Question[❓ What was v2?]
+```
+
+---
+
+## 📍 Slide 10 – 💸 The Cost of Manifest Sprawl
+
+| 🔥 Problem | 💥 Impact |
+|------------|-----------|
+| 🐢 Update all files | Slow, error-prone |
+| 📋 Inconsistency | "Works in dev, not prod" |
+| 👉 No history | Can't audit changes |
+| 🙈 No versioning | Risky rollbacks |
+
+**📈 Real Numbers:**
+* 🏢 **Average K8s app**: 5-20 YAML files
+* 🔄 **Environments**: 3-5 (dev, staging, prod, etc.)
+* 📊 **Total files**: 15-100 per app (without Helm)
+* ⛵ **With Helm**: 1 chart, unlimited environments
+
+---
+
+## 📍 Slide 11 – 💡 Section 2: What Helm Is
+
+* ⛵ **Package manager** for Kubernetes
+* 📦 **Charts** = packages of K8s resources
+* 🔧 **Templating** = dynamic manifest generation
+* 🔄 **Releases** = installed chart instances
+
+```mermaid
+flowchart LR
+  Chart[📦 Chart] -->|🔧 + Values| Template[🔄 Templating]
+  Template --> Manifest[📝 K8s Manifests]
+  Manifest --> Release[🚀 Release]
+```
+
+**📖 Definition:**
+> *Helm is a package manager for Kubernetes that helps you define, install, and upgrade complex Kubernetes applications using charts (packages of pre-configured resources).*
+
+---
+
+## 📍 Slide 12 – 📦 Core Concepts
+
+```mermaid
+flowchart TD
+  Chart[📦 Chart] --> Templates[📝 Templates]
+  Chart --> Values[📊 Values]
+  Chart --> ChartYaml[📋 Chart.yaml]
+  Templates -->|+| Values
+  Values --> Release[🚀 Release]
+```
+
+| 📦 Concept | 🎯 Purpose |
+|-----------|----------|
+| 📦 **Chart** | Package of K8s resources |
+| 🚀 **Release** | Installed instance of chart |
+| 📊 **Values** | Configuration parameters |
+| 📁 **Repository** | Collection of charts |
+
+---
+
+## 📍 Slide 13 – 📁 Chart Structure
+
+```
+mychart/
+├── Chart.yaml          # 📋 Chart metadata
+├── values.yaml         # 📊 Default values
+├── charts/             # 📦 Dependencies
+└── templates/          # 📝 K8s manifests
+    ├── deployment.yaml
+    ├── service.yaml
+    ├── _helpers.tpl    # 🔧 Template helpers
+    └── NOTES.txt       # 📝 Post-install notes
+```
+
+**🔑 Key Files:**
+* 📋 `Chart.yaml` — Name, version, description
+* 📊 `values.yaml` — Default configuration
+* 📝 `templates/` — Go templates for manifests
+* 🔧 `_helpers.tpl` — Reusable template snippets
+
+---
+
+## 📍 Slide 14 – 📋 Chart.yaml
+
+```yaml
+apiVersion: v2
+name: my-web-app
+description: A Helm chart for my web application
+type: application
+
+# 📊 Chart version (SemVer)
+version: 0.1.0
+
+# 📦 Application version
+appVersion: "1.0.0"
+
+# 📦 Dependencies
+dependencies:
+  - name: common
+    version: 0.1.0
+    repository: "file://../common"
+```
+
+**🔑 Important Fields:**
+* `version` — Chart version (bump when chart changes)
+* `appVersion` — Application version (your app's version)
+* `dependencies` — Other charts this depends on
+
+---
+
+## 📍 Slide 15 – ⚡ Before vs After Helm
+
+| 😰 Before | 🚀 After |
+|----------|---------|
+| 📅 Multiple YAML files per env | 📊 One values file per env |
+| 📋 Manual substitution | 🔧 Go templating |
+| 👉 No versioning | 📦 SemVer releases |
+| 😨 Risky rollbacks | 🔙 `helm rollback` |
+| 🐌 Copy-paste changes | ⚡ Single source of truth |
+| 📝 No sharing | 📁 Chart repositories |
+
+> 🤔 Ready to package your Kubernetes apps?
+
+---
+
+## 📍 Slide 16 – 🎮 Section 3: Templating Deep Dive
+
+## 🔧 Go Template Basics
+
+```yaml
+# templates/deployment.yaml
+apiVersion: apps/v1
+kind: Deployment
+metadata:
+  name: {{ .Release.Name }}-app
+  labels:
+    app: {{ .Values.appName }}
+spec:
+  replicas: {{ .Values.replicaCount }}
+  template:
+    spec:
+      containers:
+      - name: {{ .Chart.Name }}
+        image: "{{ .Values.image.repository }}:{{ .Values.image.tag }}"
+```
+
+**🔧 Template Syntax:**
+* `{{ }}` — Template action
+* `.Values` — From values.yaml
+* `.Release` — Release information
+* `.Chart` — From Chart.yaml
+
+---
+
+## 📍 Slide 17 – 📊 Values Management
+
+```yaml
+# values.yaml (defaults)
+replicaCount: 1
+appName: my-app
+
+image:
+  repository: myuser/myapp
+  tag: latest
+  pullPolicy: IfNotPresent
+
+service:
+  type: ClusterIP
+  port: 80
+
+resources:
+  limits:
+    cpu: 200m
+    memory: 256Mi
+  requests:
+    cpu: 100m
+    memory: 128Mi
+```
+
+**🔧 Override Values:**
+```bash
+# File override
+helm install myrelease ./mychart -f values-prod.yaml
+
+# Command line override
+helm install myrelease ./mychart --set replicaCount=5
+```
+
+---
+
+## 📍 Slide 18 – 🌍 Multi-Environment Values
+
+```yaml
+# values-dev.yaml
+replicaCount: 1
+image:
+  tag: latest
+resources:
+  limits:
+    cpu: 100m
+    memory: 128Mi
+
+# values-prod.yaml
+replicaCount: 5
+image:
+  tag: v1.2.3
+resources:
+  limits:
+    cpu: 500m
+    memory: 512Mi
+```
+
+**🚀 Deploy to Different Environments:**
+```bash
+# Development
+helm install myapp-dev ./mychart -f values-dev.yaml
+
+# Production
+helm install myapp-prod ./mychart -f values-prod.yaml
+```
+
+---
+
+## 📍 Slide 19 – 🔧 Template Functions
+
+```yaml
+# Using functions
+name: {{ .Values.name | lower | trunc 63 }}
+
+# Default values
+tag: {{ .Values.image.tag | default .Chart.AppVersion }}
+
+# Conditional
+{{- if .Values.ingress.enabled }}
+# ... ingress resource
+{{- end }}
+
+# Range (loop)
+{{- range .Values.env }}
+- name: {{ .name }}
+  value: {{ .value | quote }}
+{{- end }}
+```
+
+**🔧 Common Functions:**
+| 🔧 Function | 🎯 Purpose |
+|------------|----------|
+| `default` | Provide fallback value |
+| `quote` | Add quotes |
+| `lower/upper` | Case conversion |
+| `trunc` | Truncate string |
+| `include` | Include template |
+
+---
+
+## 📍 Slide 20 – 🔧 Helper Templates
+
+```yaml
+# templates/_helpers.tpl
+{{/*
+Create chart name and version as used by the chart label.
+*/}}
+{{- define "mychart.chart" -}}
+{{- printf "%s-%s" .Chart.Name .Chart.Version | replace "+" "_" | trunc 63 | trimSuffix "-" }}
+{{- end }}
+
+{{/*
+Common labels
+*/}}
+{{- define "mychart.labels" -}}
+helm.sh/chart: {{ include "mychart.chart" . }}
+app.kubernetes.io/name: {{ .Chart.Name }}
+app.kubernetes.io/instance: {{ .Release.Name }}
+app.kubernetes.io/version: {{ .Chart.AppVersion | quote }}
+app.kubernetes.io/managed-by: {{ .Release.Service }}
+{{- end }}
+```
+
+**🔧 Using Helpers:**
+```yaml
+metadata:
+  labels:
+    {{- include "mychart.labels" . | nindent 4 }}
+```
+
+---
+
+## 📍 Slide 21 – 📊 Built-in Objects
+
+```mermaid
+flowchart TD
+  Objects[📦 Built-in Objects]
+  Objects --> Values[.Values]
+  Objects --> Chart[.Chart]
+  Objects --> Release[.Release]
+  Objects --> Template[.Template]
+  Objects --> Files[.Files]
+```
+
+| 📦 Object | 🎯 Contains |
+|----------|----------|
+| `.Values` | Values from values.yaml + overrides |
+| `.Chart` | Contents of Chart.yaml |
+| `.Release` | Release name, namespace, revision |
+| `.Template` | Current template info |
+| `.Files` | Access to non-template files |
+
+---
+
+## 📍 Slide 22 – 🧪 Testing Charts
+
+```bash
+# 📋 Lint chart for errors
+helm lint ./mychart
+
+# 📝 Render templates locally
+helm template myrelease ./mychart
+
+# 🔍 Dry run against cluster
+helm install --dry-run --debug myrelease ./mychart
+
+# 📊 Show user-supplied values (add --all for computed values)
+helm get values myrelease
+
+# 📝 Show rendered manifests
+helm get manifest myrelease
+```
+
+**🧪 Testing Workflow:**
+1. 📋 `helm lint` — syntax check
+2. 📝 `helm template` — verify output
+3. 🔍 `--dry-run` — validate against cluster
+4. 🚀 `helm install` — deploy
+
+---
+
+## 📍 Slide 23 – 📊 Helm Commands
+
+```bash
+# 📦 Create new chart
+helm create mychart
+
+# 🚀 Install chart
+helm install myrelease ./mychart
+
+# 📋 List releases
+helm list
+
+# 🔄 Upgrade release
+helm upgrade myrelease ./mychart
+
+# 🔙 Rollback release
+helm rollback myrelease 1
+
+# 🗑️ Uninstall release
+helm uninstall myrelease
+
+# 📊 Show release history
+helm history myrelease
+```
+
+---
+
+## 📍 Slide 24 – 🔗 Chart Dependencies
+
+```yaml
+# Chart.yaml
+dependencies:
+  - name: postgresql
+    version: 12.0.0
+    repository: https://charts.bitnami.com/bitnami
+    condition: postgresql.enabled
+```
+
+```bash
+# Download dependencies
+helm dependency update ./mychart
+
+# Build dependencies
+helm dependency build ./mychart
+```
+
+**🔗 Dependency Features:**
+* 📦 Include other charts as sub-charts
+* 🔧 Override sub-chart values
+* 🔀 Conditional inclusion
+
+---
+
+## 📍 Slide 25 – 📝 QUIZ — DEVOPS_L10_MID
+
+---
+
+## 📍 Slide 26 – 🎣 Section 4: Lifecycle Hooks
+
+## 🎣 What Are Hooks?
+
+* 🎯 **Execute actions** at specific points
+* 📦 Run jobs before/after install/upgrade
+* 🗑️ Cleanup after completion
+* 🔧 Database migrations, tests, notifications
+
+```mermaid
+flowchart LR
+  PreInstall[🎣 pre-install] --> Install[🚀 Install]
+  Install --> PostInstall[🎣 post-install]
+```
+
+---
+
+## 📍 Slide 27 – 🎣 Hook Types
+
+| 🎣 Hook | ⏱️ When |
+|--------|--------|
+| `pre-install` | Before resources installed |
+| `post-install` | After all resources are loaded into Kubernetes |
+| `pre-upgrade` | Before upgrade |
+| `post-upgrade` | After upgrade complete |
+| `pre-delete` | Before deletion |
+| `post-delete` | After deletion |
+| `pre-rollback` | Before rollback |
+| `post-rollback` | After rollback |
+
+---
+
+## 📍 Slide 28 – 📝 Hook Example
+
+```yaml
+# templates/pre-install-job.yaml
+apiVersion: batch/v1
+kind: Job
+metadata:
+  name: {{ .Release.Name }}-pre-install
+  annotations:
+    "helm.sh/hook": pre-install
+    "helm.sh/hook-weight": "-5"
+    "helm.sh/hook-delete-policy": hook-succeeded
+spec:
+  template:
+    spec:
+      restartPolicy: Never
+      containers:
+      - name: pre-install
+        image: busybox
+        command: ['sh', '-c', 'echo Pre-install running && sleep 5']
+```
+
+**🔑 Hook Annotations:**
+* `helm.sh/hook` — Hook type
+* `helm.sh/hook-weight` — Execution order (lower first)
+* `helm.sh/hook-delete-policy` — When to delete
+
+---
+
+## 📍 Slide 29 – 🏗️ Library Charts
+
+```mermaid
+flowchart TD
+  Library[📚 Library Chart] --> App1[📦 App 1]
+  Library --> App2[📦 App 2]
+  Library --> App3[📦 App 3]
+```
+
+**📚 Library Chart:**
+* 🚫 Cannot be installed directly
+* 📝 Contains only templates
+* 🔄 Shared across multiple charts
+
+```yaml
+# Chart.yaml
+apiVersion: v2
+name: common-lib
+type: library  # 📚 Library type
+version: 0.1.0
+```
+
+---
+
+## 📍 Slide 30 – 📊 Helm Metrics
+
+| 📊 Metric | 📏 Measures | 🏆 Target |
+|-----------|------------|---------|
+| 📦 **Chart Version** | Tracking | SemVer |
+| 🔄 **Release Revision** | Upgrade count | Documented |
+| ⏱️ **Deploy Time** | Chart install | < 5 min |
+| 🧪 **Lint Errors** | Chart quality | 0 |
+
+> 📚 Version everything!
+
+**🤔 Question:** How do you track what's deployed?
+
+---
+
+## 📍 Slide 31 – 🏢 Section 5: Production Helm
+
+## 📅 A Day with Helm
+
+**☀️ Morning:**
+* 📋 Review chart PR
+* 🧪 `helm lint` and `helm template`
+* ✅ Merge changes
+
+**🌤️ Afternoon:**
+* 📊 Update values-prod.yaml
+* 🚀 `helm upgrade myapp ./mychart -f values-prod.yaml`
+* 📈 Watch rollout: `kubectl rollout status`
+
+**🌙 Evening:**
+* 💥 Issue detected
+* 🔙 `helm rollback myapp 3`
+* ⏱️ **Rollback in 30 seconds**
+
+---
+
+## 📍 Slide 32 – 👥 Team Helm Workflow
+
+| 👤 Role | 🎯 Helm Responsibility |
+|---------|----------------------|
+| 👨‍💻 **Developer** | Define values requirements |
+| 🔧 **DevOps** | Create and maintain charts |
+| 🛡️ **SRE** | Manage releases, rollbacks |
+| 📊 **Platform** | Build chart standards |
+
+**🔗 GitOps Flow:**
+```mermaid
+flowchart LR
+  PR[📝 Chart PR] --> Lint[🧪 Lint]
+  Lint --> Review[👀 Review]
+  Review --> Merge[✅ Merge]
+  Merge --> ArgoCD[🔄 ArgoCD]
+  ArgoCD --> Helm[⛵ Helm Install]
+```
+
+---
+
+## 📍 Slide 33 – 🔐 Production Best Practices
+
+```yaml
+# ✅ Good: Specific versions
+image:
+  tag: v1.2.3  # Not 'latest'
+
+# ✅ Good: Resource limits always
+resources:
+  limits:
+    cpu: 500m
+    memory: 512Mi
+
+# ✅ Good: Health probes always
+livenessProbe:
+  enabled: true
+readinessProbe:
+  enabled: true
+```
+
+**🛡️ Production Checklist:**
+* ✅ Specific image tags (not `latest`)
+* ✅ Resource limits defined
+* ✅ Health probes enabled
+* ✅ Values documented
+* ✅ Chart versioned with SemVer
+
+---
+
+## 📍 Slide 34 – 📈 Career Path: Helm Skills
+
+```mermaid
+flowchart LR
+  Junior[🌱 Junior: Using charts] --> Mid[💼 Mid: Creating charts]
+  Mid --> Senior[⭐ Senior: Library charts & standards]
+  Senior --> Principal[🏆 Principal: Chart ecosystem]
+```
+
+**🛠️ Skills to Build:**
+* 📝 Go template fluency
+* 📦 Chart design patterns
+* 🔗 Dependency management
+* 🎣 Hook implementation
+* 📁 Repository management
+
+---
+
+## 📍 Slide 35 – 🌍 Real Company Examples
+
+**🏢 Helm at Scale:**
+* 📦 **Bitnami**: 100+ production charts
+* 🔍 **Google**: GKE uses Helm internally
+* 🎬 **Netflix**: Custom chart ecosystem
+
+**☁️ Public Charts:**
+* 📊 **Prometheus**: helm-charts/prometheus
+* 📋 **Grafana**: helm-charts/grafana
+* 🐘 **PostgreSQL**: bitnami/postgresql
+
+**📊 Stats:**
+* ⛵ **10,000+** public charts
+* 📦 **89%** K8s users use Helm
+* 🏢 **Standard** for K8s packaging
+
+---
+
+## 📍 Slide 36 – 🎯 Section 6: Reflection
+
+## 📝 Key Takeaways
+
+1. ⛵ **Helm is the package manager** for Kubernetes
+2. 📦 **Charts package** related K8s resources
+3. 🔧 **Templating** enables multi-environment deploys
+4. 📊 **Values** customize without changing templates
+5. 🎣 **Hooks** handle lifecycle events
+
+> 💡 Never hardcode in templates — parametrize everything.
+
+---
+
+## 📍 Slide 37 – 🧠 The Mindset Shift
+
+| 😰 Old Mindset | ⛵ Helm Mindset |
+|---------------|------------------|
+| 🙅 "Copy YAML for each env" | 📊 "Different values, same chart" |
+| 🚫 "sed for substitution" | 🔧 "Go templates" |
+| 👉 "Manual versioning" | 📦 "SemVer releases" |
+| 😨 "Risky rollbacks" | 🔙 "helm rollback" |
+| 💻 "My chart, my rules" | 📚 "Shared libraries" |
+
+> ❓ Which mindset describes your team?
+
+---
+
+## 📍 Slide 38 – ✅ Your Progress
+
+## 🎓 What You Now Understand
+
+* ✅ Helm architecture and concepts
+* ✅ Chart creation and structure
+* ✅ Go template syntax
+* ✅ Multi-environment values management
+* ✅ Lifecycle hooks
+
+> 🚀 **You're ready for Lab 10: Helm Charts**
+
+---
+
+## 📍 Slide 39 – 📝 QUIZ — DEVOPS_L10_POST
+
+---
+
+## 📍 Slide 40 – 🚀 What Comes Next
+
+## 📚 Course Continuation
+
+* 🔐 Lab 11: Secrets with Vault
+* ⚙️ Lab 12: ConfigMaps
+* 🔄 Lab 13: ArgoCD GitOps
+* 📊 Lab 14: StatefulSets
+* 🔍 Lab 15: K8s Monitoring
+
+**🎉 You've completed the Helm fundamentals!**
+
+> ⛵ From raw YAML to packaged charts — one template at a time.
+
+```mermaid
+flowchart LR
+  You[👤 You] --> Helm[⛵ Helm Skills]
+  Helm --> Packaging[📦 K8s Packaging]
+  Packaging --> Career[🚀 Career Growth]
+```
+
+**👋 Continue your DevOps journey!**
+
+---
+
+## 📚 Resources & Further Reading
+
+**📕 Books:**
+* 📖 *Learning Helm* — Matt Butcher, Matt Farina, Josh Dolitsky
+* 📖 *Helm in Action* — Matt Palmer
+* 📖 *Kubernetes Patterns* — Bilgin Ibryam, Roland Huß
+
+**🔗 Links:**
+* 🌐 [Helm Documentation](https://helm.sh/docs/)
+* 🌐 [Chart Best Practices](https://helm.sh/docs/chart_best_practices/)
+* 🌐 [Artifact Hub](https://artifacthub.io/)
+
+---
diff --git a/lectures/lec11.md b/lectures/lec11.md
new file mode 100644
index 0000000000..779e7917bd
--- /dev/null
+++ b/lectures/lec11.md
@@ -0,0 +1,759 @@
+# 📌 Lecture 11 — Secret Management: Protecting Your Crown Jewels
+
+## 📍 Slide 1 – 🔐 Welcome to Secret Management
+
+* 🌍 **Your Helm charts are beautiful** — but where do passwords go?
+* 😰 Hardcoded secrets in code = ticking time bomb
+* 🔐 **Secret management** = keeping credentials safe AND accessible
+* 🎯 This lecture: from base64 encoding to enterprise-grade Vault
+
+```mermaid
+flowchart LR
+  Bad[😱 Hardcoded] -->|🔐 Secrets| K8s[☸️ K8s Secrets]
+  K8s -->|🏰 Enterprise| Vault[🔒 HashiCorp Vault]
+  Vault --> Secure[✅ Secure Apps]
+```
+
+---
+
+## 📍 Slide 2 – 🎯 What You Will Learn
+
+* ✅ Understand why secret management matters
+* ✅ Create and consume Kubernetes Secrets
+* ✅ Recognize the difference between encoding and encryption
+* ✅ Integrate HashiCorp Vault with Kubernetes
+
+**🎓 Learning Outcomes:**
+| # | Outcome |
+|---|---------|
+| 1 | 🧠 Explain the risks of poor secret management |
+| 2 | 🔍 Create K8s Secrets via kubectl and Helm |
+| 3 | 🛠️ Configure Vault sidecar injection |
+| 4 | 🗺️ Choose appropriate secret management strategy |
+
+---
+
+## 📍 Slide 3 – 📋 How This Lecture Works
+
+* 🔐 **Security-first mindset** — think like an attacker
+* 🎮 **Real breach scenarios** — learn from others' mistakes
+* 📝 **3 quiz checkpoints**: PRE / MID / POST
+* 🛠️ **Hands-on patterns**: Secrets, Vault, injection
+
+**⏱️ Lecture Structure:**
+```
+Section 0: Introduction           → 📝 PRE Quiz
+Section 1: The Secrets Problem
+Section 2: Kubernetes Secrets
+Section 3: Encoding vs Encryption → 📝 MID Quiz
+Section 4: HashiCorp Vault
+Section 5: Production Patterns    → 📝 POST Quiz
+```
+
+---
+
+## 📍 Slide 4 – 💀 The Big Question
+
+> 💬 *"The only truly secure system is one that is powered off, cast in a block of concrete and sealed in a lead-lined room with armed guards."* — Gene Spafford
+
+**🔥 Shocking Stats:**
+* 😱 **83%** of organizations have experienced credential theft
+* 💸 Average cost of data breach: **$4.45 million** (2023)
+* ⏱️ Average time to detect breach: **277 days**
+
+> 🤔 **Think:** How many passwords are hardcoded in YOUR projects right now?
+
+---
+
+## 📍 Slide 5 – 📝 QUIZ — DEVOPS_L11_PRE
+
+---
+
+## 📍 Slide 6 – 🔥 Section 1: The Secrets Problem
+
+* 🎯 **The Challenge:** Apps need credentials to function
+* ⚔️ **The Conflict:** Security vs Convenience
+
+```mermaid
+flowchart LR
+  subgraph 😰 Developer
+    D1[🚀 Ship Fast]
+    D2[🔧 Easy Access]
+  end
+  subgraph 🔐 Security
+    S1[🛡️ Protect Data]
+    S2[📋 Audit Access]
+  end
+  D1 <-->|⚔️ Tension| S1
+  D2 <-->|⚔️ Tension| S2
+```
+
+> 🤔 **Discussion:** Have you ever committed a password to git?
+
+---
+
+## 📍 Slide 7 – 😱 The Hardcoding Horror
+
+**❌ What developers actually do:**
+
+```python
+# ❌ BAD: Hardcoded in code
+DATABASE_URL = "postgres://admin:SuperSecret123@db.prod.com/myapp"
+API_KEY = "sk-1234567890abcdef"
+
+# ❌ BAD: In docker-compose.yml committed to git
+environment:
+  - DB_PASSWORD=MyPassword123
+```
+
+**💥 What can go wrong:**
+* 🔍 Git history is forever (even after deletion)
+* 🌍 Public repos = public secrets
+* 👥 Every developer has production passwords
+* 📝 No audit trail of who accessed what
+
+---
+
+## 📍 Slide 8 – 💥 Real Breach: Uber 2016
+
+**📰 What Happened:**
+* 😱 Developers hardcoded AWS credentials in GitHub repo
+* 🔓 Attackers found credentials, accessed S3 bucket
+* 💾 **57 million** user records stolen
+* 💸 **$148 million** settlement
+
+```mermaid
+flowchart LR
+  A[👨‍💻 Dev commits AWS keys] --> B[🔍 Attacker finds repo]
+  B --> C[🔓 Access S3 bucket]
+  C --> D[💾 57M records stolen]
+  D --> E[💸 $148M settlement]
+```
+
+> ⚠️ **Lesson:** Secrets in code = breach waiting to happen
+
+---
+
+## 📍 Slide 9 – 🔓 Environment Variables: Better but Not Enough
+
+**✅ Better than hardcoding:**
+```bash
+export DATABASE_PASSWORD="secret123"
+```
+
+**❌ Still problematic:**
+* 📋 `ps e` and `/proc/<pid>/environ` can expose env vars
+* 🐳 Docker inspect shows environment
+* 📝 No encryption at rest
+* 🔄 No rotation mechanism
+* 👥 No access control
+
+```bash
+# Anyone with access to the Docker daemon can see:
+$ docker inspect myapp | grep -A 10 "Env"
+```
+
+> 🤔 **Think:** Where do YOUR environment variables come from?
+
+---
+
+## 📍 Slide 10 – 📊 The Cost of Poor Secret Management
+
+| 🔥 Problem | 💥 Impact | 📊 Stats |
+|------------|-----------|----------|
+| 😱 Leaked credentials | 🔓 Unauthorized access | 83% of breaches |
+| 🔄 No rotation | 📅 Stale passwords | Avg age: 2+ years |
+| 👥 Shared secrets | 🕵️ No accountability | 65% share creds |
+| 📝 No audit | 🤷 Unknown access | 70% can't audit |
+
+**💡 The Solution Spectrum:**
+
+```mermaid
+flowchart LR
+  A[😱 Hardcoded] --> B[🔧 Env Vars]
+  B --> C[☸️ K8s Secrets]
+  C --> D[🔒 Vault]
+  style A fill:#ff6b6b
+  style B fill:#ffd93d
+  style C fill:#6bcb77
+  style D fill:#4d96ff
+```
+
+---
+
+## 📍 Slide 11 – ☸️ Section 2: Kubernetes Secrets
+
+**🎯 What are K8s Secrets?**
+* 📦 First-class Kubernetes objects for sensitive data
+* 🔐 Separate from ConfigMaps (security-focused)
+* 🚀 Native integration with pods
+
+```mermaid
+flowchart TD
+  Secret[🔐 Secret] --> |Volume| Pod1[📦 Pod]
+  Secret --> |Env Var| Pod2[📦 Pod]
+  Secret --> |API| Pod3[📦 Pod]
+```
+
+**📋 Secret Types:**
+* 🔑 `Opaque` — generic key-value
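+* 🐳 `kubernetes.io/dockerconfigjson` — image pull credentials (created with `kubectl create secret docker-registry`)
+* 🔒 `kubernetes.io/tls` — TLS certificates (created with `kubectl create secret tls`)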
+
+---
+
+## 📍 Slide 12 – 🛠️ Creating Secrets with kubectl
+
+**📝 From literals:**
+```bash
+kubectl create secret generic db-creds \
+  --from-literal=username=admin \
+  --from-literal=password=SuperSecret123
+```
+
+**📁 From files:**
+```bash
+kubectl create secret generic tls-cert \
+  --from-file=cert.pem \
+  --from-file=key.pem
+```
+
+**👀 Viewing secrets:**
+```bash
+kubectl get secret db-creds -o yaml
+# Data is base64 encoded
+
+# Decode:
+echo "U3VwZXJTZWNyZXQxMjM=" | base64 -d
+# Output: SuperSecret123
+```
+
+---
+
+## 📍 Slide 13 – ⚠️ The Base64 Trap
+
+> ⚠️ **Critical Understanding:** Base64 is ENCODING, not ENCRYPTION!
+
+```bash
+# Encoding (reversible by anyone):
+echo "password123" | base64
+# cGFzc3dvcmQxMjMK
+
+# Decoding (no key needed):
+echo "cGFzc3dvcmQxMjMK" | base64 -d
+# password123
+```
+
+**🔐 Encryption vs Encoding:**
+
+| 🔄 Encoding | 🔐 Encryption |
+|-------------|---------------|
+| ✅ Reversible by anyone | 🔑 Needs key to decrypt |
+| 📝 Not secure | 🔒 Mathematically secure |
+| 🚀 Fast, no overhead | ⚡ Computational cost |
+| 📦 Data format change | 🛡️ Confidentiality |
+
+---
+
+## 📍 Slide 14 – 📦 Consuming Secrets in Pods
+
+**🔧 As environment variables:**
+```yaml
+env:
+  - name: DB_PASSWORD
+    valueFrom:
+      secretKeyRef:
+        name: db-creds
+        key: password
+```
+
+**📁 As volume mount:**
+```yaml
+volumes:
+  - name: secret-volume
+    secret:
+      secretName: db-creds
+containers:
+  - volumeMounts:
+      - name: secret-volume
+        mountPath: /etc/secrets
+        readOnly: true
+```
+
+> 💡 **Best Practice:** Volume mounts are more secure than env vars (not visible in `docker inspect`)
+
+---
+
+## 📍 Slide 15 – 📊 Before vs After: Basic Secret Management
+
+| 😱 Before (Hardcoded) | ✅ After (K8s Secrets) |
+|-----------------------|------------------------|
+| 📝 Secrets in code | 📦 Secrets in K8s API |
+| 🌍 Visible in git history | 🔐 Separate from code |
+| 👥 Everyone has access | 🛡️ RBAC controls |
+| 🔄 Change = redeploy code | 🔧 Change secret only |
+| 📋 No audit trail | 📝 K8s audit logs |
+
+> 🤔 **Question:** Are K8s Secrets enough for production?
+
+---
+
+## 📍 Slide 16 – 🔒 Section 3: etcd Encryption
+
+**😰 The Problem:**
+* 🗄️ K8s stores secrets in etcd
+* 📝 By default: base64 encoded only
+* 🔓 etcd access = all secrets exposed
+
+**✅ The Solution: Encryption at Rest**
+```yaml
+apiVersion: apiserver.config.k8s.io/v1
+kind: EncryptionConfiguration
+resources:
+  - resources:
+      - secrets
+    providers:
+      - aescbc:
+          keys:
+            - name: key1
+              secret: <base64-encoded-key>
+      - identity: {}
+```
+
+---
+
+## 📍 Slide 17 – 🔐 K8s Secrets Limitations
+
+**⚠️ Still Missing:**
+* 🔄 **No automatic rotation** — manual process
+* 📊 **Limited audit** — who accessed what?
+* 🌍 **K8s-only** — what about non-K8s apps?
+* 🔑 **Static secrets** — no dynamic generation
+* 🏢 **No centralization** — per-cluster management
+
+```mermaid
+flowchart TD
+  subgraph 😰 Limitations
+    A[🔄 No Rotation]
+    B[📊 Limited Audit]
+    C[🌍 K8s Only]
+    D[🔑 Static Only]
+  end
+  E[🏰 Need: Enterprise Solution] --> F[🔒 HashiCorp Vault]
+```
+
+---
+
+## 📍 Slide 18 – 📝 QUIZ — DEVOPS_L11_MID
+
+---
+
+## 📍 Slide 19 – 🏰 Section 4: HashiCorp Vault
+
+**🎯 What is Vault?**
+* 🔐 Enterprise-grade secret management
+* 🔑 Dynamic secret generation
+* 📊 Complete audit logging
+* 🔄 Automatic rotation
+* 🌍 Platform agnostic
+
+```mermaid
+flowchart LR
+  subgraph 🏰 Vault
+    A[🔐 Secret Engine]
+    B[🔑 Auth Methods]
+    C[📋 Policies]
+    D[📊 Audit]
+  end
+  K8s[☸️ Kubernetes] --> B
+  B --> A
+  A --> Apps[📦 Applications]
+  D --> Logs[📝 Audit Logs]
+```
+
+---
+
+## 📍 Slide 20 – 🏗️ Vault Architecture
+
+```mermaid
+flowchart TD
+  subgraph 👥 Clients
+    K8s[☸️ K8s Pods]
+    CLI[💻 CLI]
+    API[🔌 API]
+  end
+  subgraph 🏰 Vault Server
+    Auth[🔑 Auth Methods]
+    Policy[📋 Policies]
+    Secrets[🔐 Secret Engines]
+    Audit[📊 Audit Device]
+  end
+  subgraph 💾 Storage
+    Backend[🗄️ Storage Backend]
+  end
+  K8s --> Auth
+  CLI --> Auth
+  API --> Auth
+  Auth --> Policy
+  Policy --> Secrets
+  Secrets --> Backend
+  Auth --> Audit
+```
+
+**🔑 Key Concepts:**
+* 🔐 **Secret Engines** — where secrets live (KV, database, PKI)
+* 🔑 **Auth Methods** — how clients authenticate
+* 📋 **Policies** — who can access what
+
+---
+
+## 📍 Slide 21 – 🔑 Vault Auth Methods
+
+| 🔑 Method | 📝 Description | 🎯 Use Case |
+|-----------|----------------|-------------|
+| ☸️ Kubernetes | Service account JWT | K8s pods |
+| 🔐 AppRole | Role ID + Secret ID | CI/CD pipelines |
+| 👤 Userpass | Username/password | Humans |
+| 🌐 OIDC | SSO integration | Enterprise SSO |
+| ☁️ AWS/GCP/Azure | Cloud IAM | Cloud workloads |
+
+**☸️ Kubernetes Auth Flow:**
+```mermaid
+sequenceDiagram
+  Pod->>Vault: JWT token (ServiceAccount)
+  Vault->>K8s API: Validate token
+  K8s API->>Vault: Token valid ✅
+  Vault->>Pod: Vault token + secrets
+```
+
+---
+
+## 📍 Slide 22 – 📋 Vault Policies
+
+**🎯 Policies control access:**
+```hcl
+# Allow read on specific path
+path "secret/data/myapp/*" {
+  capabilities = ["read", "list"]
+}
+
+# Deny access to admin secrets
+path "secret/data/admin/*" {
+  capabilities = ["deny"]
+}
+```
+
+**🛡️ Principle of Least Privilege:**
+* ✅ Apps only access their secrets
+* ✅ Read-only where possible
+* ✅ Separate policies per environment
+
+---
+
+## 📍 Slide 23 – 💉 Vault Agent Sidecar Injection
+
+**🎯 The Pattern:**
+* 📦 Vault Agent runs as sidecar container
+* 🔄 Automatically fetches and renews secrets
+* 📁 Writes secrets to shared volume
+* 🚀 App reads from filesystem
+
+```mermaid
+flowchart LR
+  subgraph 📦 Pod
+    App[🚀 App Container]
+    Agent[🔐 Vault Agent]
+    Vol[📁 Shared Volume]
+  end
+  Vault[🏰 Vault Server]
+  Agent -->|🔑 Auth| Vault
+  Vault -->|🔐 Secrets| Agent
+  Agent -->|📝 Write| Vol
+  App -->|📖 Read| Vol
+```
+
+---
+
+## 📍 Slide 24 – 🏷️ Vault Annotations
+
+**📝 Enable injection:**
+```yaml
+metadata:
+  annotations:
+    vault.hashicorp.com/agent-inject: "true"
+    vault.hashicorp.com/role: "myapp"
+    vault.hashicorp.com/agent-inject-secret-config: "secret/data/myapp/config"
+```
+
+**📁 Secrets appear at:**
+```
+/vault/secrets/config
+```
+
+**🔧 Template for custom format:**
+```yaml
+vault.hashicorp.com/agent-inject-template-config: |
+  {{- with secret "secret/data/myapp/config" -}}
+  DB_PASSWORD={{ .Data.data.password }}
+  {{- end -}}
+```
+
+---
+
+## 📍 Slide 25 – 🚀 Vault in Kubernetes: Full Flow
+
+```mermaid
+sequenceDiagram
+  participant Pod
+  participant Injector as Vault Injector
+  participant Agent as Vault Agent
+  participant Vault
+
+  Pod->>Injector: Pod created with annotations
+  Injector->>Pod: Inject sidecar container
+  Agent->>Vault: Authenticate (K8s JWT)
+  Vault->>Agent: Return Vault token
+  Agent->>Vault: Request secrets
+  Vault->>Agent: Return secrets
+  Agent->>Pod: Write to /vault/secrets/
+  Pod->>Pod: App reads secrets
+```
+
+---
+
+## 📍 Slide 26 – 🔄 Section 5: Dynamic Secrets
+
+**🎯 Static vs Dynamic:**
+
+| 🔑 Static Secrets | 🔄 Dynamic Secrets |
+|-------------------|-------------------|
+| 📝 Created manually | 🤖 Generated on-demand |
+| ♾️ Live forever | ⏱️ Short TTL |
+| 👥 Shared | 👤 Unique per request |
+| 🔄 Manual rotation | 🔄 Auto-expires |
+
+**💡 Example: Database credentials**
+```bash
+vault read database/creds/readonly
+# Key             Value
+# lease_id        database/creds/readonly/abc123
+# lease_duration  1h
+# username        v-kubernetes-readonly-xyz789
+# password        A1b2C3d4E5f6G7h8
+```
+
+---
+
+## 📍 Slide 27 – 📊 Secret Management Comparison
+
+| 🔧 Feature | 🔓 Env Vars | ☸️ K8s Secrets | 🏰 Vault |
+|------------|-------------|----------------|----------|
+| 🔐 Encryption | ❌ None | ⚠️ Optional | ✅ Always |
+| 🔄 Rotation | ❌ Manual | ❌ Manual | ✅ Auto |
+| 📊 Audit | ❌ None | ⚠️ Basic | ✅ Full |
+| 🔑 Dynamic | ❌ No | ❌ No | ✅ Yes |
+| 🌍 Multi-platform | ✅ Yes | ❌ K8s only | ✅ Yes |
+| 📈 Complexity | 🟢 Low | 🟡 Medium | 🔴 High |
+
+---
+
+## 📍 Slide 28 – 🗺️ Course Context: Where Secrets Fit
+
+```mermaid
+flowchart TD
+  subgraph 🏗️ Foundation
+    L2[📦 Lab 2: Docker]
+    L10[⛵ Lab 10: Helm]
+  end
+  subgraph 🔐 Security
+    L11[🔒 Lab 11: Secrets]
+  end
+  subgraph 📋 Config
+    L12[📁 Lab 12: ConfigMaps]
+  end
+  subgraph 🚀 Deployment
+    L13[🔄 Lab 13: ArgoCD]
+  end
+  L2 --> L10
+  L10 --> L11
+  L11 --> L12
+  L12 --> L13
+  style L11 fill:#4d96ff
+```
+
+---
+
+## 📍 Slide 29 – 📈 Security Metrics
+
+| 📊 Metric | 📝 Description | 🎯 Target |
+|-----------|----------------|-----------|
+| 🔄 Secret Age | Time since rotation | < 90 days |
+| 📊 Access Audit | % of accesses logged | 100% |
+| 🔐 Encryption | % secrets encrypted | 100% |
+| 👥 Shared Secrets | Secrets used by >1 app | 0 |
+| ⏱️ TTL Compliance | Secrets with TTL | > 80% |
+
+> 🤔 **Question:** How would you measure secret security in your organization?
+
+---
+
+## 📍 Slide 30 – ✅ Secret Management Best Practices
+
+**🛡️ The Golden Rules:**
+
+1. 🚫 **Never commit secrets** to version control
+2. 🔄 **Rotate regularly** — automate where possible
+3. 📋 **Audit everything** — know who accessed what
+4. 🔐 **Encrypt at rest** — enable etcd encryption at a minimum
+5. 👤 **Least privilege** — only what's needed
+6. ⏱️ **Short-lived** — dynamic secrets when possible
+
+```mermaid
+flowchart LR
+  A[🔐 Encrypt] --> B[🔄 Rotate]
+  B --> C[📋 Audit]
+  C --> D[👤 Least Privilege]
+  D --> A
+```
+
+---
+
+## 📍 Slide 31 – 👨‍💻 Day in the Life: Secret Management
+
+**☀️ Morning:**
+* ☕ Check Vault audit logs for anomalies
+* 🔄 Review expiring secrets dashboard
+* 📋 Approve new secret access requests
+
+**🌤️ Afternoon:**
+* 🛠️ Help dev team configure Vault injection
+* 📝 Update policies for new microservice
+* 🔐 Rotate database credentials (automated)
+
+**🌙 Evening:**
+* 📊 Review daily access report
+* 🔔 Set up alerts for unusual patterns
+* 📚 Document new secret paths
+
+---
+
+## 📍 Slide 32 – 👥 Roles & Secret Management
+
+| 👤 Role | 🔐 Secret Responsibilities |
+|---------|---------------------------|
+| 🧑‍💻 Developer | Use secrets correctly, never commit |
+| 🔧 DevOps | Configure injection, manage policies |
+| 🛡️ Security | Audit access, define requirements |
+| 🏗️ Platform | Maintain Vault infrastructure |
+| 📋 Compliance | Ensure rotation, audit trails |
+
+> 💡 **Common Thread:** Everyone shares responsibility for secrets
+
+---
+
+## 📍 Slide 33 – 🏢 Real-World: How Companies Handle Secrets
+
+**🎬 Netflix:**
+* 🔐 Custom secret management platform
+* 🔄 Automatic rotation every 24 hours
+* 📊 Real-time access monitoring
+
+**📦 Shopify:**
+* 🏰 HashiCorp Vault at scale
+* 🔑 Dynamic database credentials
+* 👤 Per-service unique credentials
+
+**🚗 Uber:**
+* 📚 Learned from 2016 breach
+* 🔐 Zero hardcoded secrets policy
+* 🤖 Automated secret scanning in CI
+
+---
+
+## 📍 Slide 34 – 🎯 Decision Framework: Choosing a Solution
+
+```mermaid
+flowchart TD
+  Start[🤔 Need Secret Management] --> Q1{Small team?<br/>Simple app?}
+  Q1 -->|Yes| K8s[☸️ K8s Secrets + etcd encryption]
+  Q1 -->|No| Q2{Multi-platform?<br/>Compliance needs?}
+  Q2 -->|Yes| Vault[🏰 HashiCorp Vault]
+  Q2 -->|No| Q3{Cloud-native only?}
+  Q3 -->|Yes| Cloud[☁️ Cloud Secret Manager]
+  Q3 -->|No| Vault
+```
+
+---
+
+## 📍 Slide 35 – 📝 Key Takeaways
+
+1. 🚫 **Never hardcode secrets** — it's a breach waiting to happen
+2. 🔄 **Base64 ≠ encryption** — K8s Secrets need etcd encryption
+3. 🏰 **Vault for enterprise** — when you need rotation, auditing, and dynamic secrets
+4. 💉 **Sidecar injection** — cleanest pattern for K8s + Vault
+5. 📋 **Audit everything** — you can't secure what you can't see
+
+> 💬 *"Security is a process, not a product."* — Bruce Schneier
+
+---
+
+## 📍 Slide 36 – 🔄 Mindset Shift
+
+| 😰 Old Mindset | 🚀 New Mindset |
+|----------------|----------------|
+| "Hardcode for convenience" | "Secrets are separate from code" |
+| "Base64 is secure enough" | "Encryption at rest is mandatory" |
+| "Rotate when breached" | "Rotate proactively and automatically" |
+| "Trust developers" | "Least privilege for everyone" |
+| "Hope nobody finds it" | "Assume breach, audit everything" |
+
+> 🤔 **Which mindset do you currently have?**
+
+---
+
+## 📍 Slide 37 – ✅ Your Progress
+
+**🎓 You can now:**
+- [x] 🧠 Explain why secret management matters
+- [x] 🔍 Create K8s Secrets via kubectl and Helm
+- [x] ⚠️ Recognize encoding vs encryption
+- [x] 🛠️ Configure Vault sidecar injection
+- [x] 🗺️ Choose appropriate secret management strategy
+
+**🚀 Ready for:** Lab 11 — Kubernetes Secrets & HashiCorp Vault
+
+---
+
+## 📍 Slide 38 – 📝 QUIZ — DEVOPS_L11_POST
+
+---
+
+## 📍 Slide 39 – 🚀 What's Next
+
+**📅 Next Lecture:** Configuration & Persistent Storage
+* 📁 ConfigMaps for non-sensitive config
+* 💾 Persistent Volumes for data
+* 🔧 Mounting strategies
+
+```mermaid
+flowchart LR
+  Now[🔐 Secrets] --> Next[📁 ConfigMaps]
+  Next --> Storage[💾 Storage]
+  Storage --> GitOps[🔄 GitOps]
+```
+
+> 💪 *"You've secured the secrets. Now let's configure everything else!"*
+
+---
+
+## 📚 Resources
+
+**📖 Books:**
+* "HashiCorp Vault: Securing Secrets" — by various authors
+* "Kubernetes Security" — by Liz Rice & Michael Hausenblas
+* "Zero Trust Networks" — by Evan Gilman & Doug Barth
+
+**🔗 Links:**
+* [Vault Documentation](https://developer.hashicorp.com/vault/docs)
+* [K8s Secrets Best Practices](https://kubernetes.io/docs/concepts/security/secrets-good-practices/)
+* [OWASP Secrets Management](https://cheatsheetseries.owasp.org/cheatsheets/Secrets_Management_Cheat_Sheet.html)
diff --git a/lectures/lec12.md b/lectures/lec12.md
new file mode 100644
index 0000000000..ef8ff54778
--- /dev/null
+++ b/lectures/lec12.md
@@ -0,0 +1,854 @@
+# 📌 Lecture 12 — Configuration & Storage: Externalizing Application State
+
+> 🎯 **From hardcoded configs to dynamic, portable applications**
+
+---
+
+## 📍 Slide 1 – 🚀 Welcome to Configuration Management
+
+Last lecture we secured our **secrets**. But what about everything else?
+
+* 🔧 **Database URLs** — different per environment
+* 📊 **Feature flags** — enable/disable features dynamically
+* 📁 **Data persistence** — where does your app store files?
+* ⚙️ **App settings** — logging levels, timeouts, cache sizes
+
+```mermaid
+flowchart LR
+  A[😰 Hardcoded Config] --> B[🔧 Externalized Config]
+  B --> C[🚀 Portable Apps]
+  C --> D[💎 Any Environment]
+```
+
+> 🎯 **Goal:** Build applications that run anywhere without code changes
+
+---
+
+## 📍 Slide 2 – 📚 Learning Outcomes
+
+By the end of this lecture, you will:
+
+| # | 🎯 Outcome |
+|---|-----------|
+| 1 | ✅ Understand the **12-Factor App** configuration principle |
+| 2 | ✅ Create and use **ConfigMaps** for non-sensitive configuration |
+| 3 | ✅ Differentiate between **ConfigMaps** and **Secrets** |
+| 4 | ✅ Understand **Persistent Volumes** and storage in Kubernetes |
+| 5 | ✅ Implement **PersistentVolumeClaims** for stateful applications |
+| 6 | ✅ Apply configuration management **best practices** |
+
+---
+
+## 📍 Slide 3 – 🗺️ Lecture Overview
+
+```
+┌─────────────────────────────────────────────────────────────┐
+│  SECTION 0: Introduction                    (Slides 1-4)   │
+├─────────────────────────────────────────────────────────────┤
+│  📝 PRE QUIZ                                (Slide 5)      │
+├─────────────────────────────────────────────────────────────┤
+│  SECTION 1: The Configuration Problem       (Slides 6-10)  │
+├─────────────────────────────────────────────────────────────┤
+│  SECTION 2: ConfigMaps Deep Dive            (Slides 11-15) │
+├─────────────────────────────────────────────────────────────┤
+│  SECTION 3: Hands-on Scenarios              (Slides 16-24) │
+├─────────────────────────────────────────────────────────────┤
+│  📝 MID QUIZ                                (Slide 25)     │
+├─────────────────────────────────────────────────────────────┤
+│  SECTION 4: Persistent Storage              (Slides 26-32) │
+├─────────────────────────────────────────────────────────────┤
+│  SECTION 5: Production Patterns             (Slides 33-37) │
+├─────────────────────────────────────────────────────────────┤
+│  📝 POST QUIZ                               (Slide 38)     │
+├─────────────────────────────────────────────────────────────┤
+│  FINAL: What's Next                         (Slide 39)     │
+└─────────────────────────────────────────────────────────────┘
+```
+
+---
+
+## 📍 Slide 4 – 🤔 The Big Question
+
+> 💬 *"Store config in the environment, not in the code."*
+> — The Twelve-Factor App
+
+**Consider this:**
+
+* 🏭 You have the **same application** running in dev, staging, and production
+* 🔧 Each environment needs **different database URLs**
+* 📊 You want to change **log levels without redeploying**
+* 💾 Your app needs to **persist user uploads** somewhere
+
+> 🤔 **Think:** How do you build ONE container image that works everywhere?
+
+---
+
+## 📍 Slide 5 – 📝 QUIZ — DEVOPS_L12_PRE
+
+---
+
+## 📍 Slide 6 – ⚠️ Section 1: The Configuration Problem
+
+**The Anti-Pattern: Hardcoded Configuration**
+
+```mermaid
+flowchart TD
+  subgraph 😰 Hardcoded
+    A[app-dev.jar] --> D1[Dev DB]
+    B[app-staging.jar] --> D2[Staging DB]
+    C[app-prod.jar] --> D3[Prod DB]
+  end
+
+  subgraph 🚀 Externalized
+    E[app.jar] --> F{Config}
+    F --> D1
+    F --> D2
+    F --> D3
+  end
+```
+
+* 😰 **Hardcoded:** Different artifact per environment
+* 🚀 **Externalized:** One artifact, configuration injected at runtime
+
+---
+
+## 📍 Slide 7 – 🔥 Pain Point 1: Environment-Specific Builds
+
+**The Problem:**
+
+```dockerfile
+# ❌ Bad: Environment-specific Dockerfile — 😱 DATABASE_URL is hardcoded!
+FROM python:3.12
+ENV DATABASE_URL=postgres://dev-server:5432/mydb
+ENV LOG_LEVEL=DEBUG
+COPY . /app
+```
+
+* 🔄 Need to **rebuild** for each environment
+* 🐛 **"Works on my machine"** — config differs
+* 🔍 Can't trace which **version** is where
+* 💀 Accidentally deploying **dev config to production**
+
+> 😱 **Horror Story:** Company deployed with `DEBUG=true` to production, logging credit card numbers
+
+---
+
+## 📍 Slide 8 – 🔥 Pain Point 2: Configuration Drift
+
+**What happens over time:**
+
+| 📅 Month | 🔧 Dev Config | 🎭 Staging Config | 🏭 Prod Config |
+|----------|---------------|-------------------|----------------|
+| January  | `timeout=30` | `timeout=30` | `timeout=30` |
+| March    | `timeout=60` | `timeout=30` | `timeout=30` |
+| June     | `timeout=60` | `timeout=45` | `timeout=30` |
+| Now      | ❓ | ❓ | 😵 Nobody knows what's deployed where |
+
+* 🔄 **Manual changes** accumulate
+* 📋 No **version control** for configuration
+* 🐛 **Staging doesn't match production** — bugs slip through
+
+---
+
+## 📍 Slide 9 – 🔥 Pain Point 3: Data Loss
+
+**Stateless containers + persistent data = 💥**
+
+```mermaid
+flowchart LR
+  A[📦 Container v1] --> B[💾 /app/uploads]
+  B --> C[🔄 Deployment]
+  C --> D[📦 Container v2]
+  D --> E[💾 /app/uploads]
+  E --> F[😱 Empty!]
+```
+
+* 📦 Containers are **ephemeral** — data inside is lost on restart
+* 💾 User uploads, databases, caches — all **gone**
+* 🔄 Rolling updates = **data loss** without proper storage
+
+> 🤔 **Discussion:** Where should container applications store their data?
+
+---
+
+## 📍 Slide 10 – 💰 The Cost of Poor Configuration
+
+| 🔥 Problem | 💥 Impact | 📊 Statistics |
+|-----------|----------|---------------|
+| Config drift | Inconsistent behavior | 62% of outages involve config changes |
+| Hardcoded secrets | Security breaches | Covered in Lecture 11! |
+| Data loss | Customer impact | Average $150K per incident |
+| Manual config | Human error | 70% of failures are human error |
+
+**Root causes of production incidents (2024 survey):**
+* 🔧 Configuration changes: **41%**
+* 📦 Code deployments: **31%**
+* 🔌 Infrastructure failures: **28%**
+
+---
+
+## 📍 Slide 11 – ✅ Section 2: ConfigMaps to the Rescue
+
+**What is a ConfigMap?**
+
+* 📋 Kubernetes object that stores **non-confidential** configuration data
+* 🔑 Key-value pairs or **entire files**
+* 🔄 Decouples configuration from container images
+* ⚡ Can be updated **without rebuilding** the application
+
+```mermaid
+flowchart LR
+  A[📋 ConfigMap] --> B[📦 Pod]
+  A --> C[📦 Pod]
+  A --> D[📦 Pod]
+
+  E[🔐 Secret] --> B
+  E --> C
+  E --> D
+```
+
+> 💡 **Key Insight:** ConfigMaps for config, Secrets for sensitive data
+
+---
+
+## 📍 Slide 12 – 🚫 ConfigMaps: What They're NOT
+
+| 🚫 Myth | ✅ Reality |
+|---------|----------|
+| ConfigMaps are secure | ❌ Stored in plain text in etcd |
+| ConfigMaps replace Secrets | ❌ Use Secrets for sensitive data |
+| ConfigMaps auto-reload apps | ❌ Apps must implement hot-reload |
+| ConfigMaps have no size limit | ❌ Limited to 1MB per ConfigMap |
+
+> ⚠️ **Warning:** Never store passwords, tokens, or keys in ConfigMaps!
+
+**When to use which:**
+
+| 📋 ConfigMap | 🔐 Secret |
+|-------------|----------|
+| Database URLs (without password) | Database passwords |
+| Feature flags | API keys |
+| Log levels | TLS certificates |
+| Application settings | OAuth tokens |
+
+---
+
+## 📍 Slide 13 – 🛠️ Creating ConfigMaps
+
+**Method 1: From literal values**
+```bash
+kubectl create configmap app-config \
+  --from-literal=LOG_LEVEL=INFO \
+  --from-literal=CACHE_TTL=3600
+```
+
+**Method 2: From a file**
+```bash
+kubectl create configmap nginx-config \
+  --from-file=nginx.conf
+```
+
+**Method 3: From YAML manifest**
+```yaml
+apiVersion: v1
+kind: ConfigMap
+metadata:
+  name: app-config
+data:
+  LOG_LEVEL: "INFO"
+  DATABASE_HOST: "postgres.default.svc"
+  config.yaml: |
+    server:
+      port: 8080
+      timeout: 30s
+```
+
+---
+
+## 📍 Slide 14 – 🔌 Consuming ConfigMaps
+
+**Option 1: Environment Variables**
+```yaml
+# ✅ Individual keys
+env:
+  - name: LOG_LEVEL
+    valueFrom:
+      configMapKeyRef:
+        name: app-config
+        key: LOG_LEVEL
+
+# ✅ All keys at once
+envFrom:
+  - configMapRef:
+      name: app-config
+```
+
+**Option 2: Volume Mounts (for files)**
+```yaml
+volumes:
+  - name: config-volume
+    configMap:
+      name: nginx-config
+volumeMounts:
+  - name: config-volume
+    mountPath: /etc/nginx/nginx.conf
+    subPath: nginx.conf
+```
+
+---
+
+## 📍 Slide 15 – 📊 Before vs After: Configuration
+
+| 📋 Aspect | 😰 Before (Hardcoded) | 🚀 After (ConfigMaps) |
+|----------|----------------------|----------------------|
+| Build per environment | Yes, multiple images | No, one image |
+| Change config | Rebuild & redeploy | Update ConfigMap |
+| Version control | In code (scattered) | Centralized, declarative |
+| Environment parity | Difficult | Easy |
+| Rollback | Redeploy old image | Apply old ConfigMap |
+| Audit trail | Git history (code) | K8s + Git history |
+
+> 🤔 **Think:** What configuration in your applications could be externalized?
+
+---
+
+## 📍 Slide 16 – 🎮 Section 3: Let's Simulate!
+
+**Scenario:** You're a DevOps engineer at **CloudMart** 🛒
+
+Your application:
+* 🐍 Python/Go web service
+* 📊 Needs different configs per environment
+* 💾 Stores user uploads
+* 🔧 Frequently changes feature flags
+
+**What could go wrong?** Everything! Let's fix it.
+
+---
+
+## 📍 Slide 17 – 💥 Scenario 1: Wrong Environment Config
+
+**Situation:** Developer accidentally deploys with staging database URL to production
+
+```mermaid
+flowchart LR
+  A[👨‍💻 Dev pushes] --> B[🔄 CI/CD]
+  B --> C[📦 Deploy to Prod]
+  C --> D[🔗 Connects to Staging DB]
+  D --> E[😱 Production reads staging data!]
+```
+
+* 😱 **Impact:** Customers see test data
+* ⏱️ **Detection time:** 2 hours
+* 💰 **Cost:** Lost sales, reputation damage
+
+> 🤔 **Question:** How do we prevent this?
+
+---
+
+## 📍 Slide 18 – ✅ Solution 1: Environment-Specific ConfigMaps
+
+**Fix:** Namespace-isolated ConfigMaps
+
+```yaml
+# configmap-prod.yaml
+apiVersion: v1
+kind: ConfigMap
+metadata:
+  name: app-config
+  namespace: production  # 🔑 Namespace isolation
+data:
+  DATABASE_HOST: "prod-db.internal"
+  ENVIRONMENT: "production"
+---
+# configmap-staging.yaml
+apiVersion: v1
+kind: ConfigMap
+metadata:
+  name: app-config
+  namespace: staging
+data:
+  DATABASE_HOST: "staging-db.internal"
+  ENVIRONMENT: "staging"
+```
+
+* ✅ **Same ConfigMap name**, different namespaces
+* ✅ Pods can only reference ConfigMaps in their **own namespace** — environments can't be mixed up
+* ✅ **GitOps friendly** — config in version control
+
+---
+
+## 📍 Slide 19 – 💥 Scenario 2: Config Change Causes Outage
+
+**Situation:** Changed `CACHE_TTL` from 3600 to 36 (typo!) — cache expires every 36 seconds
+
+```mermaid
+flowchart TD
+  A[⌨️ Typo: 3600 → 36] --> B[📋 ConfigMap Updated]
+  B --> C[📦 Pods reload config]
+  C --> D[🔥 Cache thrashing]
+  D --> E[💀 Database overloaded]
+  E --> F[😱 Site down!]
+```
+
+* 😱 **Impact:** 30-minute outage
+* 🔍 **Root cause:** No validation, no review
+
+---
+
+## 📍 Slide 20 – ✅ Solution 2: Immutable ConfigMaps + Versioning
+
+**Fix:** Treat ConfigMaps as immutable, version them
+
+```yaml
+apiVersion: v1
+kind: ConfigMap
+metadata:
+  name: app-config-v3  # 🔑 Versioned name
+  labels:
+    version: "3"
+immutable: true  # 🔒 Cannot be modified
+data:
+  CACHE_TTL: "3600"
+```
+
+**Deployment references specific version:**
+```yaml
+envFrom:
+  - configMapRef:
+      name: app-config-v3  # 🔑 Explicit version
+```
+
+* ✅ **Rollback** = change reference to previous version
+* ✅ **Audit trail** — which version when
+* ✅ **Validation** in CI/CD before applying
+
+---
+
+## 📍 Slide 21 – 💥 Scenario 3: User Uploads Disappear
+
+**Situation:** Deployment rolls out new pods, user uploads are gone
+
+```mermaid
+flowchart TD
+  A[📦 Pod v1] --> B[💾 /app/uploads]
+  B --> C[📸 User uploads photo]
+  C --> D[🔄 Rolling Update]
+  D --> E[📦 Pod v2]
+  E --> F[💾 /app/uploads - Empty!]
+  F --> G[😱 User: Where's my photo?!]
+```
+
+* 💾 Container filesystem is **ephemeral**
+* 🔄 New container = **fresh filesystem**
+* 😱 All data is **lost**
+
+---
+
+## 📍 Slide 22 – ✅ Solution 3: Persistent Volumes
+
+**Fix:** External storage that survives pod restarts
+
+```yaml
+apiVersion: v1
+kind: PersistentVolumeClaim
+metadata:
+  name: uploads-pvc
+spec:
+  accessModes:
+    - ReadWriteOnce
+  resources:
+    requests:
+      storage: 10Gi
+---
+# In Deployment
+volumes:
+  - name: uploads
+    persistentVolumeClaim:
+      claimName: uploads-pvc
+volumeMounts:
+  - name: uploads
+    mountPath: /app/uploads
+```
+
+```mermaid
+flowchart LR
+  A[📦 Pod v1] --> B[💾 PVC]
+  C[📦 Pod v2] --> B
+  D[📦 Pod v3] --> B
+  B --> E[🗄️ Persistent Storage]
+```
+
+---
+
+## 📍 Slide 23 – 💥 Scenario 4: ConfigMap Update Not Applied
+
+**Situation:** Updated ConfigMap, but app still uses old values
+
+```mermaid
+flowchart LR
+  A[📋 ConfigMap Updated] --> B[📦 Pod still running]
+  B --> C[⚠️ Using old config!]
+  C --> D[🤔 Why isn't it working?]
+```
+
+* 🔄 ConfigMap updates **don't automatically restart** pods
+* 📦 Env vars and `subPath` mounts keep the values from pod start; regular volume mounts refresh only after a sync delay
+
+---
+
+## 📍 Slide 24 – ✅ Solution 4: Config Reload Strategies
+
+**Strategy 1: Restart Deployment**
+```bash
+kubectl rollout restart deployment/myapp
+```
+
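+**Strategy 2: Use a hash annotation on the pod template (Helm, GitOps-friendly)**
+```yaml
+metadata:  # under spec.template — a changed hash triggers a rolling update
+  annotations:
+    checksum/config: {{ .Values.config | toYaml | sha256sum | quote }}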
+```
+
+**Strategy 3: App-level hot reload**
+* 📂 Mount ConfigMap as volume
+* 👀 Watch for file changes
+* 🔄 Reload configuration in-memory
+
+**Strategy 4: Reloader controller**
+* 🤖 Automatically restarts pods when ConfigMap changes
+* 📦 `stakater/reloader` — popular open source solution
+
+---
+
+## 📍 Slide 25 – 📝 QUIZ — DEVOPS_L12_MID
+
+---
+
+## 📍 Slide 26 – 💾 Section 4: Persistent Storage Deep Dive
+
+**The Storage Stack in Kubernetes:**
+
+```mermaid
+flowchart TD
+  A[📦 Pod] --> B[📁 Volume Mount]
+  B --> C[💾 PersistentVolumeClaim]
+  C --> D[🗄️ PersistentVolume]
+  D --> E[☁️ Storage Backend]
+
+  F[📋 StorageClass] -.-> C
+  F -.-> D
+```
+
+* 📦 **Pod:** Uses the storage via mount
+* 💾 **PVC:** Request for storage ("I need 10GB")
+* 🗄️ **PV:** Actual storage resource
+* ☁️ **Backend:** AWS EBS, GCE PD, NFS, local disk
+* 📋 **StorageClass:** Template for dynamic provisioning
+
+---
+
+## 📍 Slide 27 – 📋 Storage Concepts Breakdown
+
+| 🔧 Concept | 📝 Description | 🎯 Analogy |
+|-----------|---------------|-----------|
+| **PersistentVolume (PV)** | A piece of storage in the cluster | A physical hard drive |
+| **PersistentVolumeClaim (PVC)** | A request for storage | "I need a 100GB drive" |
+| **StorageClass** | Template for provisioning | "Give me SSD storage" |
+| **Access Modes** | How pods can access | ReadWriteOnce, ReadWriteMany |
+| **Reclaim Policy** | What happens when PVC deleted | Retain, Delete (Recycle is deprecated) |
+
+**Access Modes:**
+* 🔒 **ReadWriteOnce (RWO):** One node can mount read-write
+* 📖 **ReadOnlyMany (ROX):** Many nodes can mount read-only
+* 📝 **ReadWriteMany (RWX):** Many nodes can mount read-write
+
+---
+
+## 📍 Slide 28 – 🔄 Dynamic Provisioning
+
+**Without Dynamic Provisioning (Manual):**
+```mermaid
+flowchart LR
+  A[👨‍💻 Admin creates PV] --> B[📋 PV available]
+  B --> C[👨‍💻 Dev creates PVC]
+  C --> D[🔗 PVC binds to PV]
+```
+
+**With Dynamic Provisioning (Automatic):**
+```mermaid
+flowchart LR
+  A[👨‍💻 Dev creates PVC] --> B[📋 StorageClass]
+  B --> C[🤖 Auto-create PV]
+  C --> D[🔗 PVC binds to PV]
+```
+
+```yaml
+apiVersion: storage.k8s.io/v1
+kind: StorageClass
+metadata:
+  name: fast-ssd
+provisioner: kubernetes.io/gce-pd  # Cloud-specific
+parameters:
+  type: pd-ssd
+reclaimPolicy: Delete
+volumeBindingMode: WaitForFirstConsumer
+```
+
+---
+
+## 📍 Slide 29 – ⚠️ Storage Pitfalls
+
+| ⚠️ Pitfall | 💥 Impact | ✅ Solution |
+|-----------|----------|------------|
+| Wrong access mode | Pod scheduling fails | Match mode to use case |
+| No storage class | PVC pending forever | Set default StorageClass |
+| Reclaim = Delete | Data lost on PVC delete | Use Retain for important data |
+| Zone mismatch | Pod can't mount volume | Use topology-aware provisioning |
+| Insufficient capacity | PVC pending | Monitor storage usage |
+
+**Common error:**
+```
+Warning  FailedScheduling  pod has unbound immediate PersistentVolumeClaims
+```
+
+> 🔍 **Debug:** `kubectl describe pvc <name>` — check events
+
+---
+
+## 📍 Slide 30 – 📊 Volume Types Comparison
+
+| 📦 Volume Type | 🎯 Use Case | ⚡ Performance | 💰 Cost |
+|---------------|------------|---------------|--------|
+| **emptyDir** | Temp data, cache | Fast (node storage) | Free |
+| **hostPath** | Node-specific data | Fast | Free |
+| **NFS** | Shared storage | Medium | Varies |
+| **Cloud (EBS, PD)** | Production workloads | Configurable | $$$ |
+| **Local PV** | Databases, high IOPS | Very fast | Node-dependent |
+
+**Decision tree:**
+```mermaid
+flowchart TD
+  A[Need persistent storage?] --> |No| B[emptyDir]
+  A --> |Yes| C[Shared across pods?]
+  C --> |No| D[Cloud Block Storage]
+  C --> |Yes| E[NFS or Cloud File Storage]
+```
+
+---
+
+## 📍 Slide 31 – 🔧 Practical PVC Example
+
+**Complete example for a web application:**
+
+```yaml
+apiVersion: v1
+kind: PersistentVolumeClaim
+metadata:
+  name: app-uploads
+spec:
+  accessModes:
+    - ReadWriteOnce
+  storageClassName: standard
+  resources:
+    requests:
+      storage: 5Gi
+---
+apiVersion: apps/v1
+kind: Deployment
+metadata:
+  name: webapp
+spec:
+  template:
+    spec:
+      containers:
+        - name: app
+          volumeMounts:
+            - name: uploads
+              mountPath: /app/uploads
+      volumes:
+        - name: uploads
+          persistentVolumeClaim:
+            claimName: app-uploads
+```
+
+---
+
+## 📍 Slide 32 – 📈 Storage Lifecycle
+
+```mermaid
+stateDiagram-v2
+  [*] --> Pending: PVC Created
+  Pending --> Bound: PV Available
+  Bound --> Released: PVC Deleted
+  Released --> Available: Reclaim
+  Released --> [*]: Delete Policy
+
+  note right of Pending: Waiting for PV
+  note right of Bound: In use
+  note right of Released: Data still exists
+```
+
+**Key states:**
+* ⏳ **Pending:** Waiting for matching PV
+* ✅ **Bound:** PVC matched to PV
+* 🔓 **Released:** PVC deleted, PV still has data
+* ❌ **Failed:** Automatic reclamation of the PV failed
+
+---
+
+## 📍 Slide 33 – 🏭 Section 5: Production Patterns
+
+**Pattern 1: GitOps Configuration Management**
+
+```mermaid
+flowchart LR
+  A[📝 Git Repo] --> B[🔄 ArgoCD]
+  B --> C[📋 ConfigMaps]
+  B --> D[🔐 Secrets]
+  B --> E[📦 Deployments]
+
+  C --> F[🎯 Cluster]
+  D --> F
+  E --> F
+```
+
+* 📋 **All configuration in Git** — single source of truth
+* 🔄 **ArgoCD syncs** to cluster
+* 🔍 **Audit trail** — who changed what, when
+* ↩️ **Rollback** — `git revert`
+
+---
+
+## 📍 Slide 34 – 🔧 Pattern 2: Environment Hierarchy
+
+**Kustomize for environment-specific configs:**
+
+```
+base/
+  ├── deployment.yaml
+  ├── service.yaml
+  └── configmap.yaml
+overlays/
+  ├── dev/
+  │   └── kustomization.yaml
+  ├── staging/
+  │   └── kustomization.yaml
+  └── prod/
+      └── kustomization.yaml
+```
+
+```yaml
+# overlays/prod/kustomization.yaml
+resources:
+  - ../../base
+configMapGenerator:
+  - name: app-config
+    literals:
+      - LOG_LEVEL=WARN
+      - REPLICAS=5
+```
+
+* ✅ **DRY** — Don't Repeat Yourself
+* ✅ **Environment-specific** overrides
+* ✅ **Consistent** base configuration
+
+---
+
+## 📍 Slide 35 – 🔐 Pattern 3: Secrets + ConfigMaps Together
+
+**Combining Secrets and ConfigMaps:**
+
+```yaml
+spec:
+  containers:
+    - name: app
+      env:
+        # 📋 From ConfigMap (non-sensitive)
+        - name: DATABASE_HOST
+          valueFrom:
+            configMapKeyRef:
+              name: app-config
+              key: DATABASE_HOST
+        # 🔐 From Secret (sensitive)
+        - name: DATABASE_PASSWORD
+          valueFrom:
+            secretKeyRef:
+              name: app-secrets
+              key: db-password
+```
+
+**Best Practice:**
+* 📋 **ConfigMap:** URLs, ports, feature flags
+* 🔐 **Secret:** Passwords, tokens, certificates
+* 🔒 **Never mix** sensitive and non-sensitive data
+
+---
+
+## 📍 Slide 36 – 📊 Configuration Best Practices
+
+| 🔧 Practice | 📝 Description |
+|------------|---------------|
+| **Version ConfigMaps** | Include version in name (`app-config-v2`) |
+| **Use namespaces** | Isolate environments (dev, staging, prod) |
+| **Validate in CI** | Check config syntax before deploy |
+| **Document defaults** | What happens if config missing? |
+| **Monitor changes** | Alert on ConfigMap updates |
+| **Limit size** | Keep ConfigMaps under 1MB |
+| **Use labels** | Tag configs with app, version, environment |
+
+---
+
+## 📍 Slide 37 – 🎯 Key Takeaways
+
+1. 📋 **ConfigMaps** separate configuration from code — one image, any environment
+2. 🔐 **ConfigMaps ≠ Secrets** — never store sensitive data in ConfigMaps
+3. 💾 **PVCs** provide persistent storage that survives pod restarts
+4. 🔄 **Dynamic provisioning** automates storage management
+5. 📁 **Version your configs** — treat them like code
+6. 🏭 **GitOps** — configuration in Git is the source of truth
+
+> 💬 *"Configuration belongs in the environment, not the artifact."*
+> — 12-Factor App
+
+---
+
+## 📍 Slide 38 – 📝 QUIZ — DEVOPS_L12_POST
+
+---
+
+## 📍 Slide 39 – 🚀 What's Next?
+
+**Coming up: Lecture 13 — GitOps with ArgoCD**
+
+```mermaid
+flowchart LR
+  A[📝 Git] --> B[🔄 ArgoCD]
+  B --> C[☸️ Kubernetes]
+  C --> D[🎯 Desired State]
+```
+
+* 🔄 **Continuous Deployment** automated
+* 📝 **Git as single source of truth**
+* 🔍 **Drift detection** and auto-sync
+* ↩️ **Easy rollbacks** with git revert
+
+> 🎯 **Lab 12:** Apply these concepts — create ConfigMaps, use PVCs, externalize your app configuration!
+
+---
+
+## 📚 Resources
+
+**Documentation:**
+* 📖 [Kubernetes ConfigMaps](https://kubernetes.io/docs/concepts/configuration/configmap/)
+* 📖 [Persistent Volumes](https://kubernetes.io/docs/concepts/storage/persistent-volumes/)
+* 📖 [12-Factor App — Config](https://12factor.net/config)
+
+**Tools:**
+* 🔧 [Kustomize](https://kustomize.io/)
+* 🔧 [Reloader](https://github.com/stakater/Reloader)
+
+**Books:**
+* 📕 *Kubernetes Patterns* by Bilgin Ibryam & Roland Huß
+* 📕 *Cloud Native DevOps with Kubernetes* by John Arundel & Justin Domingus
diff --git a/lectures/lec13.md b/lectures/lec13.md
new file mode 100644
index 0000000000..370ae7821a
--- /dev/null
+++ b/lectures/lec13.md
@@ -0,0 +1,830 @@
+# 📌 Lecture 13 — GitOps with ArgoCD: Git as the Source of Truth
+
+> 🎯 **From manual deployments to automated, auditable, self-healing infrastructure**
+
+---
+
+## 📍 Slide 1 – 🚀 Welcome to GitOps
+
+We've learned to store configuration in **ConfigMaps** and **Secrets**. But who deploys them?
+
+* 👨‍💻 **Manual kubectl?** — "Who ran that command?"
+* 🔄 **CI/CD pipeline?** — Push-based, fragile
+* 🤔 **What about drift?** — Reality vs desired state
+
+```mermaid
+flowchart LR
+  A[😰 Manual Deploys] --> B[🔄 CI/CD Push]
+  B --> C[🚀 GitOps Pull]
+  C --> D[💎 Self-healing Infrastructure]
+```
+
+> 🎯 **Goal:** Git becomes the single source of truth for your entire infrastructure
+
+---
+
+## 📍 Slide 2 – 📚 Learning Outcomes
+
+By the end of this lecture, you will:
+
+| # | 🎯 Outcome |
+|---|-----------|
+| 1 | ✅ Understand **GitOps principles** and benefits |
+| 2 | ✅ Differentiate **push vs pull** deployment models |
+| 3 | ✅ Deploy applications using **ArgoCD** |
+| 4 | ✅ Configure **sync policies** and **auto-healing** |
+| 5 | ✅ Handle **secrets** in GitOps workflows |
+| 6 | ✅ Implement **multi-environment** deployments |
+
+---
+
+## 📍 Slide 3 – 🗺️ Lecture Overview
+
+```
+┌─────────────────────────────────────────────────────────────┐
+│  SECTION 0: Introduction                    (Slides 1-4)   │
+├─────────────────────────────────────────────────────────────┤
+│  📝 PRE QUIZ                                (Slide 5)      │
+├─────────────────────────────────────────────────────────────┤
+│  SECTION 1: The Deployment Problem          (Slides 6-10)  │
+├─────────────────────────────────────────────────────────────┤
+│  SECTION 2: GitOps Principles               (Slides 11-15) │
+├─────────────────────────────────────────────────────────────┤
+│  SECTION 3: ArgoCD in Action                (Slides 16-24) │
+├─────────────────────────────────────────────────────────────┤
+│  📝 MID QUIZ                                (Slide 25)     │
+├─────────────────────────────────────────────────────────────┤
+│  SECTION 4: Advanced Patterns               (Slides 26-32) │
+├─────────────────────────────────────────────────────────────┤
+│  SECTION 5: Production GitOps               (Slides 33-37) │
+├─────────────────────────────────────────────────────────────┤
+│  📝 POST QUIZ                               (Slide 38)     │
+├─────────────────────────────────────────────────────────────┤
+│  FINAL: What's Next                         (Slide 39)     │
+└─────────────────────────────────────────────────────────────┘
+```
+
+---
+
+## 📍 Slide 4 – 🤔 The Big Question
+
+> 💬 *"If it's not in Git, it doesn't exist."*
+> — GitOps Mantra
+
+**Consider this scenario:**
+
+* 🌙 **3 AM alert:** Production is down
+* 🔍 **Investigation:** Someone changed a deployment
+* ❓ **Questions:** Who? When? What changed? How to rollback?
+* 😱 **Answer:** Nobody knows...
+
+> 🤔 **Think:** How do we ensure every change is tracked, auditable, and reversible?
+
+---
+
+## 📍 Slide 5 – 📝 QUIZ — DEVOPS_L13_PRE
+
+---
+
+## 📍 Slide 6 – ⚠️ Section 1: The Deployment Problem
+
+**Traditional Deployment Models:**
+
+```mermaid
+flowchart TD
+  subgraph 😰 Manual
+    A[👨‍💻 Developer] --> B[⌨️ kubectl apply]
+    B --> C[☸️ Cluster]
+  end
+
+  subgraph 🔄 CI/CD Push
+    D[📝 Git Push] --> E[🔧 CI Pipeline]
+    E --> F[⌨️ kubectl apply]
+    F --> G[☸️ Cluster]
+  end
+```
+
+* 😰 **Manual:** No audit trail, human error, inconsistent
+* 🔄 **CI/CD Push:** Better, but the pipeline must store cluster credentials and needs direct cluster access
+
+---
+
+## 📍 Slide 7 – 🔥 Pain Point 1: The "It Works on My Machine" Problem
+
+**Symptoms:**
+
+* 👨‍💻 **Dev:** "I deployed it, it's working!"
+* 🏭 **Prod:** "It's completely broken!"
+* 🔍 **Investigation:** Configs don't match
+
+```mermaid
+flowchart LR
+  A[👨‍💻 Local kubectl] --> B[🎭 Staging]
+  C[👨‍💻 Different kubectl] --> D[🏭 Production]
+  B --> E[😵 Different States]
+  D --> E
+```
+
+* 🔧 **No single source of truth**
+* 📋 **Manual processes** lead to drift
+* 😱 **"Emergency fixes"** bypass procedures
+
+---
+
+## 📍 Slide 8 – 🔥 Pain Point 2: Configuration Drift
+
+**Drift:** When actual state ≠ desired state
+
+| 📅 Time | 📝 Git (Desired) | ☸️ Cluster (Actual) | 😱 Drift |
+|---------|------------------|---------------------|----------|
+| Day 1 | replicas: 3 | replicas: 3 | ✅ None |
+| Day 5 | replicas: 3 | replicas: 5 (scaled manually) | ⚠️ Drift! |
+| Day 10 | replicas: 3 | replicas: 5, extra env var | 🔥 More drift! |
+| Day 30 | 🤷 Unknown | 🤷 Unknown | 💀 Chaos |
+
+**Real impact:**
+* 🔄 **Deployments fail** because actual state differs
+* 📋 **Documentation lies** — cluster is reality
+* 🔍 **Debugging nightmare** — which version is deployed?
+
+---
+
+## 📍 Slide 9 – 🔥 Pain Point 3: Credential Sprawl
+
+**Push-based CI/CD security concerns:**
+
+```mermaid
+flowchart TD
+  A[🔐 Cluster Credentials] --> B[📦 CI Server]
+  A --> C[💻 Dev Machines]
+  A --> D[🔧 Scripts]
+  A --> E[📋 Pipeline Configs]
+
+  B --> F[😱 Breach Vector]
+  C --> F
+  D --> F
+  E --> F
+```
+
+* 🔐 **Credentials everywhere** — CI servers, dev machines
+* 🎯 **Attack surface** expands with each tool
+* 🔑 **Shared secrets** — who has access?
+
+---
+
+## 📍 Slide 10 – 💰 The Cost of Manual Deployments
+
+| 🔥 Problem | 💥 Impact | 📊 Data |
+|-----------|----------|---------|
+| No audit trail | Compliance failures | 73% fail audits without GitOps |
+| Manual errors | Outages | 70% of outages are human error |
+| Credential sprawl | Security breaches | Average breach cost: $4.45M |
+| Slow recovery | Downtime | MTTR 4x longer without GitOps |
+
+> 💬 *"The cost of a breach is not the breach itself, but the inability to respond quickly."*
+
+---
+
+## 📍 Slide 11 – ✅ Section 2: GitOps Principles
+
+**What is GitOps?**
+
+* 📝 **Git as single source of truth** — declarative desired state
+* 🔄 **Continuous reconciliation** — actual → desired
+* 🔀 **Pull-based deployment** — agent pulls from Git
+* 🔒 **Immutable, auditable** — every change tracked
+
+```mermaid
+flowchart LR
+  A[📝 Git Repo] --> |Pull| B[🤖 ArgoCD Agent]
+  B --> |Reconcile| C[☸️ Cluster]
+  C --> |Report Status| B
+```
+
+> 💡 **Key Insight:** The cluster pulls changes from Git, so no cluster credentials ever leave the cluster!
+
+---
+
+## 📍 Slide 12 – 🚫 GitOps: What It's NOT
+
+| 🚫 Myth | ✅ Reality |
+|---------|----------|
+| Just using Git for YAML files | A complete operational model with reconciliation |
+| Another CI/CD tool | Continuous deployment, not continuous integration |
+| Only for Kubernetes | Works for any declarative infrastructure |
+| Complicated to adopt | Can start simple, grow incrementally |
+
+> 🔥 **Hot take:** "Putting YAML in Git is not GitOps. GitOps is about the reconciliation loop."
+
+**The Four Principles (from OpenGitOps):**
+1. 📝 **Declarative** — Desired state expressed declaratively
+2. 🔄 **Versioned and Immutable** — Stored in Git
+3. 🤖 **Pulled Automatically** — Agents pull desired state
+4. ♾️ **Continuously Reconciled** — Agents ensure actual = desired
+
+---
+
+## 📍 Slide 13 – 🔄 Push vs Pull Deployment
+
+```mermaid
+flowchart TD
+  subgraph 🔄 Push Model
+    A[📝 Git] --> B[🔧 CI/CD]
+    B --> |Push credentials needed| C[☸️ Cluster]
+  end
+
+  subgraph 🚀 Pull Model - GitOps
+    D[📝 Git] --> |Pull| E[🤖 Agent in Cluster]
+    E --> |Apply| F[☸️ Same Cluster]
+  end
+```
+
+| 📋 Aspect | 🔄 Push | 🚀 Pull (GitOps) |
+|----------|--------|------------------|
+| Credentials | CI needs cluster creds | Agent has local access |
+| Drift detection | None | Continuous |
+| Audit trail | CI logs (external) | Git history |
+| Recovery | Re-run pipeline | Automatic reconciliation |
+
+---
+
+## 📍 Slide 14 – 🛠️ GitOps Tools Landscape
+
+| 🛠️ Tool | 📝 Description | ⭐ Best For |
+|---------|---------------|------------|
+| **ArgoCD** | Declarative GitOps for K8s | Most Kubernetes use cases |
+| **Flux** | Toolkit approach, CNCF project | Composable, extensible setups |
+| **Jenkins X** | CI/CD + GitOps combined | Jenkins-heavy organizations |
+| **Rancher Fleet** | Multi-cluster GitOps | Managing many clusters |
+
+**Why ArgoCD?**
+* 🎯 Most adopted (70%+ of GitOps users)
+* 🖥️ Excellent UI for visualization
+* 🔧 Rich feature set out of the box
+* 📚 Large community, good documentation
+
+---
+
+## 📍 Slide 15 – 📊 Before vs After: Deployment
+
+| 📋 Aspect | 😰 Before (Manual/Push) | 🚀 After (GitOps) |
+|----------|-------------------------|-------------------|
+| Change process | kubectl, scripts, pipelines | Git PR → merge → auto-sync |
+| Audit trail | Scattered logs | Complete Git history |
+| Rollback | "Which version was before?" | `git revert` |
+| Drift | Undetected until failure | Detected immediately |
+| Credentials | Spread across tools | Stay in cluster |
+| Recovery | Manual intervention | Self-healing |
+
+> 🤔 **Think:** How would GitOps have helped in your last deployment issue?
+
+---
+
+## 📍 Slide 16 – 🎮 Section 3: ArgoCD in Action
+
+**ArgoCD Architecture:**
+
+```mermaid
+flowchart TD
+  A[📝 Git Repository] --> B[🤖 ArgoCD Server]
+  B --> C[🔄 Application Controller]
+  C --> D[☸️ Kubernetes API]
+  E[👨‍💻 User] --> F[🖥️ ArgoCD UI / CLI]
+  F --> B
+  D --> C
+```
+
+**Components:**
+* 🖥️ **API Server:** UI, CLI, webhook endpoints
+* 🔄 **Application Controller:** Reconciliation engine
+* 📦 **Repository Server:** Caches Git repos, renders manifests
+* 🔗 **Dex:** SSO authentication (optional)
+
+---
+
+## 📍 Slide 17 – 💥 Scenario 1: First ArgoCD Deployment
+
+**Situation:** Deploy your first application with ArgoCD
+
+```yaml
+# Application manifest
+apiVersion: argoproj.io/v1alpha1
+kind: Application
+metadata:
+  name: my-app
+  namespace: argocd
+spec:
+  project: default
+  source:
+    repoURL: https://github.com/org/app-manifests
+    path: environments/dev
+    targetRevision: main
+  destination:
+    server: https://kubernetes.default.svc
+    namespace: dev
+```
+
+```mermaid
+flowchart LR
+  A[📝 Create App] --> B[🔄 ArgoCD Syncs]
+  B --> C[📦 Resources Created]
+  C --> D[✅ App Running]
+```
+
+---
+
+## 📍 Slide 18 – ✅ Solution 1: Understanding Sync
+
+**Sync States:**
+
+| 🔄 State | 📝 Meaning | 🎯 Action |
+|----------|-----------|----------|
+| **Synced** | Cluster matches Git | ✅ Good! |
+| **OutOfSync** | Cluster differs from Git | 🔄 Sync needed |
+| **Unknown** | Can't determine state | 🔍 Check connection |
+| **Missing** | Resources defined in Git don't exist in the cluster yet (ArgoCD reports this as a *health* status) | 🔄 Initial sync |
+
+**Health States:**
+
+| 💚 Health | 📝 Meaning |
+|----------|-----------|
+| **Healthy** | All resources running correctly |
+| **Progressing** | Resources being updated |
+| **Degraded** | Some resources have issues |
+| **Suspended** | Manually paused |
+
+---
+
+## 📍 Slide 19 – 💥 Scenario 2: Handling Drift
+
+**Situation:** Someone manually changed replicas in the cluster
+
+```mermaid
+flowchart TD
+  A[📝 Git: replicas=3] --> B[🤖 ArgoCD]
+  C[👨‍💻 kubectl scale replicas=5] --> D[☸️ Cluster]
+  B --> |Detects| E[⚠️ OutOfSync]
+  E --> |Auto-sync enabled| F[🔄 Restore to 3]
+```
+
+**ArgoCD detects drift immediately!**
+* 🔍 **Visibility:** Shows exactly what differs
+* 🔄 **Options:** Manual sync or auto-sync
+* 📋 **Audit:** Who changed Git matters, not who ran kubectl
+
+---
+
+## 📍 Slide 20 – ✅ Solution 2: Sync Policies
+
+**Configure automatic reconciliation:**
+
+```yaml
+spec:
+  syncPolicy:
+    automated:
+      prune: true        # Delete resources not in Git
+      selfHeal: true     # Revert manual changes
+    syncOptions:
+      - CreateNamespace=true
+      - PruneLast=true
+```
+
+**Options explained:**
+* 🔄 **automated:** Enable auto-sync on Git changes
+* 🗑️ **prune:** Delete resources removed from Git
+* 💚 **selfHeal:** Revert manual cluster changes
+* 📦 **CreateNamespace:** Create namespace if missing
+
+---
+
+## 📍 Slide 21 – 💥 Scenario 3: Multi-Environment Deployment
+
+**Situation:** Same app, different configs for dev/staging/prod
+
+```
+repo/
+├── base/
+│   ├── deployment.yaml
+│   └── service.yaml
+└── overlays/
+    ├── dev/
+    │   └── kustomization.yaml
+    ├── staging/
+    │   └── kustomization.yaml
+    └── prod/
+        └── kustomization.yaml
+```
+
+```mermaid
+flowchart TD
+  A[📝 Git Repo] --> B[🤖 ArgoCD]
+  B --> C[📦 App-Dev]
+  B --> D[📦 App-Staging]
+  B --> E[📦 App-Prod]
+  C --> F[☸️ Dev Cluster]
+  D --> G[☸️ Staging Cluster]
+  E --> H[☸️ Prod Cluster]
+```
+
+---
+
+## 📍 Slide 22 – ✅ Solution 3: ApplicationSet
+
+**Deploy to multiple environments with one definition:**
+
+```yaml
+apiVersion: argoproj.io/v1alpha1
+kind: ApplicationSet
+metadata:
+  name: my-app
+spec:
+  generators:
+    - list:
+        elements:
+          - env: dev
+            namespace: dev
+          - env: staging
+            namespace: staging
+          - env: prod
+            namespace: prod
+  template:
+    metadata:
+      name: 'my-app-{{env}}'
+    spec:
+      source:
+        repoURL: https://github.com/org/manifests
+        path: 'overlays/{{env}}'
+      destination:
+        namespace: '{{namespace}}'
+```
+
+---
+
+## 📍 Slide 23 – 💥 Scenario 4: Secrets in GitOps
+
+**Problem:** Secrets shouldn't be in Git... but GitOps needs everything in Git!
+
+```mermaid
+flowchart TD
+  A[🔐 Secret] --> B{Where to store?}
+  B --> |❌ Plain Git| C[😱 Security breach]
+  B --> |✅ Encrypted| D[🔒 Sealed Secrets]
+  B --> |✅ External| E[🔐 Vault + ESO]
+```
+
+**The dilemma:**
+* 📝 GitOps: Everything in Git
+* 🔐 Security: Secrets NOT in Git
+* 🤔 How to reconcile?
+
+---
+
+## 📍 Slide 24 – ✅ Solution 4: Secrets Management Patterns
+
+**Option 1: Sealed Secrets**
+```yaml
+apiVersion: bitnami.com/v1alpha1
+kind: SealedSecret
+metadata:
+  name: my-secret
+spec:
+  encryptedData:
+    password: AgBghY8... # Encrypted, safe to commit!
+```
+
+**Option 2: External Secrets Operator + Vault**
+```yaml
+apiVersion: external-secrets.io/v1beta1
+kind: ExternalSecret
+metadata:
+  name: my-secret
+spec:
+  secretStoreRef:
+    name: vault-backend
+  target:
+    name: my-secret
+  data:
+    - secretKey: password
+      remoteRef:
+        key: app/database
+        property: password
+```
+
+* ✅ **Encrypted in Git** (Sealed Secrets)
+* ✅ **Reference only in Git** (External Secrets)
+
+---
+
+## 📍 Slide 25 – 📝 QUIZ — DEVOPS_L13_MID
+
+---
+
+## 📍 Slide 26 – 🔧 Section 4: Advanced ArgoCD Patterns
+
+**Sync Waves & Hooks:**
+
+```yaml
+metadata:
+  annotations:
+    argocd.argoproj.io/sync-wave: "1"  # Order of deployment
+    argocd.argoproj.io/hook: PreSync   # Run before main sync
+```
+
+```mermaid
+flowchart LR
+  A[🔄 PreSync Hooks] --> B[📦 Wave 0]
+  B --> C[📦 Wave 1]
+  C --> D[📦 Wave 2]
+  D --> E[✅ PostSync Hooks]
+```
+
+**Use cases:**
+* 📊 **Database migrations** before app deploy
+* 🧹 **Cleanup jobs** after deployment
+* 🔍 **Health checks** between phases
+
+---
+
+## 📍 Slide 27 – 🔄 Sync Options Deep Dive
+
+| 🔧 Option | 📝 Purpose |
+|----------|-----------|
+| `Replace` | Replace instead of apply (for immutable fields) |
+| `PruneLast` | Delete resources after all others sync |
+| `ApplyOutOfSyncOnly` | Only apply changed resources |
+| `ServerSideApply` | Use server-side apply (K8s 1.22+) |
+| `FailOnSharedResource` | Fail if resource owned by another app |
+
+```yaml
+syncPolicy:
+  syncOptions:
+    - CreateNamespace=true
+    - PrunePropagationPolicy=foreground
+    - PruneLast=true
+```
+
+---
+
+## 📍 Slide 28 – 🏗️ Repository Structure Patterns
+
+**Pattern 1: Monorepo**
+```
+repo/
+├── apps/
+│   ├── app1/
+│   └── app2/
+└── infrastructure/
+    ├── prometheus/
+    └── argocd/
+```
+
+**Pattern 2: Repo per App**
+```
+app1-config/     # App 1 manifests
+app2-config/     # App 2 manifests
+infrastructure/  # Shared infra
+```
+
+**Pattern 3: Environment Repos**
+```
+dev-cluster/     # All dev apps
+prod-cluster/    # All prod apps
+```
+
+> 💡 **Recommendation:** Start with monorepo, split when it gets complex
+
+---
+
+## 📍 Slide 29 – 📊 ArgoCD Metrics & Monitoring
+
+**Key metrics to watch:**
+
+| 📊 Metric | 📝 Meaning | ⚠️ Alert When |
+|----------|-----------|--------------|
+| `argocd_app_sync_total` | Total syncs | Unusually high |
+| `argocd_app_info` (`health_status` label) | App health | Not healthy |
+| `argocd_app_reconcile` | Reconciliation duration (histogram) | > 5 minutes |
+| `argocd_cluster_api_resource_objects` | Total objects | Growing unexpectedly |
+
+**Dashboard integration:**
+* 📊 Grafana dashboards available
+* 🔔 Alertmanager integration
+* 📝 Slack/Teams notifications
+
+---
+
+## 📍 Slide 30 – 🔐 RBAC & Multi-tenancy
+
+**ArgoCD RBAC:**
+
+```yaml
+# argocd-rbac-cm ConfigMap
+policy.csv: |
+  p, role:dev-team, applications, get, dev-project/*, allow
+  p, role:dev-team, applications, sync, dev-project/*, allow
+  p, role:ops-team, applications, *, */*, allow
+
+  g, dev-group, role:dev-team
+  g, ops-group, role:ops-team
+```
+
+**Projects for isolation:**
+```yaml
+apiVersion: argoproj.io/v1alpha1
+kind: AppProject
+metadata:
+  name: dev-project
+spec:
+  sourceRepos:
+    - 'https://github.com/org/dev-*'
+  destinations:
+    - namespace: 'dev-*'
+      server: https://kubernetes.default.svc
+```
+
+---
+
+## 📍 Slide 31 – 🚨 Disaster Recovery
+
+**Git is your backup!**
+
+```mermaid
+flowchart TD
+  A[💀 Cluster Gone] --> B[🆕 New Cluster]
+  B --> C[📦 Install ArgoCD]
+  C --> D[🔗 Connect to Git]
+  D --> E[🔄 Sync All Apps]
+  E --> F[✅ Fully Restored]
+```
+
+**Recovery steps:**
+1. 🆕 Create new cluster
+2. 📦 Install ArgoCD
+3. 🔗 Point to Git repository
+4. ☕ Wait for sync
+5. ✅ Everything restored!
+
+> 💡 **Key insight:** If Git has everything, recovery is just a sync away
+
+---
+
+## 📍 Slide 32 – 📋 GitOps Workflow Summary
+
+```mermaid
+flowchart TD
+  A[👨‍💻 Developer] --> |PR| B[📝 Git Repo]
+  B --> |Review| C[✅ Merge]
+  C --> |Webhook| D[🤖 ArgoCD]
+  D --> |Sync| E[☸️ Cluster]
+  E --> |Status| D
+  D --> |Notify| F[💬 Slack]
+
+  G[🔍 Drift Detection] --> D
+  D --> |Self-heal| E
+```
+
+**The complete loop:**
+1. 📝 **Change:** Developer creates PR
+2. 👀 **Review:** Team reviews and approves
+3. 🔀 **Merge:** Changes merge to main
+4. 🤖 **Detect:** ArgoCD detects new commit
+5. 🔄 **Sync:** Resources deployed to cluster
+6. 💚 **Verify:** Health checks pass
+7. 📢 **Notify:** Team informed of deployment
+
+---
+
+## 📍 Slide 33 – 🏭 Section 5: Production GitOps
+
+**Enterprise Patterns:**
+
+```mermaid
+flowchart TD
+  subgraph Git
+    A[📝 Feature Branch] --> B[📝 Main Branch]
+    B --> C[📝 Release Branch]
+  end
+
+  subgraph ArgoCD
+    D[🤖 Dev App] --> E[🤖 Staging App]
+    E --> F[🤖 Prod App]
+  end
+
+  B --> D
+  C --> F
+```
+
+* 🔀 **Branch strategy:** Main for dev, release for prod
+* 🎯 **Progressive delivery:** Dev → Staging → Prod
+* ✅ **Promotion:** PR from main to release
+
+---
+
+## 📍 Slide 34 – 🏢 Real-World GitOps: Intuit
+
+**Case Study: Intuit's GitOps Journey**
+
+* 📊 **Scale:** 2,000+ applications
+* 🔄 **Deployments:** 500+ per day
+* ⏱️ **MTTR:** Reduced by 80%
+
+**What they learned:**
+* 📋 Start small, grow incrementally
+* 🔧 Standardize templates early
+* 👥 Train teams on Git workflows
+* 📊 Monitor everything
+
+> 💬 *"GitOps turned our deployment from a ceremony into a non-event."* — Intuit Engineer
+
+---
+
+## 📍 Slide 35 – 🔧 Migration Strategy
+
+**Adopting GitOps incrementally:**
+
+```mermaid
+flowchart LR
+  A[1️⃣ Non-critical app] --> B[2️⃣ Dev environment]
+  B --> C[3️⃣ More apps]
+  C --> D[4️⃣ Staging]
+  D --> E[5️⃣ Production]
+```
+
+**Phases:**
+1. 🧪 **Pilot:** One non-critical app in dev
+2. 📚 **Learn:** Document patterns, train team
+3. 📦 **Expand:** More apps, still dev
+4. 🎭 **Staging:** Full staging environment
+5. 🏭 **Production:** Controlled rollout
+
+---
+
+## 📍 Slide 36 – 🎯 Key Takeaways
+
+1. 📝 **Git is the source of truth** — not the cluster, not CI/CD
+2. 🔄 **Pull > Push** — credentials stay in cluster
+3. 💚 **Self-healing** — drift is detected and corrected
+4. 🔍 **Complete audit trail** — git log is your history
+5. ↩️ **Easy rollback** — `git revert` reverts infrastructure
+6. 🔐 **Secrets need special handling** — Sealed Secrets or External Secrets
+
+> 💬 *"Operations by Pull Request"*
+> — Alexis Richardson, Weaveworks
+
+---
+
+## 📍 Slide 37 – 🧠 Mindset Shift
+
+| 😰 Old Mindset | 🚀 New Mindset |
+|---------------|----------------|
+| "I'll just kubectl this" | "Let me create a PR" |
+| "The cluster is truth" | "Git is truth" |
+| "We need cluster access" | "We need Git access" |
+| "Rollback is scary" | "Rollback is git revert" |
+| "Who changed what?" | "Check git log" |
+| "Emergency fix!" | "Emergency PR with fast review" |
+
+> 🤔 **Question:** Which mindset do you operate with today?
+
+---
+
+## 📍 Slide 38 – 📝 QUIZ — DEVOPS_L13_POST
+
+---
+
+## 📍 Slide 39 – 🚀 What's Next?
+
+**Coming up: Lecture 14 — Progressive Delivery with Argo Rollouts**
+
+```mermaid
+flowchart LR
+  A[📦 v1] --> B[🚀 Canary 10%]
+  B --> C[🚀 Canary 50%]
+  C --> D[🚀 Full Rollout]
+```
+
+* 🐤 **Canary deployments** — test with small traffic
+* 🔵 **Blue-green deployments** — instant switchover
+* 📊 **Automated analysis** — metrics-driven promotion
+* ↩️ **Automatic rollback** — on failure
+
+> 🎯 **Lab 13:** Set up ArgoCD and deploy your application using GitOps!
+
+---
+
+## 📚 Resources
+
+**Documentation:**
+* 📖 [ArgoCD Docs](https://argo-cd.readthedocs.io/)
+* 📖 [OpenGitOps](https://opengitops.dev/)
+* 📖 [Sealed Secrets](https://sealed-secrets.netlify.app/)
+* 📖 [External Secrets Operator](https://external-secrets.io/)
+
+**Tools:**
+* 🔧 [ArgoCD](https://argoproj.github.io/cd/)
+* 🔧 [Flux](https://fluxcd.io/)
+* 🔧 [Kustomize](https://kustomize.io/)
+
+**Books:**
+* 📕 *GitOps and Kubernetes* by Billy Yuen, et al.
+* 📕 *Continuous Delivery* by Jez Humble & David Farley
diff --git a/lectures/lec14.md b/lectures/lec14.md
new file mode 100644
index 0000000000..9ca7297ccd
--- /dev/null
+++ b/lectures/lec14.md
@@ -0,0 +1,825 @@
+# 📌 Lecture 14 — Progressive Delivery: Deploying with Confidence
+
+> 🎯 **From risky big-bang deployments to controlled, observable releases**
+
+---
+
+## 📍 Slide 1 – 🚀 Welcome to Progressive Delivery
+
+GitOps solved **how** we deploy. But what happens **when things go wrong**?
+
+* 💥 **Traditional deploy:** 100% traffic instantly → all users affected
+* 🐤 **Canary:** 5% traffic first → catch issues early
+* 🔵 **Blue-green:** Switch traffic instantly → easy rollback
+
+```mermaid
+flowchart LR
+  A[😰 Big Bang] --> B[🎲 Hope it works]
+  C[🐤 Canary] --> D[📊 Observe]
+  D --> E[✅ Promote or ↩️ Rollback]
+```
+
+> 🎯 **Goal:** Deploy changes safely with automated analysis and rollback
+
+---
+
+## 📍 Slide 2 – 📚 Learning Outcomes
+
+By the end of this lecture, you will:
+
+| # | 🎯 Outcome |
+|---|-----------|
+| 1 | ✅ Understand **progressive delivery** concepts and benefits |
+| 2 | ✅ Implement **canary deployments** with Argo Rollouts |
+| 3 | ✅ Configure **blue-green deployments** for instant rollback |
+| 4 | ✅ Set up **automated analysis** with metrics |
+| 5 | ✅ Design **traffic management** strategies |
+| 6 | ✅ Handle **rollback scenarios** gracefully |
+
+---
+
+## 📍 Slide 3 – 🗺️ Lecture Overview
+
+```
+┌─────────────────────────────────────────────────────────────┐
+│  SECTION 0: Introduction                    (Slides 1-4)   │
+├─────────────────────────────────────────────────────────────┤
+│  📝 PRE QUIZ                                (Slide 5)      │
+├─────────────────────────────────────────────────────────────┤
+│  SECTION 1: The Deployment Risk Problem     (Slides 6-10)  │
+├─────────────────────────────────────────────────────────────┤
+│  SECTION 2: Progressive Delivery Concepts   (Slides 11-15) │
+├─────────────────────────────────────────────────────────────┤
+│  SECTION 3: Argo Rollouts in Action         (Slides 16-24) │
+├─────────────────────────────────────────────────────────────┤
+│  📝 MID QUIZ                                (Slide 25)     │
+├─────────────────────────────────────────────────────────────┤
+│  SECTION 4: Advanced Strategies             (Slides 26-32) │
+├─────────────────────────────────────────────────────────────┤
+│  SECTION 5: Production Patterns             (Slides 33-37) │
+├─────────────────────────────────────────────────────────────┤
+│  📝 POST QUIZ                               (Slide 38)     │
+├─────────────────────────────────────────────────────────────┤
+│  FINAL: What's Next                         (Slide 39)     │
+└─────────────────────────────────────────────────────────────┘
+```
+
+---
+
+## 📍 Slide 4 – 🤔 The Big Question
+
+> 💬 *"We don't want to move fast and break things. We want to move fast and fix things."*
+> — Facebook (ironically, after many outages)
+
+**Consider this:**
+
+* 🚀 You deploy a new feature at **5 PM Friday**
+* 💥 It has a subtle bug affecting **10% of requests**
+* ⏰ By the time you notice: **100,000 users affected**
+* 😱 Rollback takes **15 minutes** of downtime
+
+> 🤔 **Think:** What if you could test with 1% of users first?
+
+---
+
+## 📍 Slide 5 – 📝 QUIZ — DEVOPS_L14_PRE
+
+---
+
+## 📍 Slide 6 – ⚠️ Section 1: The Deployment Risk Problem
+
+**Traditional "Big Bang" Deployment:**
+
+```mermaid
+flowchart TD
+  A[📦 v1 Running] --> B[🚀 Deploy v2]
+  B --> C[⚡ 100% Traffic to v2]
+  C --> D{Works?}
+  D --> |Yes| E[✅ Success]
+  D --> |No| F[💀 100% Users Affected]
+  F --> G[😱 Emergency Rollback]
+```
+
+* ⚡ **All-or-nothing:** No gradual validation
+* 😱 **High blast radius:** Everyone affected immediately
+* ⏱️ **Slow detection:** Issues found in production
+
+---
+
+## 📍 Slide 7 – 🔥 Pain Point 1: Silent Failures
+
+**Scenario:** Memory leak that only triggers under load
+
+```mermaid
+flowchart LR
+  A[🧪 Tests Pass] --> B[🎭 Staging OK]
+  B --> C[🏭 Deploy to Prod]
+  C --> D[📈 Real Traffic]
+  D --> E[💥 OOM after 2 hours]
+```
+
+* 🧪 **Tests pass** — synthetic load is different
+* 🎭 **Staging works** — not enough traffic to trigger
+* 🏭 **Production crashes** — after hours of operation
+
+**Real impact:**
+* 😱 Facebook 2021: 6-hour outage from config change
+* 💰 Estimated loss: $100 million
+
+---
+
+## 📍 Slide 8 – 🔥 Pain Point 2: Slow Rollback
+
+**Traditional rollback process:**
+
+| ⏱️ Step | 📝 Action | ⌛ Time |
+|---------|----------|--------|
+| 1 | Detect the issue | 10 min |
+| 2 | Confirm it's the deploy | 5 min |
+| 3 | Find previous version | 2 min |
+| 4 | Rebuild/redeploy | 10 min |
+| 5 | Verify rollback | 5 min |
+| **Total** | **Downtime** | **32+ min** |
+
+* 🐌 **Slow detection:** Monitoring lag
+* 🤔 **Decision paralysis:** "Is it really the deploy?"
+* 🔧 **Manual process:** Error-prone under pressure
+
+---
+
+## 📍 Slide 9 – 🔥 Pain Point 3: No Gradual Validation
+
+**What we want:**
+
+```
+Deploy → Observe → Decide → Promote/Rollback
+```
+
+**What we get:**
+
+```
+Deploy → 🙏 Hope → React when broken
+```
+
+* 📊 **No metrics integration** — can't auto-decide
+* 👨‍💻 **Human in the loop** — for every deploy
+* 🎲 **Risk acceptance** — every release is a gamble
+
+---
+
+## 📍 Slide 10 – 💰 The Cost of Bad Deployments
+
+| 🔥 Problem | 💥 Impact | 📊 Industry Data |
+|-----------|----------|------------------|
+| Failed deployments | Service degradation | 46% experience monthly failures |
+| Slow rollback | Extended outages | Avg 30 min to rollback |
+| No canary testing | Full user impact | 100% blast radius |
+| Manual promotion | Human error | 70% of incidents |
+
+**DORA metrics show:**
+* 🏆 **Elite teams:** Deploy multiple times per day with <1% failure rate
+* 😰 **Low performers:** Monthly deploys with 15%+ failure rate
+
+---
+
+## 📍 Slide 11 – ✅ Section 2: Progressive Delivery Concepts
+
+**What is Progressive Delivery?**
+
+* 🐤 **Gradual rollout:** Incrementally shift traffic
+* 📊 **Observability:** Measure success at each step
+* 🤖 **Automation:** Promote or rollback based on metrics
+* 🎯 **Targeted:** Control which users see changes
+
+```mermaid
+flowchart LR
+  A[📦 v2] --> |5%| B[🎯 Test]
+  B --> |Metrics OK| C[25%]
+  C --> |Metrics OK| D[50%]
+  D --> |Metrics OK| E[100%]
+
+  B --> |Metrics Bad| F[↩️ Rollback]
+```
+
+---
+
+## 📍 Slide 12 – 🚫 Progressive Delivery: What It's NOT
+
+| 🚫 Myth | ✅ Reality |
+|---------|----------|
+| Just slow deployments | Strategic, metrics-driven progression |
+| Replaces testing | Complements testing with real traffic |
+| Only for big companies | Available via Argo Rollouts, Flagger |
+| Complicated to implement | Start simple, add automation gradually |
+
+> 🔥 **Hot take:** "If you're not doing progressive delivery, you're gambling with every deploy."
+
+**Progressive Delivery is:**
+* 🎯 **Risk reduction** — smaller blast radius
+* 📊 **Data-driven** — metrics decide promotion
+* 🔄 **Continuous** — part of the deployment pipeline
+
+---
+
+## 📍 Slide 13 – 🐤 Canary Deployments Explained
+
+**Named after "canary in a coal mine"** — early warning system
+
+```mermaid
+flowchart TD
+  subgraph Production
+    A[📦 v1 - 95%] --> C[🌐 Users]
+    B[📦 v2 - 5%] --> C
+  end
+
+  D[📊 Metrics] --> E{Healthy?}
+  E --> |Yes| F[📦 v2 - 100%]
+  E --> |No| G[↩️ v1 - 100%]
+```
+
+**How it works:**
+1. 🚀 Deploy new version alongside old
+2. 🎯 Route small % of traffic to new
+3. 📊 Compare metrics (errors, latency)
+4. ✅ Gradually increase or ↩️ rollback
+
+---
+
+## 📍 Slide 14 – 🔵 Blue-Green Deployments Explained
+
+**Two identical environments, instant switchover**
+
+```mermaid
+flowchart LR
+  subgraph Before
+    A[🔵 Blue v1] --> |100%| C[🌐 Traffic]
+    B[🟢 Green v2] --> |0%| C
+  end
+
+  subgraph After Switch
+    D[🔵 Blue v1] --> |0%| F[🌐 Traffic]
+    E[🟢 Green v2] --> |100%| F
+  end
+```
+
+**Characteristics:**
+* ⚡ **Instant switch:** Traffic moves all at once
+* ↩️ **Fast rollback:** Switch back to blue
+* 💰 **Resource cost:** Double infrastructure during deploy
+* 🎯 **Use case:** Database migrations, breaking changes
+
+---
+
+## 📍 Slide 15 – 📊 Canary vs Blue-Green
+
+| 📋 Aspect | 🐤 Canary | 🔵 Blue-Green |
+|----------|----------|---------------|
+| Traffic shift | Gradual (5% → 25% → 100%) | Instant (0% → 100%) |
+| Rollback speed | Instant | Instant |
+| Resource usage | Minimal overhead | Double during deploy |
+| Risk exposure | Minimal (small %) | Full (100% at switch) |
+| Complexity | Higher (traffic splitting) | Lower (simple switch) |
+| Best for | Most deployments | Major version changes |
+
+> 🤔 **Think:** Which strategy would you use for a database schema change?
+
+---
+
+## 📍 Slide 16 – 🎮 Section 3: Argo Rollouts in Action
+
+**What is Argo Rollouts?**
+
+* 🔄 Kubernetes controller for progressive delivery
+* 📦 Replaces standard Deployment resource
+* 🎯 Supports canary, blue-green, and more
+* 📊 Integrates with metrics providers
+
+```mermaid
+flowchart TD
+  A[📝 Rollout Resource] --> B[🤖 Argo Rollouts Controller]
+  B --> C[📦 ReplicaSets]
+  C --> D[☸️ Pods]
+  E[📊 Prometheus] --> B
+  B --> F[🎯 Traffic Management]
+```
+
+---
+
+## 📍 Slide 17 – 💥 Scenario 1: First Canary Rollout
+
+**Basic canary configuration:**
+
+```yaml
+apiVersion: argoproj.io/v1alpha1
+kind: Rollout
+metadata:
+  name: my-app
+spec:
+  replicas: 10
+  strategy:
+    canary:
+      steps:
+        - setWeight: 20
+        - pause: {duration: 5m}
+        - setWeight: 50
+        - pause: {duration: 5m}
+        - setWeight: 100
+  selector:
+    matchLabels:
+      app: my-app
+  template:
+    # Pod template (same as Deployment)
+```
+
+```mermaid
+flowchart LR
+  A[0%] --> |Step 1| B[20%]
+  B --> |5min pause| C[50%]
+  C --> |5min pause| D[100%]
+```
+
+---
+
+## 📍 Slide 18 – ✅ Solution 1: Traffic Progression
+
+**What happens during canary:**
+
+| 🕐 Time | 📦 Stable | 🐤 Canary | 📊 Status |
+|---------|----------|----------|-----------|
+| T+0 | 100% | 0% | Rollout started |
+| T+1 | 80% | 20% | setWeight: 20 |
+| T+6 | 50% | 50% | pause completed |
+| T+11 | 0% | 100% | Full promotion |
+
+**Rollout states:**
+* 🔄 **Progressing:** Moving through steps
+* ⏸️ **Paused:** Waiting (manual or timed)
+* ✅ **Healthy:** Rollout complete
+* 💥 **Degraded:** Issues detected
+
+---
+
+## 📍 Slide 19 – 💥 Scenario 2: Blue-Green with Argo Rollouts
+
+**Blue-green configuration:**
+
+```yaml
+apiVersion: argoproj.io/v1alpha1
+kind: Rollout
+metadata:
+  name: my-app
+spec:
+  replicas: 5
+  strategy:
+    blueGreen:
+      activeService: my-app-active
+      previewService: my-app-preview
+      autoPromotionEnabled: false  # Manual promotion
+      scaleDownDelaySeconds: 30
+  selector:
+    matchLabels:
+      app: my-app
+```
+
+```mermaid
+flowchart TD
+  A[🔵 Active Service] --> B[📦 Stable Pods]
+  C[🟢 Preview Service] --> D[📦 New Pods]
+  E[👨‍💻 QA] --> C
+  F[🌐 Users] --> A
+```
+
+---
+
+## 📍 Slide 20 – ✅ Solution 2: Preview and Promote
+
+**Blue-green workflow:**
+
+1. 🚀 **Deploy:** New pods created, preview service points to them
+2. 🧪 **Test:** QA validates via preview service
+3. ✅ **Promote:** Traffic switches to new pods
+4. 🗑️ **Cleanup:** Old pods scaled down after delay
+
+**Commands:**
+```bash
+# Check rollout status
+kubectl argo rollouts get rollout my-app
+
+# Promote preview to active
+kubectl argo rollouts promote my-app
+
+# Abort and rollback
+kubectl argo rollouts abort my-app
+```
+
+---
+
+## 📍 Slide 21 – 💥 Scenario 3: Automated Analysis
+
+**Problem:** Manual observation doesn't scale
+
+```mermaid
+flowchart TD
+  A[🐤 Canary] --> B[📊 Metrics]
+  B --> C{Error rate < 1%?}
+  C --> |Yes| D{Latency < 500ms?}
+  D --> |Yes| E[✅ Promote]
+  C --> |No| F[↩️ Rollback]
+  D --> |No| F
+```
+
+**Solution:** AnalysisTemplate
+
+```yaml
+apiVersion: argoproj.io/v1alpha1
+kind: AnalysisTemplate
+metadata:
+  name: success-rate
+spec:
+  metrics:
+    - name: success-rate
+      interval: 1m
+      successCondition: result[0] >= 0.99
+      provider:
+        prometheus:
+          query: |
+            sum(rate(http_requests_total{status=~"2.*"}[5m])) /
+            sum(rate(http_requests_total[5m]))
+```
+
+---
+
+## 📍 Slide 22 – ✅ Solution 3: Analysis Integration
+
+**Connecting analysis to rollout:**
+
+```yaml
+strategy:
+  canary:
+    steps:
+      - setWeight: 20
+      - analysis:
+          templates:
+            - templateName: success-rate
+          args:
+            - name: service-name
+              value: my-app
+      - setWeight: 50
+      - analysis:
+          templates:
+            - templateName: success-rate
+      - setWeight: 100
+```
+
+**Analysis outcomes:**
+* ✅ **Successful:** All metrics pass → continue
+* ❌ **Failed:** Metric fails → automatic rollback
+* ⚠️ **Inconclusive:** Not enough data → pause
+
+---
+
+## 📍 Slide 23 – 💥 Scenario 4: Traffic Management
+
+**Problem:** Need fine-grained traffic control
+
+**Solutions:**
+
+| 🛠️ Traffic Manager | 📝 Description |
+|-------------------|---------------|
+| **Nginx Ingress** | Canary annotations |
+| **Istio** | VirtualService routing |
+| **AWS ALB** | Target group weights |
+| **Traefik** | TraefikService |
+
+```yaml
+# With Istio
+strategy:
+  canary:
+    trafficRouting:
+      istio:
+        virtualService:
+          name: my-app-vsvc
+        destinationRule:
+          name: my-app-destrule
+          canarySubsetName: canary
+          stableSubsetName: stable
+```
+
+---
+
+## 📍 Slide 24 – ✅ Solution 4: Nginx Ingress Canary
+
+**Simple traffic splitting with Nginx:**
+
+```yaml
+strategy:
+  canary:
+    canaryService: my-app-canary
+    stableService: my-app-stable
+    trafficRouting:
+      nginx:
+        stableIngress: my-app-ingress
+```
+
+**How it works:**
+* 🔧 Argo Rollouts creates canary ingress
+* 📊 Sets `nginx.ingress.kubernetes.io/canary-weight`
+* 🔄 Updates weight as rollout progresses
+
+---
+
+## 📍 Slide 25 – 📝 QUIZ — DEVOPS_L14_MID
+
+---
+
+## 📍 Slide 26 – 🔧 Section 4: Advanced Strategies
+
+**Experiment: A/B Testing**
+
+```yaml
+apiVersion: argoproj.io/v1alpha1
+kind: Experiment
+metadata:
+  name: ab-test
+spec:
+  duration: 1h
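+  # NOTE: `specRef` is shorthand from a Rollout's inline `experiment` step;
+  # a standalone Experiment must define `selector` and `template` per entry.
+  templates: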
+    - name: baseline
+      specRef: stable
+      replicas: 1
+    - name: canary
+      specRef: canary
+      replicas: 1
+  analyses:
+    - name: compare-versions
+      templateName: compare-metrics
+```
+
+**Use cases:**
+* 🧪 **Feature testing:** Compare feature A vs B
+* 📊 **Performance testing:** Baseline vs optimized
+* 🎯 **User experience:** Different UIs
+
+---
+
+## 📍 Slide 27 – 📊 Metrics for Analysis
+
+**Common metrics to analyze:**
+
+| 📊 Metric | 📝 What it Measures | ⚠️ Threshold |
+|----------|-------------------|-------------|
+| Error rate | % of failed requests | < 1% |
+| Latency P99 | Slowest 1% of requests | < 500ms |
+| Saturation | Resource utilization | < 80% |
+| Success rate | % of successful operations | > 99% |
+
+**Prometheus queries:**
+```promql
+# Error rate
+sum(rate(http_requests_total{status=~"5.*"}[5m])) /
+sum(rate(http_requests_total[5m]))
+
+# P99 latency
+histogram_quantile(0.99, rate(http_duration_seconds_bucket[5m]))
+```
+
+---
+
+## 📍 Slide 28 – 🔄 Rollback Strategies
+
+**Automatic rollback triggers:**
+
+```yaml
+strategy:
+  canary:
+    steps:
+      - setWeight: 20
+      - analysis:
+          templates:
+            - templateName: error-rate
+    # If analysis fails, automatic rollback
+```
+
+**Manual rollback:**
+```bash
+# Abort current rollout
+kubectl argo rollouts abort my-app
+
+# Undo to previous version
+kubectl argo rollouts undo my-app
+
+# Retry after fix
+kubectl argo rollouts retry rollout my-app
+```
+
+```mermaid
+flowchart TD
+  A[💥 Analysis Failed] --> B[🤖 Auto Rollback]
+  B --> C[📦 Scale down canary]
+  C --> D[🔄 Restore stable]
+  D --> E[✅ Service restored]
+```
+
+---
+
+## 📍 Slide 29 – ⏸️ Pause and Resume
+
+**Manual gates in rollout:**
+
+```yaml
+steps:
+  - setWeight: 20
+  - pause: {}  # Manual pause - requires promotion
+  - setWeight: 50
+  - pause: {duration: 10m}  # Timed pause
+  - setWeight: 100
+```
+
+**Commands:**
+```bash
+# Resume paused rollout
+kubectl argo rollouts promote my-app
+
+# Skip all remaining steps
+kubectl argo rollouts promote my-app --full
+```
+
+**Use cases:**
+* 👀 **Manual verification** before wider rollout
+* 🕐 **Business hours** — pause overnight
+* 🧪 **QA sign-off** required
+
+---
+
+## 📍 Slide 30 – 🔗 ArgoCD + Argo Rollouts
+
+**GitOps + Progressive Delivery:**
+
+```mermaid
+flowchart TD
+  A[📝 Git Push] --> B[🤖 ArgoCD]
+  B --> |Sync| C[📦 Rollout Resource]
+  C --> D[🤖 Argo Rollouts Controller]
+  D --> E[🐤 Canary Progression]
+  E --> F[📊 Analysis]
+  F --> |Pass| G[✅ Promoted]
+  F --> |Fail| H[↩️ Rollback]
+```
+
+**Benefits:**
+* 📝 **Declarative:** Rollout strategy in Git
+* 🔄 **Automated:** ArgoCD syncs, Rollouts executes
+* 🔍 **Observable:** Both tools have UIs
+
+---
+
+## 📍 Slide 31 – 📊 Dashboard and Visualization
+
+**Argo Rollouts Dashboard:**
+
+```bash
+# Start the dashboard locally (kubectl plugin command)
+kubectl argo rollouts dashboard
+
+# Access at localhost:3100
+```
+
+**Features:**
+* 📊 **Real-time status:** See rollout progression
+* 🎛️ **Controls:** Promote, abort, retry
+* 📈 **History:** Past rollouts and outcomes
+* 🔗 **Integration:** Links to metrics
+
+---
+
+## 📍 Slide 32 – 🎯 Best Practices
+
+| 📋 Practice | 📝 Why |
+|------------|--------|
+| Start with simple canary | Learn before adding complexity |
+| Always have analysis | Don't rely only on time-based |
+| Set appropriate thresholds | Too strict = never promotes |
+| Monitor canary metrics | Catch issues before promotion |
+| Test rollback procedure | Know it works before you need it |
+| Use GitOps | Keep strategy in version control |
+
+---
+
+## 📍 Slide 33 – 🏭 Section 5: Production Patterns
+
+**Netflix Progressive Delivery:**
+
+```mermaid
+flowchart LR
+  A[📦 v2] --> B[🎯 Internal 1%]
+  B --> C[🌍 One Region 5%]
+  C --> D[🌍 All Regions 25%]
+  D --> E[🚀 Full 100%]
+```
+
+**Their learnings:**
+* 🎯 **Internal first:** Employees as first canaries
+* 🌍 **Regional:** Test in one region before global
+* 📊 **Metrics-driven:** Automated promotion
+* 🐌 **Patience:** Days, not minutes
+
+---
+
+## 📍 Slide 34 – 🔧 Anti-Patterns to Avoid
+
+| ❌ Anti-Pattern | ✅ Better Approach |
+|----------------|-------------------|
+| Canary with no metrics | Add analysis, even basic |
+| Too fast progression | Allow time for issues to surface |
+| Ignoring saturation | Include resource metrics |
+| Manual-only promotion | Automate with analysis |
+| Skipping canary in staging | Test progressive delivery in staging |
+
+---
+
+## 📍 Slide 35 – 📈 Measuring Success
+
+**DORA metrics with progressive delivery:**
+
+| 📊 Metric | 😰 Before | 🚀 After |
+|----------|----------|---------|
+| Deployment frequency | Weekly | Multiple/day |
+| Change failure rate | 15% | < 1% |
+| MTTR | 30 min | 2 min |
+| Lead time | Days | Hours |
+
+**Why improvement:**
+* 🐤 **Catch issues early** — smaller blast radius
+* ↩️ **Fast rollback** — seconds, not minutes
+* 📊 **Data-driven** — objective decisions
+* 🔄 **Confidence** — deploy more often
+
+---
+
+## 📍 Slide 36 – 🎯 Key Takeaways
+
+1. 🐤 **Canary deployments** test with small traffic before full rollout
+2. 🔵 **Blue-green** enables instant rollback via traffic switch
+3. 📊 **Automated analysis** removes human guesswork
+4. 🎯 **Argo Rollouts** makes progressive delivery accessible
+5. 🔗 **GitOps integration** keeps strategy declarative
+6. ↩️ **Fast rollback** is as important as deployment
+
+> 💬 *"Deploy frequently, observe constantly, rollback automatically."*
+
+---
+
+## 📍 Slide 37 – 🧠 Mindset Shift
+
+| 😰 Old Mindset | 🚀 New Mindset |
+|---------------|----------------|
+| "Let's hope it works" | "Let's measure and know" |
+| "Deploy and pray" | "Deploy, observe, decide" |
+| "Rollback is failure" | "Rollback is success" |
+| "Testing is enough" | "Testing + production validation" |
+| "Deploy once a week (safe)" | "Deploy often (safer)" |
+| "100% or nothing" | "Progressive and controlled" |
+
+> 🤔 **Question:** Which deployment approach does your team use today?
+
+---
+
+## 📍 Slide 38 – 📝 QUIZ — DEVOPS_L14_POST
+
+---
+
+## 📍 Slide 39 – 🚀 What's Next?
+
+**Coming up: Lecture 15 — Stateful Applications & Observability**
+
+```mermaid
+flowchart LR
+  A[📦 Deployment] --> B[🗄️ StatefulSet]
+  B --> C[💾 Persistent Storage]
+  C --> D[📊 Monitoring]
+```
+
+* 🗄️ **StatefulSets:** Managing stateful applications
+* 💾 **Persistent storage:** Beyond ephemeral pods
+* 📊 **Observability:** Prometheus, Grafana
+* 🔍 **Alerting:** Know before users complain
+
+> 🎯 **Lab 14:** Implement canary deployments with Argo Rollouts!
+
+---
+
+## 📚 Resources
+
+**Documentation:**
+* 📖 [Argo Rollouts Docs](https://argoproj.github.io/argo-rollouts/)
+* 📖 [Progressive Delivery](https://www.weave.works/blog/progressive-delivery)
+* 📖 [Canary Deployments](https://martinfowler.com/bliki/CanaryRelease.html)
+
+**Tools:**
+* 🔧 [Argo Rollouts](https://argoproj.github.io/argo-rollouts/)
+* 🔧 [Flagger](https://flagger.app/)
+* 🔧 [Istio](https://istio.io/)
+
+**Books:**
+* 📕 *Accelerate* by Nicole Forsgren, Jez Humble, Gene Kim
+* 📕 *Continuous Delivery* by Jez Humble & David Farley
diff --git a/lectures/lec15.md b/lectures/lec15.md
new file mode 100644
index 0000000000..eb828de609
--- /dev/null
+++ b/lectures/lec15.md
@@ -0,0 +1,821 @@
+# 📌 Lecture 15 — Stateful Applications & Observability: The Complete Picture
+
+> 🎯 **From stateless simplicity to production-ready stateful workloads with full observability**
+
+---
+
+## 📍 Slide 1 – 🚀 The Final Pieces of Production Kubernetes
+
+We've deployed applications, managed configs, and implemented GitOps. Two challenges remain:
+
+* 🗄️ **Stateful apps:** Databases, message queues, caches — they need identity and stable storage
+* 📊 **Observability:** If you can't see it, you can't fix it
+
+```mermaid
+flowchart LR
+  A[📦 Stateless Apps] --> B[🗄️ StatefulSets]
+  B --> C[📊 Monitoring]
+  C --> D[🔔 Alerting]
+  D --> E[💎 Production Ready]
+```
+
+> 🎯 **Goal:** Master stateful workloads and comprehensive cluster observability
+
+---
+
+## 📍 Slide 2 – 📚 Learning Outcomes
+
+By the end of this lecture, you will:
+
+| # | 🎯 Outcome |
+|---|-----------|
+| 1 | ✅ Understand when to use **StatefulSets** vs Deployments |
+| 2 | ✅ Implement **headless services** for pod discovery |
+| 3 | ✅ Configure **VolumeClaimTemplates** for per-pod storage |
+| 4 | ✅ Deploy **Prometheus** for metrics collection |
+| 5 | ✅ Create **Grafana dashboards** for visualization |
+| 6 | ✅ Set up **alerting** for proactive incident response |
+
+---
+
+## 📍 Slide 3 – 🗺️ Lecture Overview
+
+```
+┌─────────────────────────────────────────────────────────────┐
+│  SECTION 0: Introduction                    (Slides 1-4)   │
+├─────────────────────────────────────────────────────────────┤
+│  📝 PRE QUIZ                                (Slide 5)      │
+├─────────────────────────────────────────────────────────────┤
+│  SECTION 1: Stateful Workload Challenges    (Slides 6-10)  │
+├─────────────────────────────────────────────────────────────┤
+│  SECTION 2: StatefulSets Deep Dive          (Slides 11-18) │
+├─────────────────────────────────────────────────────────────┤
+│  📝 MID QUIZ                                (Slide 19)     │
+├─────────────────────────────────────────────────────────────┤
+│  SECTION 3: Observability Fundamentals      (Slides 20-28) │
+├─────────────────────────────────────────────────────────────┤
+│  SECTION 4: Production Monitoring           (Slides 29-36) │
+├─────────────────────────────────────────────────────────────┤
+│  📝 POST QUIZ                               (Slide 37)     │
+├─────────────────────────────────────────────────────────────┤
+│  FINAL: What's Next                         (Slide 38)     │
+└─────────────────────────────────────────────────────────────┘
+```
+
+---
+
+## 📍 Slide 4 – 🤔 The Big Question
+
+> 💬 *"You can't manage what you can't measure."*
+> — Peter Drucker
+
+**Consider these scenarios:**
+
+* 🗄️ **Database cluster:** Pods need stable identity for replication
+* 📊 **3 AM alert:** Is the app slow, or is it the database?
+* 🔍 **Debugging:** "What changed in the last hour?"
+* 🔮 **Capacity planning:** "Will we run out of storage next month?"
+
+> 🤔 **Think:** How do you know your system is healthy right now?
+
+---
+
+## 📍 Slide 5 – 📝 QUIZ — DEVOPS_L15_PRE
+
+---
+
+## 📍 Slide 6 – ⚠️ Section 1: Why Stateless Isn't Always Enough
+
+**Deployments (Stateless) characteristics:**
+
+```mermaid
+flowchart TD
+  A[📦 Deployment] --> B[📦 Pod-abc123]
+  A --> C[📦 Pod-def456]
+  A --> D[📦 Pod-ghi789]
+
+  E[Pods are interchangeable]
+  F[Random names]
+  G[Any pod can be replaced]
+```
+
+* ✅ **Great for:** Web servers, API services, workers
+* ❌ **Problem for:** Databases, message queues, distributed systems
+
+---
+
+## 📍 Slide 7 – 🔥 Pain Point 1: Pod Identity
+
+**Stateful apps need stable identity:**
+
+| 🗄️ Application | 🔑 Why Identity Matters |
+|---------------|------------------------|
+| **PostgreSQL** | Primary/replica must know who is who |
+| **MongoDB** | Replica set members have specific roles |
+| **Kafka** | Brokers identified by stable IDs |
+| **Redis Cluster** | Nodes need persistent slots |
+| **Elasticsearch** | Nodes join cluster by name |
+
+**With Deployment:**
+```
+pod-abc123 → restarts → pod-xyz789 (new name!)
+```
+
+**The problem:** Other pods can't find it anymore
+
+---
+
+## 📍 Slide 8 – 🔥 Pain Point 2: Storage Persistence
+
+**Scenario:** 3-node MongoDB replica set
+
+```mermaid
+flowchart TD
+  A[📦 Deployment] --> B[📦 Pod 1]
+  A --> C[📦 Pod 2]
+  A --> D[📦 Pod 3]
+
+  E[💾 Shared PVC] --> B
+  E --> C
+  E --> D
+
+  F[😱 Problem: All pods fighting for same storage!]
+```
+
+**What we need:**
+* 📦 Pod 1 → 💾 Volume 1 (its own data)
+* 📦 Pod 2 → 💾 Volume 2 (its own data)
+* 📦 Pod 3 → 💾 Volume 3 (its own data)
+
+---
+
+## 📍 Slide 9 – 🔥 Pain Point 3: Ordered Operations
+
+**Database cluster startup order matters:**
+
+```mermaid
+flowchart LR
+  A[🥇 Primary starts] --> B[🥈 Replica 1 joins]
+  B --> C[🥉 Replica 2 joins]
+```
+
+**Deployment behavior:** All pods start simultaneously
+* 😱 Race condition: Who is primary?
+* 💥 Data corruption risk
+
+**Shutdown order matters too:**
+* 🥉 Replicas drain first
+* 🥇 Primary shuts down last
+
+---
+
+## 📍 Slide 10 – 📊 Deployment vs StatefulSet
+
+| 📋 Aspect | 📦 Deployment | 🗄️ StatefulSet |
+|----------|--------------|----------------|
+| Pod names | Random suffix | Stable ordinal (app-0, app-1) |
+| Storage | Shared or none | Per-pod PVCs |
+| Scaling | Parallel | Sequential |
+| Updates | Rolling (parallel) | Rolling (sequential) |
+| Network identity | Via Service | Stable DNS per pod |
+| Use case | Stateless apps | Stateful apps |
+
+---
+
+## 📍 Slide 11 – ✅ Section 2: StatefulSets to the Rescue
+
+**StatefulSet provides:**
+
+```mermaid
+flowchart TD
+  A[🗄️ StatefulSet] --> B[📦 app-0]
+  A --> C[📦 app-1]
+  A --> D[📦 app-2]
+
+  B --> E[💾 data-app-0]
+  C --> F[💾 data-app-1]
+  D --> G[💾 data-app-2]
+
+  H[🌐 Headless Service] --> B
+  H --> C
+  H --> D
+```
+
+* 🔢 **Stable, unique network IDs:** `app-0`, `app-1`, `app-2`
+* 💾 **Stable, persistent storage:** Each pod gets its own PVC
+* 📊 **Ordered deployment:** `app-0` first, then `app-1`, then `app-2`
+* 🔄 **Ordered termination:** Reverse order
+
+---
+
+## 📍 Slide 12 – 🌐 Headless Services Explained
+
+**Regular Service vs Headless Service:**
+
+```yaml
+# Regular Service - Load balances
+apiVersion: v1
+kind: Service
+metadata:
+  name: my-app
+spec:
+  clusterIP: 10.0.0.100  # Gets an IP
+  ports:
+    - port: 80
+---
+# Headless Service - Direct pod access
+apiVersion: v1
+kind: Service
+metadata:
+  name: my-app-headless
+spec:
+  clusterIP: None  # No IP assigned!
+  ports:
+    - port: 80
+```
+
+**DNS resolution:**
+* **Regular:** `my-app.namespace.svc` → `10.0.0.100`
+* **Headless:** `my-app-headless.namespace.svc` → `10.1.2.3, 10.1.2.4, 10.1.2.5` (all pod IPs)
+
+---
+
+## 📍 Slide 13 – 🔗 Pod DNS in StatefulSets
+
+**Each pod gets a stable DNS name:**
+
+```
+<pod-name>.<service-name>.<namespace>.svc.cluster.local
+```
+
+**Example with MongoDB:**
+```
+mongodb-0.mongodb-headless.default.svc.cluster.local
+mongodb-1.mongodb-headless.default.svc.cluster.local
+mongodb-2.mongodb-headless.default.svc.cluster.local
+```
+
+```mermaid
+flowchart LR
+  A[🔍 DNS Query: mongodb-0.mongodb-headless] --> B[📦 mongodb-0]
+  C[🔍 DNS Query: mongodb-1.mongodb-headless] --> D[📦 mongodb-1]
+```
+
+* ✅ Other apps can connect to specific pods
+* ✅ Pods can discover each other by name
+* ✅ Names stay the same even after restart
+
+---
+
+## 📍 Slide 14 – 💾 VolumeClaimTemplates
+
+**Automatic PVC creation per pod:**
+
+```yaml
+apiVersion: apps/v1
+kind: StatefulSet
+metadata:
+  name: mongodb
+spec:
+  serviceName: mongodb-headless
+  replicas: 3
+  volumeClaimTemplates:
+    - metadata:
+        name: data
+      spec:
+        accessModes: ["ReadWriteOnce"]
+        storageClassName: standard
+        resources:
+          requests:
+            storage: 10Gi
+```
+
+**Result:**
+```
+PVC: data-mongodb-0 → bound to mongodb-0
+PVC: data-mongodb-1 → bound to mongodb-1
+PVC: data-mongodb-2 → bound to mongodb-2
+```
+
+---
+
+## 📍 Slide 15 – 🔄 Scaling Behavior
+
+**Scale up (sequential):**
+```mermaid
+flowchart LR
+  A[app-0 ready] --> B[app-1 starts]
+  B --> C[app-1 ready]
+  C --> D[app-2 starts]
+```
+
+**Scale down (reverse order):**
+```mermaid
+flowchart LR
+  A[app-2 terminates] --> B[app-2 gone]
+  B --> C[app-1 terminates]
+  C --> D[app-1 gone]
+```
+
+**Key points:**
+* 🔄 Next pod only starts when previous is **Ready**
+* 🗑️ Scaling down starts from highest ordinal
+* 💾 PVCs are **NOT deleted** on scale down (data preserved)
+
+---
+
+## 📍 Slide 16 – 🔄 Update Strategies
+
+**RollingUpdate (default):**
+```yaml
+spec:
+  updateStrategy:
+    type: RollingUpdate
+    rollingUpdate:
+      partition: 0  # Update all pods
+```
+
+**Partition for canary:**
+```yaml
+rollingUpdate:
+  partition: 2  # Only update pods >= 2
+```
+
+```mermaid
+flowchart LR
+  A[app-0: v1] --> B[app-1: v1]
+  B --> C[app-2: v2 - canary]
+```
+
+* ✅ Test new version on highest ordinal first
+* ✅ Gradually lower partition to update more pods
+
+---
+
+## 📍 Slide 17 – 🗄️ Complete StatefulSet Example
+
+```yaml
+apiVersion: apps/v1
+kind: StatefulSet
+metadata:
+  name: mongodb
+spec:
+  selector:
+    matchLabels:
+      app: mongodb
+  serviceName: mongodb-headless
+  replicas: 3
+  template:
+    metadata:
+      labels:
+        app: mongodb
+    spec:
+      containers:
+        - name: mongodb
+          image: mongo:7
+          ports:
+            - containerPort: 27017
+          volumeMounts:
+            - name: data
+              mountPath: /data/db
+  volumeClaimTemplates:
+    - metadata:
+        name: data
+      spec:
+        accessModes: ["ReadWriteOnce"]
+        resources:
+          requests:
+            storage: 10Gi
+```
+
+---
+
+## 📍 Slide 18 – ⚠️ StatefulSet Gotchas
+
+| ⚠️ Gotcha | 📝 Solution |
+|----------|------------|
+| PVCs not deleted on scale down | Manual deletion if needed |
+| Pod stuck in Pending | Check PVC binding, storage class |
+| Headless service required | Must create before StatefulSet |
+| Slow scaling | Set `podManagementPolicy: Parallel` |
+| Data loss on PVC deletion | Use a StorageClass with `reclaimPolicy: Retain` |
+
+**Important:** StatefulSets are **more complex** than Deployments. Use only when needed!
+
+---
+
+## 📍 Slide 19 – 📝 QUIZ — DEVOPS_L15_MID
+
+---
+
+## 📍 Slide 20 – 📊 Section 3: The Three Pillars of Observability
+
+**Observability = Understanding system behavior from outputs**
+
+```mermaid
+flowchart TD
+  A[📊 Metrics] --> D[🔍 Observability]
+  B[📝 Logs] --> D
+  C[🔗 Traces] --> D
+  D --> E[💡 Understanding]
+```
+
+| 📊 Pillar | 📝 What It Answers | 🛠️ Tools |
+|----------|-------------------|----------|
+| **Metrics** | What is happening? (numbers) | Prometheus, Grafana |
+| **Logs** | What happened? (events) | Loki, ELK |
+| **Traces** | Where did it happen? (requests) | Jaeger, Zipkin |
+
+---
+
+## 📍 Slide 21 – 📈 Prometheus: The Metrics Foundation
+
+**What is Prometheus?**
+
+* 📊 Time-series database for metrics
+* 🔍 Pull-based metric collection
+* 📝 Powerful query language (PromQL)
+* 🔔 Built-in alerting
+
+```mermaid
+flowchart LR
+  A[📦 App with /metrics] --> |Pull| B[📊 Prometheus]
+  C[📦 Another App] --> |Pull| B
+  B --> D[📈 Grafana]
+  B --> E[🔔 Alertmanager]
+```
+
+---
+
+## 📍 Slide 22 – 🎯 Prometheus Metric Types
+
+| 📊 Type | 📝 Description | 🎯 Example |
+|--------|---------------|-----------|
+| **Counter** | Only goes up | Total requests, errors |
+| **Gauge** | Can go up/down | Temperature, queue size |
+| **Histogram** | Distribution of values | Request latency |
+| **Summary** | Similar to histogram | Quantiles |
+
+**Example metrics:**
+```promql
+# Counter - total HTTP requests
+http_requests_total{method="GET", status="200"}
+
+# Gauge - currently available memory
+node_memory_MemAvailable_bytes
+
+# Histogram - request duration
+http_request_duration_seconds_bucket{le="0.5"}
+```
+
+---
+
+## 📍 Slide 23 – 🔍 PromQL Basics
+
+**Query examples:**
+
+```promql
+# Current value
+up{job="kubernetes-pods"}
+
+# Rate of change (per second over 5m)
+rate(http_requests_total[5m])
+
+# Error rate percentage
+sum(rate(http_requests_total{status=~"5.."}[5m])) /
+sum(rate(http_requests_total[5m])) * 100
+
+# 99th percentile latency
+histogram_quantile(0.99, rate(http_request_duration_seconds_bucket[5m]))
+
+# Top 5 pods by CPU
+topk(5, sum by (pod) (rate(container_cpu_usage_seconds_total[5m])))
+```
+
+---
+
+## 📍 Slide 24 – 📦 kube-prometheus-stack
+
+**All-in-one monitoring solution:**
+
+```mermaid
+flowchart TD
+  A[📦 kube-prometheus-stack] --> B[📊 Prometheus]
+  A --> C[📈 Grafana]
+  A --> D[🔔 Alertmanager]
+  A --> E[📝 Node Exporter]
+  A --> F[📊 kube-state-metrics]
+```
+
+**Includes:**
+* 🔧 Pre-configured scrape targets
+* 📊 Default dashboards
+* 🔔 Default alerting rules
+* 📈 Grafana with data sources configured
+
+```bash
+helm install prometheus prometheus-community/kube-prometheus-stack
+```
+
+---
+
+## 📍 Slide 25 – 📈 Grafana Dashboards
+
+**Key Grafana concepts:**
+
+| 🔧 Concept | 📝 Description |
+|-----------|---------------|
+| **Data Source** | Where data comes from (Prometheus) |
+| **Dashboard** | Collection of panels |
+| **Panel** | Single visualization |
+| **Variable** | Dynamic filters (namespace, pod) |
+
+**Popular pre-built dashboards:**
+* 🔢 **1860:** Node Exporter Full
+* 🔢 **315:** Kubernetes cluster
+* 🔢 **7249:** Kubernetes Pod Resources
+
+---
+
+## 📍 Slide 26 – 🔔 Alerting with Alertmanager
+
+**Alert flow:**
+
+```mermaid
+flowchart LR
+  A[📊 Prometheus] --> |Alert fires| B[🔔 Alertmanager]
+  B --> |Route| C[📧 Email]
+  B --> |Route| D[💬 Slack]
+  B --> |Route| E[📱 PagerDuty]
+```
+
+**Alert rule example:**
+```yaml
+groups:
+  - name: app-alerts
+    rules:
+      - alert: HighErrorRate
+        expr: |
+          sum(rate(http_requests_total{status=~"5.."}[5m])) /
+          sum(rate(http_requests_total[5m])) > 0.01
+        for: 5m
+        labels:
+          severity: critical
+        annotations:
+          summary: "High error rate detected"
+          description: "Error rate is {{ $value | humanizePercentage }}"
+```
+
+---
+
+## 📍 Slide 27 – 📊 The Four Golden Signals
+
+**Google SRE's essential metrics:**
+
+| 🔔 Signal | 📝 What to Measure | 📊 Prometheus Example |
+|----------|-------------------|----------------------|
+| **Latency** | Response time | `histogram_quantile(0.99, ...)` |
+| **Traffic** | Request rate | `rate(http_requests_total[5m])` |
+| **Errors** | Failure rate | `rate(http_requests_total{status=~"5.."}[5m])` |
+| **Saturation** | Resource usage | `container_memory_usage_bytes / limit` |
+
+> 💡 **Tip:** Start by monitoring these four signals for every service
+
+---
+
+## 📍 Slide 28 – 🔧 Init Containers for Dependencies
+
+**Problem:** App starts before database is ready
+
+```yaml
+spec:
+  initContainers:
+    - name: wait-for-db
+      image: busybox
+      command:
+        - sh
+        - -c
+        - |
+          until nc -z postgres-0.postgres-headless 5432; do
+            echo "Waiting for database..."
+            sleep 2
+          done
+  containers:
+    - name: app
+      image: my-app
+```
+
+```mermaid
+flowchart LR
+  A[🚀 Pod Start] --> B[⏳ Init Container]
+  B --> |DB Ready| C[📦 App Container]
+```
+
+---
+
+## 📍 Slide 29 – 🏭 Section 4: Production Monitoring Setup
+
+**ServiceMonitor for custom apps:**
+
+```yaml
+apiVersion: monitoring.coreos.com/v1
+kind: ServiceMonitor
+metadata:
+  name: my-app-monitor
+spec:
+  selector:
+    matchLabels:
+      app: my-app
+  endpoints:
+    - port: metrics
+      interval: 30s
+      path: /metrics
+```
+
+**What this does:**
+* 🔍 Tells Prometheus to scrape your app
+* 📊 Collects metrics from `/metrics` endpoint
+* ⏱️ Every 30 seconds
+
+---
+
+## 📍 Slide 30 – 📊 Monitoring StatefulSets
+
+**Key metrics for stateful apps:**
+
+| 📊 Metric | 📝 Why Important |
+|----------|------------------|
+| `kubelet_volume_stats_used_bytes` | Disk usage per PVC |
+| `kube_statefulset_replicas` | Desired replica count (compare with ready replicas) |
+| `kube_statefulset_status_replicas_ready` | Healthy replicas |
+| App-specific metrics | Replication lag, connections |
+
+**Alert example:**
+```yaml
+- alert: StatefulSetNotReady
+  expr: |
+    kube_statefulset_status_replicas_ready /
+    kube_statefulset_replicas < 1
+  for: 5m
+  labels:
+    severity: warning
+```
+
+---
+
+## 📍 Slide 31 – 📈 Resource Monitoring
+
+**CPU and Memory queries:**
+
+```promql
+# CPU usage percentage
+sum(rate(container_cpu_usage_seconds_total{pod=~"my-app.*"}[5m])) /
+sum(kube_pod_container_resource_limits{resource="cpu", pod=~"my-app.*"}) * 100
+
+# Memory usage percentage
+sum(container_memory_working_set_bytes{pod=~"my-app.*"}) /
+sum(kube_pod_container_resource_limits{resource="memory", pod=~"my-app.*"}) * 100
+```
+
+**Capacity planning alerts:**
+```yaml
+- alert: HighMemoryUsage
+  expr: |
+    sum(container_memory_working_set_bytes) by (pod) /
+    sum(kube_pod_container_resource_limits{resource="memory"}) by (pod) > 0.8
+  for: 15m
+```
+
+---
+
+## 📍 Slide 32 – 🔔 Alert Fatigue Prevention
+
+**Problem:** Too many alerts = ignored alerts
+
+| ❌ Bad Practice | ✅ Better Approach |
+|----------------|-------------------|
+| Alert on every metric | Alert on symptoms, not causes |
+| No severity levels | Critical, warning, info tiers |
+| Alert immediately | Use `for` duration |
+| Generic messages | Actionable descriptions |
+| No runbooks | Link to debugging guides |
+
+**Good alert structure:**
+```yaml
+annotations:
+  summary: "High error rate on {{ $labels.service }}"
+  description: "Error rate is {{ $value | humanizePercentage }} (threshold: 1%)"
+  runbook_url: "https://wiki/alerts/high-error-rate"
+```
+
+---
+
+## 📍 Slide 33 – 📊 Dashboard Best Practices
+
+**Effective dashboard layout:**
+
+```
+┌─────────────────────────────────────────┐
+│  📊 Overview: Key metrics at a glance   │
+├─────────────┬─────────────┬─────────────┤
+│  🔴 Errors  │  ⏱️ Latency │  📈 Traffic │
+├─────────────┴─────────────┴─────────────┤
+│  💾 Resource Usage (CPU, Memory, Disk)  │
+├─────────────────────────────────────────┤
+│  🔍 Detailed Breakdowns (per pod, etc.) │
+└─────────────────────────────────────────┘
+```
+
+**Tips:**
+* 📊 Start with high-level, drill down for details
+* 🎨 Use consistent colors (red = bad)
+* 📝 Add descriptions to panels
+* 🔗 Link related dashboards
+
+---
+
+## 📍 Slide 34 – 🏢 Real-World: Observability at Scale
+
+**Netflix observability approach:**
+
+* 📊 **Metrics:** Atlas (Prometheus-like, billions of time series)
+* 📝 **Logs:** Mantis (real-time stream processing)
+* 🔗 **Traces:** Edgar (distributed tracing)
+* 🔔 **Alerts:** Focused on customer impact
+
+**Key lessons:**
+* 🎯 Focus on **business metrics** (not just infra)
+* 🔄 Automate **remediation** where possible
+* 📈 Invest in **dashboards** as a product
+* 👥 Make observability **everyone's** job
+
+---
+
+## 📍 Slide 35 – 🎯 Key Takeaways
+
+1. 🗄️ **StatefulSets** provide stable identity and per-pod storage for databases
+2. 🌐 **Headless services** enable direct pod-to-pod communication
+3. 📊 **Three pillars:** Metrics, Logs, Traces for full observability
+4. 📈 **Prometheus + Grafana** is the standard K8s monitoring stack
+5. 🔔 **Alerts should be actionable** — avoid alert fatigue
+6. 🎯 **Four Golden Signals:** Latency, Traffic, Errors, Saturation
+
+> 💬 *"Observability is not about collecting data, it's about understanding your system."*
+
+---
+
+## 📍 Slide 36 – 🧠 Mindset Shift
+
+| 😰 Old Mindset | 🚀 New Mindset |
+|---------------|----------------|
+| "It's working, don't touch it" | "I can see it's working" |
+| "Let's check the logs" | "The dashboard shows the issue" |
+| "User reported an error" | "Alert fired before impact" |
+| "Database needs restart" | "DB has stable identity, restart is safe" |
+| "Collect all the metrics" | "Monitor what matters" |
+| "Alert on everything" | "Alert on symptoms, investigate causes" |
+
+> 🤔 **Question:** What's the first dashboard you'd build for your app?
+
+---
+
+## 📍 Slide 37 – 📝 QUIZ — DEVOPS_L15_POST
+
+---
+
+## 📍 Slide 38 – 🚀 What's Next?
+
+**Coming up: Lecture 16 — Beyond Kubernetes**
+
+```mermaid
+flowchart LR
+  A[☸️ Kubernetes] --> B[✈️ Fly.io]
+  A --> C[🌐 IPFS/4EVERLAND]
+  B --> D[🌍 Global Edge]
+  C --> E[🔗 Decentralized]
+```
+
+* ✈️ **Fly.io:** Edge deployment simplified
+* 🌐 **IPFS:** Decentralized hosting
+* 🤔 **When to use what:** Trade-offs and decisions
+* 🎯 **Beyond the cluster:** Alternative deployment models
+
+> 🎯 **Labs 15 & 16:** Convert your app to StatefulSet and set up comprehensive monitoring!
+
+---
+
+## 📚 Resources
+
+**StatefulSets:**
+* 📖 [Kubernetes StatefulSets](https://kubernetes.io/docs/concepts/workloads/controllers/statefulset/)
+* 📖 [Headless Services](https://kubernetes.io/docs/concepts/services-networking/service/#headless-services)
+
+**Observability:**
+* 📖 [Prometheus Docs](https://prometheus.io/docs/)
+* 📖 [Grafana Docs](https://grafana.com/docs/)
+* 📖 [kube-prometheus-stack](https://github.com/prometheus-community/helm-charts/tree/main/charts/kube-prometheus-stack)
+
+**Books:**
+* 📕 *Observability Engineering* by Charity Majors, et al.
+* 📕 *Site Reliability Engineering* by Google
+* 📕 *Kubernetes Patterns* by Bilgin Ibryam & Roland Huß
diff --git a/lectures/lec16.md b/lectures/lec16.md
new file mode 100644
index 0000000000..2f8bf01d5b
--- /dev/null
+++ b/lectures/lec16.md
@@ -0,0 +1,717 @@
+# 📌 Lecture 16 — Beyond Kubernetes: Alternative Deployment Models
+
+> 🎯 **From cluster management to platform abstraction and decentralized hosting**
+
+---
+
+## 📍 Slide 1 – 🚀 Kubernetes Isn't Always the Answer
+
+We've mastered Kubernetes. But is it always the right choice?
+
+* ☸️ **Kubernetes:** Powerful, but complex
+* ✈️ **PaaS (Fly.io):** Simple, global, managed
+* 🌐 **Decentralized (IPFS):** Permanent, censorship-resistant
+
+```mermaid
+flowchart LR
+  A[📦 Your App] --> B{What matters most?}
+  B --> |Control & Scale| C[☸️ Kubernetes]
+  B --> |Simplicity & Global| D[✈️ Fly.io]
+  B --> |Permanence & Decentralization| E[🌐 IPFS]
+```
+
+> 🎯 **Goal:** Understand when to choose each deployment model
+
+---
+
+## 📍 Slide 2 – 📚 Learning Outcomes
+
+By the end of this lecture, you will:
+
+| # | 🎯 Outcome |
+|---|-----------|
+| 1 | ✅ Evaluate **trade-offs** between deployment models |
+| 2 | ✅ Deploy applications to **Fly.io** edge network |
+| 3 | ✅ Understand **IPFS** and content addressing |
+| 4 | ✅ Use **4EVERLAND** for decentralized hosting |
+| 5 | ✅ Choose the **right tool** for different use cases |
+| 6 | ✅ Appreciate the **evolving cloud landscape** |
+
+---
+
+## 📍 Slide 3 – 🗺️ Lecture Overview
+
+```
+┌─────────────────────────────────────────────────────────────┐
+│  SECTION 0: Introduction                    (Slides 1-4)   │
+├─────────────────────────────────────────────────────────────┤
+│  📝 PRE QUIZ                                (Slide 5)      │
+├─────────────────────────────────────────────────────────────┤
+│  SECTION 1: The Complexity Trade-off        (Slides 6-10)  │
+├─────────────────────────────────────────────────────────────┤
+│  SECTION 2: Edge Computing with Fly.io      (Slides 11-18) │
+├─────────────────────────────────────────────────────────────┤
+│  📝 MID QUIZ                                (Slide 19)     │
+├─────────────────────────────────────────────────────────────┤
+│  SECTION 3: Decentralized Web & IPFS        (Slides 20-28) │
+├─────────────────────────────────────────────────────────────┤
+│  SECTION 4: Choosing Your Path              (Slides 29-35) │
+├─────────────────────────────────────────────────────────────┤
+│  📝 POST QUIZ                               (Slide 36)     │
+├─────────────────────────────────────────────────────────────┤
+│  FINAL: Course Wrap-up                      (Slide 37)     │
+└─────────────────────────────────────────────────────────────┘
+```
+
+---
+
+## 📍 Slide 4 – 🤔 The Big Question
+
+> 💬 *"The best tool is the one that solves your problem with the least unnecessary complexity."*
+> — Practical Engineering Wisdom
+
+**Consider these scenarios:**
+
+* 🏢 **Enterprise with 500 microservices:** Probably needs Kubernetes
+* 🚀 **Startup with 3 developers:** Maybe doesn't need a cluster
+* 📰 **News article that must stay online forever:** Decentralized?
+* 🌍 **App serving users globally:** Edge deployment?
+
+> 🤔 **Think:** What does YOUR application actually need?
+
+---
+
+## 📍 Slide 5 – 📝 QUIZ — DEVOPS_L16_PRE
+
+---
+
+## 📍 Slide 6 – ⚠️ Section 1: The Kubernetes Tax
+
+**What Kubernetes requires:**
+
+```mermaid
+flowchart TD
+  A[☸️ Kubernetes Cluster] --> B[🔧 Cluster Management]
+  A --> C[🔐 Security Hardening]
+  A --> D[📊 Monitoring Setup]
+  A --> E[🔄 Upgrade Planning]
+  A --> F[💰 Infrastructure Cost]
+```
+
+* 🔧 **Cluster operations:** Updates, scaling, troubleshooting
+* 🧠 **Team expertise:** Steep learning curve
+* 💰 **Cost:** Control plane, nodes, load balancers
+* ⏱️ **Time:** Setup, maintenance, incident response
+
+---
+
+## 📍 Slide 7 – 🔥 When Kubernetes Is Overkill
+
+**Signs you might not need Kubernetes:**
+
+| 🚩 Sign | 📝 Alternative |
+|--------|---------------|
+| Single application | PaaS (Fly.io, Railway, Render) |
+| Small team (1-5 devs) | Managed services |
+| Simple deployment needs | Container platforms |
+| Cost-sensitive startup | Serverless or PaaS |
+| No specialized workloads | Simpler solutions |
+
+> 💬 *"Don't use Kubernetes to solve problems you don't have."*
+
+---
+
+## 📍 Slide 8 – 📊 The Abstraction Spectrum
+
+```mermaid
+flowchart LR
+  A[🖥️ Bare Metal] --> B[☁️ VMs/IaaS]
+  B --> C[☸️ Kubernetes]
+  C --> D[✈️ PaaS]
+  D --> E[⚡ Serverless]
+  E --> F[🌐 Decentralized]
+
+  G[More Control] -.-> A
+  H[More Abstraction] -.-> F
+```
+
+| 🎚️ Level | 🔧 You Manage | ✅ Platform Manages |
+|----------|--------------|---------------------|
+| Bare Metal | Everything | Nothing |
+| IaaS (EC2) | OS, runtime, app | Hardware |
+| Kubernetes | App, configs | Orchestration |
+| PaaS | App code only | Everything else |
+| Serverless | Functions | Runtime, scaling |
+
+---
+
+## 📍 Slide 9 – 🎯 Right Tool, Right Job
+
+**Decision factors:**
+
+| 📋 Factor | ☸️ K8s | ✈️ PaaS | 🌐 IPFS |
+|----------|--------|--------|---------|
+| Team size | Large | Small | Varies |
+| Control needs | High | Medium | Low |
+| Cost at scale | Efficient | Can be expensive | Very low |
+| Setup time | Days/weeks | Minutes | Minutes |
+| Global distribution | Manual config | Built-in | Inherent |
+| Vendor lock-in | Low | Medium | None |
+
+---
+
+## 📍 Slide 10 – 💡 The Emergence of Edge Computing
+
+**Traditional deployment:**
+```
+User (Tokyo) → CDN → US-East Server → Response (200ms)
+```
+
+**Edge deployment:**
+```
+User (Tokyo) → Edge Server (Tokyo) → Response (20ms)
+```
+
+```mermaid
+flowchart TD
+  A[🌍 User Anywhere] --> B{Edge Network}
+  B --> C[🗼 Tokyo]
+  B --> D[🗼 London]
+  B --> E[🗼 New York]
+  B --> F[🗼 Sydney]
+```
+
+* ⚡ **Lower latency:** Code runs closer to users
+* 🌍 **Global by default:** No region configuration
+* 🔄 **Automatic routing:** Users hit nearest edge
+
+---
+
+## 📍 Slide 11 – ✈️ Section 2: Fly.io - Simplicity Meets Global
+
+**What is Fly.io?**
+
+* ✈️ Platform for running apps globally
+* 📦 Deploys Docker containers (or builds from source)
+* 🌍 Available in 30+ regions worldwide (you choose where your app runs)
+* 💰 Free tier for small apps
+
+```mermaid
+flowchart LR
+  A[📦 Your Container] --> B[✈️ Fly.io]
+  B --> C[🗼 Edge 1]
+  B --> D[🗼 Edge 2]
+  B --> E[🗼 Edge 3]
+  C --> F[👤 Users]
+  D --> F
+  E --> F
+```
+
+---
+
+## 📍 Slide 12 – 🛠️ Fly.io Architecture
+
+**Key concepts:**
+
+| 🔧 Concept | 📝 Description |
+|-----------|---------------|
+| **Machine** | A Fly VM running your app |
+| **App** | A named collection of Machines |
+| **Region** | A geographical location (ams, iad, sin) |
+| **Volume** | Persistent storage attached to Machine |
+| **Secret** | Encrypted environment variable |
+
+```toml
+# fly.toml
+app = "my-app"
+primary_region = "ams"
+
+[http_service]
+  internal_port = 8080
+  force_https = true
+  auto_stop_machines = true
+  auto_start_machines = true
+```
+
+---
+
+## 📍 Slide 13 – 🚀 Deploying to Fly.io
+
+**The entire deployment process:**
+
+```bash
+# 1. Install CLI
+curl -L https://fly.io/install.sh | sh
+
+# 2. Login
+fly auth login
+
+# 3. Launch (creates app + config)
+fly launch
+
+# 4. Deploy
+fly deploy
+
+# 5. Open in browser
+fly open
+```
+
+**That's it!** No cluster, no YAML manifests, no ingress controllers.
+
+---
+
+## 📍 Slide 14 – 🌍 Multi-Region Deployment
+
+**Adding regions:**
+
+```bash
+# Add regions
+fly regions add iad sin syd
+
+# Check machines
+fly machines list
+
+# Scale in specific region
+fly scale count 2 --region ams
+```
+
+```mermaid
+flowchart TD
+  A[✈️ Your App] --> B[🇳🇱 Amsterdam]
+  A --> C[🇺🇸 Virginia]
+  A --> D[🇸🇬 Singapore]
+  A --> E[🇦🇺 Sydney]
+
+  F[👤 European User] --> B
+  G[👤 US User] --> C
+  H[👤 Asian User] --> D
+  I[👤 Australian User] --> E
+```
+
+---
+
+## 📍 Slide 15 – 🔐 Secrets & Storage on Fly.io
+
+**Secrets:**
+```bash
+fly secrets set DATABASE_URL="postgres://..."
+fly secrets set API_KEY="secret123"
+fly secrets list
+```
+
+**Persistent storage:**
+```bash
+# Create volume
+fly volumes create mydata --size 1 --region ams
+```
+
+```toml
+# fly.toml
+[mounts]
+  source = "mydata"
+  destination = "/data"
+```
+
+---
+
+## 📍 Slide 16 – 📊 Fly.io vs Kubernetes Comparison
+
+| 📋 Aspect | ☸️ Kubernetes | ✈️ Fly.io |
+|----------|--------------|----------|
+| Setup time | Hours/days | Minutes |
+| Learning curve | Steep | Gentle |
+| Global distribution | Manual | Built-in |
+| Scaling | HPA, VPA, manual | Auto-scale, simple commands |
+| Cost (small app) | $50-100/month | Free tier available |
+| Control | Full | Limited |
+| Customization | Unlimited | Constrained |
+| Multi-cloud | Yes | No (Fly only) |
+
+---
+
+## 📍 Slide 17 – 🎯 When to Choose Fly.io
+
+**Good fit:**
+
+* ✅ Small to medium applications
+* ✅ Need for low global latency
+* ✅ Small team, limited DevOps resources
+* ✅ Rapid iteration, quick deployments
+* ✅ Cost-conscious early-stage projects
+
+**Not ideal:**
+
+* ❌ Complex microservices architectures
+* ❌ Need for specific cloud services (AWS RDS, etc.)
+* ❌ Compliance requirements for specific regions
+* ❌ Already invested heavily in Kubernetes
+
+---
+
+## 📍 Slide 18 – 🔧 Fly.io Best Practices
+
+| 📋 Practice | 📝 Reason |
+|------------|----------|
+| Use auto_stop_machines | Save costs when idle |
+| Add health checks | Enable auto-restart on failure |
+| Use volumes for stateful data | Machines are ephemeral |
+| Set min_machines_running | Prevent cold starts |
+| Use regions near your users | Optimize latency |
+
+```toml
+[http_service]
+  auto_stop_machines = true
+  auto_start_machines = true
+  min_machines_running = 1
+
+[checks]
+  [checks.health]
+    type = "http"
+    port = 8080
+    path = "/health"
+```
+
+---
+
+## 📍 Slide 19 – 📝 QUIZ — DEVOPS_L16_MID
+
+---
+
+## 📍 Slide 20 – 🌐 Section 3: IPFS & The Decentralized Web
+
+**What is IPFS?**
+
+* 🌐 **InterPlanetary File System**
+* 📦 Distributed, peer-to-peer storage
+* 🔗 Content-addressed (identified by hash, not location)
+* ♾️ Immutable content that persists as long as at least one node pins it
+
+```mermaid
+flowchart LR
+  A[📄 File] --> B[#️⃣ Hash]
+  B --> C[🔗 CID: QmXxx...]
+  C --> D[🌐 Available Globally]
+```
+
+> 💡 **Key insight:** Same content = same address, anywhere in the world
+
+---
+
+## 📍 Slide 21 – 🔍 Content Addressing Explained
+
+**Traditional web (location-based):**
+```
+https://server.com/path/to/file.html
+                    ↓
+        Server could change content!
+```
+
+**IPFS (content-based):**
+```
+ipfs://QmXxx.../file.html
+          ↓
+   Hash of actual content
+   If content changes, hash changes!
+```
+
+| 📋 Aspect | 🌐 HTTP | 🔗 IPFS |
+|----------|--------|---------|
+| Addressing | Location | Content hash |
+| Mutability | Content can change | Content is immutable |
+| Availability | Single server | Distributed nodes |
+| Censorship | Easy to block | Very difficult |
+
+---
+
+## 📍 Slide 22 – 🔑 IPFS Key Concepts
+
+| 🔧 Concept | 📝 Description |
+|-----------|---------------|
+| **CID** | Content Identifier - hash of content |
+| **Node** | Computer running IPFS software |
+| **Pinning** | Keeping content available (prevents garbage collection) |
+| **Gateway** | HTTP bridge to IPFS content |
+| **IPNS** | Mutable pointer to IPFS content |
+
+**Example CIDs:**
+```
+QmXoypizjW3WknFiJnKLwHCnL72vedxjQkDDP1mXWo6uco
+bafybeigdyrzt5sfp7udm7hu76uh7y26nf3efuylqabf3oclgtqy55fbzdi
+```
+
+---
+
+## 📍 Slide 23 – 📌 Pinning Services
+
+**The persistence problem:**
+
+```mermaid
+flowchart TD
+  A[📄 Add Content] --> B[🔗 Get CID]
+  B --> C{Who stores it?}
+  C --> |Your node| D[🖥️ Goes offline = Content unavailable]
+  C --> |Pinning service| E[☁️ Always available]
+```
+
+**Pinning services:**
+* 📌 **4EVERLAND** — Web3 hosting platform
+* 📌 **Pinata** — IPFS pinning
+* 📌 **Infura** — IPFS API
+* 📌 **web3.storage** — Free storage
+
+---
+
+## 📍 Slide 24 – 🌐 4EVERLAND Platform
+
+**What is 4EVERLAND?**
+
+* 🌐 Web3 infrastructure platform
+* 📦 IPFS hosting made simple
+* 🔧 Deploy from Git (like Vercel/Netlify)
+* 💰 Free tier available
+
+**Services:**
+* 🚀 **Hosting:** Deploy static sites and SPAs
+* 📦 **Bucket:** IPFS storage (like S3)
+* 🌐 **Gateway:** Access IPFS content via HTTP
+
+---
+
+## 📍 Slide 25 – 🚀 Deploying to 4EVERLAND
+
+**Process:**
+
+```mermaid
+flowchart LR
+  A[📝 Git Push] --> B[🔄 4EVERLAND Build]
+  B --> C[📦 Upload to IPFS]
+  C --> D[🔗 Get CID]
+  D --> E[🌐 Available via Gateway]
+```
+
+**Steps:**
+1. 🔗 Connect GitHub repository
+2. ⚙️ Configure build settings
+3. 🚀 Deploy
+4. 🔗 Access via CID or custom domain
+
+**URLs:**
+* `https://your-project.4everland.app`
+* `https://ipfs.4everland.link/ipfs/CID`
+
+---
+
+## 📍 Slide 26 – 🔄 IPNS: Mutable Pointers
+
+**Problem:** CID changes when content changes
+
+**Solution:** IPNS (InterPlanetary Name System)
+
+```mermaid
+flowchart LR
+  A[🔑 IPNS Name] --> B[🔗 CID v1]
+  A --> |Update| C[🔗 CID v2]
+```
+
+| 📋 Type | 🔗 Address | 📝 Behavior |
+|--------|-----------|------------|
+| **IPFS** | `/ipfs/QmXxx` | Always same content |
+| **IPNS** | `/ipns/k51xxx` | Points to current version |
+
+**4EVERLAND handles this:** Your URL stays the same, content updates automatically
+
+---
+
+## 📍 Slide 27 – 📊 Centralized vs Decentralized
+
+| 📋 Aspect | 🏢 Traditional | 🌐 IPFS/4EVERLAND |
+|----------|---------------|-------------------|
+| Single point of failure | Yes | No |
+| Censorship resistance | Low | High |
+| Content integrity | Trust server | Cryptographic verification |
+| Hosting cost | Ongoing | Low; content stays available while at least one node pins it |
+| Update mechanism | Overwrite file | New CID (or IPNS) |
+| Speed | Fast (CDN) | Variable (depends on nodes) |
+| Best for | Dynamic apps | Static content, archives |
+
+---
+
+## 📍 Slide 28 – 🎯 When to Choose IPFS/4EVERLAND
+
+**Good fit:**
+
+* ✅ Static websites and documentation
+* ✅ Content that must survive (archives, important documents)
+* ✅ Censorship-resistant publishing
+* ✅ NFT metadata and assets
+* ✅ Open source project hosting
+
+**Not ideal:**
+
+* ❌ Dynamic server-side applications
+* ❌ Real-time updates needed
+* ❌ Private content (IPFS is public by default)
+* ❌ High-performance requirements
+
+---
+
+## 📍 Slide 29 – 🎯 Section 4: Making the Right Choice
+
+**Decision Framework:**
+
+```mermaid
+flowchart TD
+  A[📦 Your Application] --> B{Need dynamic backend?}
+  B --> |Yes| C{Team size?}
+  B --> |No, static| D{Permanence important?}
+
+  C --> |Large, experienced| E[☸️ Kubernetes]
+  C --> |Small| F{Global latency critical?}
+
+  F --> |Yes| G[✈️ Fly.io]
+  F --> |No| H[Simple hosting]
+
+  D --> |Yes| I[🌐 IPFS/4EVERLAND]
+  D --> |No| J[Static hosting CDN]
+```
+
+---
+
+## 📍 Slide 30 – 📊 Summary Comparison
+
+| 📋 Criteria | ☸️ Kubernetes | ✈️ Fly.io | 🌐 4EVERLAND/IPFS |
+|------------|--------------|----------|-------------------|
+| **Complexity** | High | Low | Low |
+| **Control** | Full | Medium | Limited |
+| **Scalability** | Unlimited | Good | N/A (static) |
+| **Global distribution** | Manual | Automatic | Inherent |
+| **Cost at scale** | Efficient | Can be expensive | Very low |
+| **Learning curve** | Steep | Gentle | Minimal |
+| **Use case** | Microservices, enterprise | Global apps, startups | Static content, Web3 |
+
+---
+
+## 📍 Slide 31 – 🏢 Real-World Examples
+
+**Kubernetes users:**
+* 🏢 **Spotify:** 200+ microservices
+* 🏢 **Pinterest:** ML workloads
+* 🏢 **Airbnb:** Multi-region deployments
+
+**Fly.io users:**
+* 🚀 **Small startups:** Quick global deployment
+* 🎮 **Game backends:** Low-latency requirements
+* 🛠️ **Developer tools:** API services
+
+**IPFS/Decentralized:**
+* 📚 **Wikipedia mirror:** Censorship-resistant access
+* 🎨 **NFT projects:** Metadata storage
+* 📰 **News archives:** Permanent preservation
+
+---
+
+## 📍 Slide 32 – 🔮 The Future of Deployment
+
+**Trends to watch:**
+
+| 🔮 Trend | 📝 Description |
+|---------|---------------|
+| **Edge computing** | Code runs closer to users |
+| **WebAssembly** | Run any language at the edge |
+| **Decentralization** | Web3 infrastructure growth |
+| **Platform abstraction** | Less infra management |
+| **AI-assisted DevOps** | Automated operations |
+
+> 💬 *"The cloud is just someone else's computer. The edge is everyone's computer."*
+
+---
+
+## 📍 Slide 33 – 📋 Practical Recommendations
+
+**For students and learning:**
+1. 🎓 Master Kubernetes fundamentals first
+2. ✈️ Try Fly.io for personal projects
+3. 🌐 Experiment with IPFS for static sites
+
+**For production decisions:**
+1. 📋 Start with requirements, not technology
+2. 📊 Consider team capabilities
+3. 💰 Factor in total cost (including time)
+4. 🔄 Plan for evolution
+
+---
+
+## 📍 Slide 34 – 🎯 Key Takeaways
+
+1. ☸️ **Kubernetes is powerful** but comes with complexity costs
+2. ✈️ **Fly.io offers simplicity** for global, low-latency applications
+3. 🌐 **IPFS provides permanence** and censorship resistance
+4. 🎯 **No single best solution** — choose based on requirements
+5. 📊 **Consider the trade-offs:** control vs simplicity, cost vs features
+6. 🔮 **The landscape evolves** — stay curious, keep learning
+
+> 💬 *"The best architecture is the one your team can operate successfully."*
+
+---
+
+## 📍 Slide 35 – 🧠 Course Mindset Shift
+
+| 😰 Before This Course | 🚀 After This Course |
+|----------------------|---------------------|
+| "How do I deploy this?" | "What's the best deployment model?" |
+| "Kubernetes is complicated" | "I understand K8s and its alternatives" |
+| "DevOps is ops work" | "DevOps is a culture and practice" |
+| "I write code, someone else deploys" | "I can deploy, monitor, and maintain" |
+| "Just get it working" | "Make it observable, scalable, reliable" |
+
+---
+
+## 📍 Slide 36 – 📝 QUIZ — DEVOPS_L16_POST
+
+---
+
+## 📍 Slide 37 – 🎓 Course Wrap-up
+
+**What you've learned:**
+
+```mermaid
+flowchart LR
+  A[🐳 Docker] --> B[☸️ Kubernetes]
+  B --> C[🔄 CI/CD]
+  C --> D[📊 Observability]
+  D --> E[🔐 Security]
+  E --> F[🌍 Global Deployment]
+```
+
+**Your DevOps toolkit:**
+* 🐳 **Containerization:** Docker, multi-stage builds
+* ☸️ **Orchestration:** Kubernetes, Helm, StatefulSets
+* 🔄 **GitOps:** ArgoCD, declarative infrastructure
+* 📊 **Observability:** Prometheus, Grafana, alerting
+* 🔐 **Security:** Secrets management, Vault
+* 🚀 **Progressive delivery:** Canary, blue-green
+* 🌍 **Beyond K8s:** Edge computing, decentralized hosting
+
+> 🎉 **Congratulations!** You're now equipped for production DevOps.
+
+---
+
+## 📚 Resources
+
+**Fly.io:**
+* 📖 [Fly.io Documentation](https://fly.io/docs/)
+* 📖 [flyctl Reference](https://fly.io/docs/flyctl/)
+
+**IPFS & 4EVERLAND:**
+* 📖 [IPFS Documentation](https://docs.ipfs.tech/)
+* 📖 [4EVERLAND Docs](https://docs.4everland.org/)
+* 📖 [IPFS Concepts](https://docs.ipfs.tech/concepts/)
+
+**Further reading:**
+* 📕 *The DevOps Handbook* by Gene Kim, et al.
+* 📕 *Accelerate* by Nicole Forsgren, et al.
+* 📕 *Site Reliability Engineering* by Google
+
+**Keep learning:**
+* 🌐 [CNCF Landscape](https://landscape.cncf.io/)
+* 🌐 [DevOps Roadmap](https://roadmap.sh/devops)
diff --git a/lectures/lec2.md b/lectures/lec2.md
new file mode 100644
index 0000000000..46a3e0485a
--- /dev/null
+++ b/lectures/lec2.md
@@ -0,0 +1,1053 @@
+# 📌 Lecture 2 — Containerization with Docker: From "Works on My Machine" to Works Everywhere
+
+## 📍 Slide 1 – 🐳 Welcome to Containerization
+
+* 🌍 **"Works on my machine"** — the most expensive phrase in software
+* 📦 **Containers** = package your app + all dependencies together
+* 🚀 **Docker** = the tool that made containers mainstream
+* 🎯 This lecture: build production-ready containers from scratch
+
+```mermaid
+flowchart LR
+  Problem[😰 Works on My Machine] -->|Docker| Solution[🐳 Works Everywhere]
+  Solution --> Value[💎 Consistent Deployments]
+```
+
+---
+
+## 📍 Slide 2 – 🎯 Learning Outcomes
+
+* ✅ Understand containers vs VMs and why containers win
+* ✅ Write production-ready Dockerfiles
+* ✅ Apply security best practices (rootless, distroless)
+* ✅ Optimize images with multi-stage builds
+* ✅ Publish images to Docker Hub
+
+**🎓 By the end of this lecture:**
+
+| # | 🎯 Outcome |
+|---|-----------|
+| 1 | 🧠 Explain container architecture and benefits |
+| 2 | 📝 Write optimized, secure Dockerfiles |
+| 3 | 🔐 Implement rootless containers |
+| 4 | 📦 Use multi-stage builds for smaller images |
+| 5 | 🚀 Push/pull images from Docker Hub |
+
+---
+
+## 📍 Slide 3 – 📋 Lecture Overview
+
+* 📚 **Concepts + Diagrams** — how containers work
+* 🛠️ **Dockerfile deep dive** — instructions and best practices
+* 🔐 **Security patterns** — rootless and distroless
+* 📦 **Optimization** — multi-stage builds
+* 🌐 **Registry workflow** — Docker Hub
+
+**⏱️ Lecture Structure:**
+```
+Section 0: Introduction           → 📝 PRE Quiz
+Section 1: The Dependency Problem
+Section 2: Container Fundamentals
+Section 3: Dockerfile Scenarios   → 📝 MID Quiz
+Section 4: Advanced Patterns
+Section 5: Real World Usage
+Section 6: Reflection             → 📝 POST Quiz
+```
+
+---
+
+## 📍 Slide 4 – ❓ The Big Question
+
+* 📊 **65%** of organizations use containers in production (2024)
+* 🐳 **Docker Hub**: 14+ million images, 13+ billion pulls/month
+* 💥 Yet most Dockerfiles have **security vulnerabilities**
+
+> 💬 *"Containers are the new deployment unit"* — Kelsey Hightower
+
+**🤔 Think about it:**
+* Why do apps work locally but fail in production?
+* What's inside a container that makes it portable?
+* How small can a container image be?
+
+---
+
+## 📍 Slide 5 – 📝 QUIZ — DEVOPS_L2_PRE
+
+---
+
+## 📍 Slide 6 – 🔥 Section 1: The Dependency Problem
+
+* 👨‍💻 **Developer**: "It works on my machine!"
+* ⚙️ **Ops**: "Well, we're not shipping your machine!"
+* 🧩 **The real problem**: dependencies, versions, configurations
+* 💥 **Result**: deployment failures, debugging nightmares
+
+```mermaid
+flowchart LR
+  Dev[👨‍💻 Dev Machine] -->|Different| Prod[🌐 Production]
+  Dev -->|Python 3.11| V1[📦 Version]
+  Prod -->|Python 3.9| V2[📦 Version]
+  V1 -.->|💥 Conflict| V2
+```
+
+---
+
+## 📍 Slide 7 – 🧩 The Dependency Hell
+
+* 🐍 **Python version**: 3.9 vs 3.11 vs 3.12
+* 📚 **Library versions**: requests 2.28 vs 2.31
+* 🖥️ **OS differences**: Ubuntu vs Alpine vs macOS
+* ⚙️ **System libraries**: OpenSSL, libffi, glibc
+
+```mermaid
+flowchart TD
+  App[📱 Your App] --> Py[🐍 Python 3.11]
+  App --> Lib1[📚 Flask 2.3]
+  App --> Lib2[📚 Requests 2.31]
+  Py --> OS[🖥️ Ubuntu 22.04]
+  Lib1 --> SSL[🔐 OpenSSL 3.0]
+  OS --> Kernel[🧠 Linux Kernel]
+```
+
+> 🤔 **Think:** How many things can go wrong?
+
+---
+
+## 📍 Slide 8 – 😱 The VM Solution (Heavy)
+
+* 🖥️ **Virtual Machines** = entire OS per application
+* 💾 **Size**: 10-50 GB per VM
+* ⏱️ **Boot time**: minutes
+* 🔧 **Resource overhead**: hypervisor, guest OS kernel
+
+```mermaid
+flowchart TD
+  subgraph VM1[🖥️ VM 1 - 15GB]
+    App1[📱 App] --> OS1[🖥️ Full OS]
+    OS1 --> Kernel1[🧠 Kernel]
+  end
+  subgraph VM2[🖥️ VM 2 - 15GB]
+    App2[📱 App] --> OS2[🖥️ Full OS]
+    OS2 --> Kernel2[🧠 Kernel]
+  end
+  VM1 --> Hyper[⚙️ Hypervisor]
+  VM2 --> Hyper
+  Hyper --> Host[🖥️ Host OS]
+```
+
+**😰 Problems:**
+* 🐌 Slow to start
+* 💸 Expensive (RAM, CPU, storage)
+* 🔧 Hard to manage at scale
+
+---
+
+## 📍 Slide 9 – 🐳 The Container Solution (Light)
+
+* 📦 **Containers** = isolated processes sharing host kernel
+* 💾 **Size**: 5-500 MB typically
+* ⏱️ **Start time**: milliseconds
+* 🚀 **Density**: 10-100x more containers than VMs
+
+```mermaid
+flowchart TD
+  subgraph Containers
+    C1[📦 Container 1 - 50MB]
+    C2[📦 Container 2 - 50MB]
+    C3[📦 Container 3 - 50MB]
+  end
+  C1 --> Docker[🐳 Docker Engine]
+  C2 --> Docker
+  C3 --> Docker
+  Docker --> Host[🖥️ Host OS + Kernel]
+```
+
+**🚀 Benefits:**
+* ⚡ Start in milliseconds
+* 💰 Efficient resource usage
+* 📦 Portable across environments
+
+---
+
+## 📍 Slide 10 – 💸 VMs vs Containers
+
+| 🔍 Aspect | 🖥️ Virtual Machine | 🐳 Container |
+|-----------|-------------------|--------------|
+| 💾 **Size** | 10-50 GB | 5-500 MB |
+| ⏱️ **Boot Time** | Minutes | Milliseconds |
+| 🧠 **Kernel** | Own kernel | Shared kernel |
+| 🔒 **Isolation** | Strong (hardware) | Process-level |
+| 📦 **Density** | 10-20 per host | 100s per host |
+| 🎯 **Use Case** | Full OS needed | App deployment |
+
+**📈 Real Numbers:**
+* 🖥️ **VM**: 1 app = ~2GB RAM overhead
+* 🐳 **Container**: 1 app = ~50MB overhead
+* 🚀 **Result**: 40x more efficient!
+
+---
+
+## 📍 Slide 11 – 📜 History of Containerization
+
+* 🕰️ **1979**: `chroot` — change root directory (Unix V7)
+* 🔒 **2000**: FreeBSD Jails — first true isolation
+* 🐧 **2006**: cgroups — Google contributes to Linux kernel
+* 📦 **2008**: LXC (Linux Containers) — combines namespaces + cgroups
+* 🐳 **2013**: **Docker** — makes containers accessible to everyone
+* ☸️ **2014**: Kubernetes — container orchestration at scale
+* 📦 **2015**: OCI (Open Container Initiative) — standardization
+
+```mermaid
+flowchart LR
+  Chroot[🕰️ 1979: chroot] --> Jails[🔒 2000: Jails]
+  Jails --> Cgroups[🐧 2006: cgroups]
+  Cgroups --> LXC[📦 2008: LXC]
+  LXC --> Docker[🐳 2013: Docker]
+  Docker --> K8s[☸️ 2014: K8s]
+```
+
+> 💡 Docker didn't invent containers — it made them **usable**.
+
+---
+
+## 📍 Slide 12 – 🐧 Linux Kernel: Namespaces
+
+* 🎯 **Namespaces** = isolate what a process **can see**
+* 🔒 Each container gets its own "view" of the system
+
+| 🏷️ Namespace | 🔒 Isolates | 📝 Example |
+|--------------|------------|-----------|
+| **PID** | Process IDs | Container sees PID 1 as its init |
+| **NET** | Network stack | Own IP, ports, routing |
+| **MNT** | Mount points | Own filesystem view |
+| **UTS** | Hostname | Own hostname |
+| **IPC** | Inter-process comm | Own message queues |
+| **USER** | User/Group IDs | UID 0 in container can map to an unprivileged host UID (when user-namespace remapping is enabled) |
+
+```mermaid
+flowchart TD
+  subgraph Host[🖥️ Host System]
+    subgraph NS1[📦 Container 1 Namespace]
+      P1[PID 1: app]
+      Net1[eth0: 172.17.0.2]
+    end
+    subgraph NS2[📦 Container 2 Namespace]
+      P2[PID 1: app]
+      Net2[eth0: 172.17.0.3]
+    end
+  end
+```
+
+---
+
+## 📍 Slide 13 – 🎛️ Linux Kernel: cgroups
+
+* 🎯 **cgroups** (Control Groups) = limit what a process **can use**
+* 📊 Resource limits prevent one container from killing the host
+
+| 🎛️ cgroup | 🔧 Controls | 📝 Example |
+|-----------|------------|-----------|
+| **cpu** | CPU time | Max 50% of one core |
+| **memory** | RAM usage | Max 512MB |
+| **blkio** | Disk I/O | Max 100MB/s read |
+| **pids** | Process count | Max 100 processes |
+
+```mermaid
+flowchart LR
+  Container[🐳 Container] --> Cgroups[🎛️ cgroups]
+  Cgroups --> CPU[🖥️ CPU: 50%]
+  Cgroups --> RAM[💾 RAM: 512MB]
+  Cgroups --> IO[💿 I/O: 100MB/s]
+```
+
+**🛡️ Why it matters:**
+* ✅ Prevent runaway processes
+* ✅ Fair resource sharing
+* ✅ Predictable performance
+
+---
+
+## 📍 Slide 14 – 📂 Linux Kernel: Union Filesystems
+
+* 🎯 **Union FS** = layer multiple filesystems as one
+* 📚 Docker uses **overlay2** (default on Linux)
+* 💾 Image layers are **read-only**; changes go to a thin writable layer on top
+
+```mermaid
+flowchart TD
+  subgraph Image[📦 Image Layers - Read Only]
+    L1[🐧 Layer 1: Base OS]
+    L2[📦 Layer 2: Dependencies]
+    L3[📁 Layer 3: App Code]
+  end
+  subgraph Container[🏃 Container Layer - Read/Write]
+    L4[✏️ Layer 4: Runtime Changes]
+  end
+  L1 --> L2 --> L3 --> L4
+```
+
+**💡 Benefits:**
+* ✅ **Shared layers** — 10 containers can share base image
+* ✅ **Fast startup** — no copying, just add thin layer
+* ✅ **Efficient storage** — only differences stored
+
+---
+
+## 📍 Slide 15 – 🧩 How It All Fits Together
+
+```mermaid
+flowchart TD
+  subgraph Docker[🐳 Docker Engine]
+    CLI[🖥️ Docker CLI]
+    Daemon[⚙️ dockerd]
+    Containerd[📦 containerd]
+    Runc[🏃 runc]
+  end
+  subgraph Kernel[🐧 Linux Kernel]
+    NS[🔒 Namespaces]
+    CG[🎛️ cgroups]
+    UFS[📂 overlay2]
+  end
+  CLI --> Daemon --> Containerd --> Runc
+  Runc --> NS
+  Runc --> CG
+  Runc --> UFS
+```
+
+**🔧 The Stack:**
+* 🖥️ **Docker CLI** — user interface
+* ⚙️ **dockerd** — Docker daemon (API)
+* 📦 **containerd** — container lifecycle management
+* 🏃 **runc** — OCI runtime (creates containers)
+* 🐧 **Kernel** — namespaces + cgroups + filesystem
+
+---
+
+## 📍 Slide 16 – 💡 Section 2: Docker Fundamentals
+
+* 🐳 **Docker** = platform for building, shipping, running containers
+* 📦 **Image** = blueprint (read-only template)
+* 🏃 **Container** = running instance of an image
+* 📝 **Dockerfile** = recipe to build an image
+
+```mermaid
+flowchart LR
+  Dockerfile[📝 Dockerfile] -->|build| Image[📦 Image]
+  Image -->|run| Container[🏃 Container]
+  Image -->|push| Registry[🌐 Registry]
+  Registry -->|pull| Image2[📦 Image]
+```
+
+**📖 Definition:**
+> *A container is a standard unit of software that packages code and all its dependencies so the application runs quickly and reliably across environments.*
+
+---
+
+## 📍 Slide 17 – 🏗️ Docker Architecture
+
+* 🖥️ **Docker Client** = CLI commands (`docker build`, `docker run`)
+* ⚙️ **Docker Daemon** = background service managing containers
+* 📦 **Images** = layered filesystem snapshots
+* 🌐 **Registry** = image storage (Docker Hub, ECR, GCR)
+
+```mermaid
+flowchart LR
+  CLI[🖥️ Docker CLI] -->|API| Daemon[⚙️ Docker Daemon]
+  Daemon --> Images[📦 Images]
+  Daemon --> Containers[🏃 Containers]
+  Daemon <-->|push/pull| Registry[🌐 Registry]
+```
+
+**🔧 Key Commands:**
+* 🔨 `docker build` — create image from Dockerfile
+* 🏃 `docker run` — start container from image
+* 📤 `docker push` — upload image to registry
+* 📥 `docker pull` — download image from registry
+
+---
+
+## 📍 Slide 18 – 📚 Image Layers
+
+* 🎂 **Images are layered** = each instruction creates a layer
+* 💾 **Layers are cached** = faster rebuilds
+* 🔄 **Layers are shared** = efficient storage
+* 📝 **Order matters** = for cache efficiency
+
+```mermaid
+flowchart TD
+  L1[🐧 Layer 1: Base OS - python:3.12-slim]
+  L2[📦 Layer 2: Install dependencies]
+  L3[📁 Layer 3: Copy application code]
+  L4[⚙️ Layer 4: Configure runtime]
+  L1 --> L2 --> L3 --> L4
+  L4 --> Image[📦 Final Image]
+```
+
+**💡 Key Insight:**
+* ✅ Change code → only Layers 3-4 rebuild
+* ❌ Change base → ALL layers rebuild
+
+---
+
+## 📍 Slide 19 – 📝 Dockerfile Basics
+
+```dockerfile
+# 🐍 Start from base image
+FROM python:3.12-slim
+
+# 📁 Set working directory
+WORKDIR /app
+
+# 📦 Copy and install dependencies FIRST (caching!)
+COPY requirements.txt .
+RUN pip install --no-cache-dir -r requirements.txt
+
+# 📁 Copy application code
+COPY . .
+
+# 🚀 Define startup command
+CMD ["python", "app.py"]
+```
+
+**📝 Key Instructions:**
+| Instruction | 🎯 Purpose |
+|-------------|-----------|
+| `FROM` | 🐧 Base image |
+| `WORKDIR` | 📁 Set directory |
+| `COPY` | 📄 Copy files |
+| `RUN` | ⚙️ Execute commands |
+| `CMD` | 🚀 Default command |
+| `EXPOSE` | 🔌 Document port |
+
+---
+
+## 📍 Slide 20 – ⚡ Before vs After Docker
+
+| 😰 Before Docker | 🐳 After Docker |
+|-----------------|-----------------|
+| 📋 Manual server setup | 📝 Dockerfile defines everything |
+| 🔧 "Install Python 3.11, then..." | 🐳 `FROM python:3.11` |
+| 😱 "Works on my machine" | ✅ Works everywhere |
+| 📅 Deploy monthly (scary) | 🚀 Deploy daily (confident) |
+| 🐛 "Which version is prod?" | 📦 Image tag = version |
+| 💀 Snowflake servers | 🐄 Immutable containers |
+
+> 🤔 Which column describes your current workflow?
+
+---
+
+## 📍 Slide 21 – 🎮 Section 3: Dockerfile Scenarios
+
+## 🕹️ Lab Preview: Containerize Your App
+
+* 🏢 **Scenario**: You have a Python Flask app from Lab 1
+* 🎯 **Goal**: Package it in a production-ready container
+* 📋 **Requirements**: Security, optimization, best practices
+
+**❓ What could go wrong?**
+
+> 💀 **A lot.** Let's see common mistakes and fixes.
+
+🎮 **Let's build it right.**
+
+---
+
+## 📍 Slide 22 – 💥 Scenario 1: Running as Root
+
+**😰 The Problem:**
+```dockerfile
+FROM python:3.12
+COPY . /app
+CMD ["python", "app.py"]
+# 💀 Running as root by default!
+```
+
+* 🔓 Container runs as **root** (UID 0)
+* 💥 If attacker escapes container → **root on host**
+* 🚨 Hardened Kubernetes clusters (`runAsNonRoot: true`, *Restricted* Pod Security Standard) reject root containers
+
+```mermaid
+flowchart LR
+  Attack[🔓 Container Escape] --> Root[👑 Root Access]
+  Root --> Host[💀 Host Compromised]
+```
+
+> ❓ **Why is this dangerous?**
+
+---
+
+## 📍 Slide 23 – ✅ Solution: Rootless Containers
+
+## 🛠️ Fix: Create Non-Root User
+
+```dockerfile
+FROM python:3.12-slim
+
+# 👤 Create non-root user
+RUN useradd --create-home --shell /bin/bash appuser
+
+WORKDIR /app
+COPY requirements.txt .
+RUN pip install --no-cache-dir -r requirements.txt
+COPY . .
+
+# 🔒 Switch to non-root user
+USER appuser
+
+CMD ["python", "app.py"]
+```
+
+**🎯 Result:** Container runs as `appuser`, not root
+
+**🔐 Security Benefits:**
+* ✅ Limited privileges inside container
+* ✅ Can't modify system files
+* ✅ Container escape = unprivileged user
+* ✅ Kubernetes-compatible
+
+---
+
+## 📍 Slide 24 – 🐌 Scenario 2: Slow Builds (Bad Layer Order)
+
+**😰 The Problem:**
+```dockerfile
+FROM python:3.12-slim
+WORKDIR /app
+
+# ❌ Copy EVERYTHING first
+COPY . .
+
+# 📦 Then install dependencies
+RUN pip install -r requirements.txt
+
+CMD ["python", "app.py"]
+```
+
+* 🔄 **Any code change** → reinstall ALL dependencies
+* ⏱️ Build time: **5 minutes** every time
+* 💸 Wasted CI/CD minutes
+
+```mermaid
+flowchart TD
+  Change[📝 Change 1 line of code] --> Copy[❌ COPY invalidated]
+  Copy --> Pip[❌ pip install runs again]
+  Pip --> Slow[🐌 5 min rebuild]
+```
+
+---
+
+## 📍 Slide 25 – ✅ Solution: Optimized Layer Order
+
+## 🛠️ Fix: Dependencies Before Code
+
+```dockerfile
+FROM python:3.12-slim
+WORKDIR /app
+
+# 📦 Copy ONLY requirements first
+COPY requirements.txt .
+
+# 📦 Install dependencies (cached if requirements unchanged)
+RUN pip install --no-cache-dir -r requirements.txt
+
+# 📁 THEN copy application code
+COPY . .
+
+CMD ["python", "app.py"]
+```
+
+**🎯 Result:** Change code → only last layer rebuilds
+
+```mermaid
+flowchart TD
+  Change[📝 Change code] --> Skip1[✅ FROM cached]
+  Skip1 --> Skip2[✅ requirements cached]
+  Skip2 --> Skip3[✅ pip install cached]
+  Skip3 --> Rebuild[🔨 Only COPY . . rebuilds]
+  Rebuild --> Fast[⚡ 10 sec rebuild]
+```
+
+**⚡ Build time: 5 min → 10 sec**
+
+---
+
+## 📍 Slide 26 – 📦 Scenario 3: Bloated Images
+
+**😰 The Problem:**
+```dockerfile
+FROM python:3.12
+# 💾 Full Python image = 1.0 GB!
+```
+
+* 💾 Image size: **1+ GB**
+* 🐌 Slow to pull/push
+* 💸 Storage costs
+* 🔓 Larger attack surface
+
+**📊 Python Image Sizes:**
+| Image | 💾 Size |
+|-------|--------|
+| `python:3.12` | 1.0 GB |
+| `python:3.12-slim` | 150 MB |
+| `python:3.12-alpine` | 50 MB |
+
+> 🤔 **Do you need the full image?**
+
+---
+
+## 📍 Slide 27 – ✅ Solution: Slim Base Images
+
+## 🛠️ Fix: Use Minimal Base Images
+
+```dockerfile
+# ✅ Use slim variant
+FROM python:3.12-slim
+
+# ✅ No cache for pip (smaller image)
+RUN pip install --no-cache-dir -r requirements.txt
+
+# ✅ Only copy what's needed
+COPY app.py .
+COPY templates/ templates/
+```
+
+**🎯 Result:** 1 GB → 150 MB (85% reduction!)
+
+**📦 Base Image Guide:**
+| Image Type | 🎯 Use Case | 💾 Size |
+|------------|------------|--------|
+| `python:3.12` | Need compilation tools | 1.0 GB |
+| `python:3.12-slim` | Most apps (recommended) | 150 MB |
+| `python:3.12-alpine` | Size-critical, simple apps | 50 MB |
+
+**⚠️ Alpine Warning:** Uses musl libc, may break some packages
+
+---
+
+## 📍 Slide 28 – 📁 Scenario 4: No .dockerignore
+
+**😰 The Problem:**
+```bash
+# Build context includes EVERYTHING
+Sending build context to Docker daemon  500MB
+```
+
+* 📁 `.git/` folder (100+ MB)
+* 📁 `node_modules/` or `venv/`
+* 📁 `__pycache__/` files
+* 📄 `.env` with secrets! 💀
+
+**💥 Consequences:**
+* 🐌 Slow builds
+* 💾 Bloated images
+* 🔓 Secrets leaked into image
+
+---
+
+## 📍 Slide 29 – ✅ Solution: .dockerignore
+
+## 🛠️ Fix: Exclude Unnecessary Files
+
+```dockerignore
+# 🐙 Version control
+.git
+.gitignore
+
+# 🐍 Python
+__pycache__
+*.pyc
+*.pyo
+venv/
+.venv/
+
+# 🔐 Secrets (NEVER include!)
+.env
+*.pem
+secrets/
+
+# 📝 Documentation
+*.md
+docs/
+
+# 🧪 Tests (if not needed in container)
+tests/
+```
+
+**🎯 Result:**
+* ⚡ Build context: 500 MB → 5 MB
+* 🔐 No secrets in image
+* 🚀 Faster builds
+
+---
+
+## 📍 Slide 30 – 📝 QUIZ — DEVOPS_L2_MID
+
+---
+
+## 📍 Slide 31 – 🚀 Section 4: Advanced Patterns
+
+## 🏗️ Multi-Stage Builds
+
+* 🎯 **Problem**: Build tools bloat final image
+* 💡 **Solution**: Separate build and runtime stages
+* 📦 **Result**: Tiny production images
+
+```mermaid
+flowchart LR
+  subgraph Stage1[🔨 Builder Stage]
+    SDK[📦 Full SDK]
+    Compile[⚙️ Compile]
+  end
+  subgraph Stage2[🚀 Runtime Stage]
+    Binary[📦 Binary Only]
+    Minimal[🐧 Minimal OS]
+  end
+  Stage1 -->|copy binary| Stage2
+```
+
+**📊 Size Impact:**
+* 🔨 Builder: 1+ GB (SDK, compilers)
+* 🚀 Runtime: 10-50 MB (binary only)
+
+---
+
+## 📍 Slide 32 – 📝 Multi-Stage Dockerfile
+
+```dockerfile
+# 🔨 Stage 1: Builder
+FROM golang:1.21 AS builder
+WORKDIR /app
+COPY go.mod go.sum ./
+RUN go mod download
+COPY . .
+RUN CGO_ENABLED=0 go build -o myapp
+
+# 🚀 Stage 2: Runtime
+FROM alpine:3.18
+RUN adduser -D appuser
+WORKDIR /app
+COPY --from=builder /app/myapp .
+USER appuser
+CMD ["./myapp"]
+```
+
+**🔍 Key Points:**
+* 🏷️ `AS builder` — name the stage
+* 📦 `COPY --from=builder` — copy from previous stage
+* 🗑️ Builder stage discarded in final image
+
+**📊 Result:** 1.2 GB → 15 MB
+
+---
+
+## 📍 Slide 33 – 🔐 Distroless Images
+
+## 🛡️ Ultimate Minimal Images
+
+* 🚫 **No shell** — can't exec into container
+* 🚫 **No package manager** — can't install malware
+* 🚫 **No unnecessary files** — minimal attack surface
+* ✅ **Only your app** — and runtime dependencies
+
+```dockerfile
+# 🔨 Build stage
+FROM golang:1.21 AS builder
+WORKDIR /app
+COPY . .
+RUN CGO_ENABLED=0 go build -o myapp
+
+# 🔐 Distroless runtime
+FROM gcr.io/distroless/static-debian12
+COPY --from=builder /app/myapp /
+CMD ["/myapp"]
+```
+
+**📊 Distroless Options:**
+| Image | 🎯 For | 💾 Size |
+|-------|-------|--------|
+| `distroless/static` | Go, Rust (static) | 2 MB |
+| `distroless/base` | C/C++ apps | 20 MB |
+| `distroless/python3` | Python apps | 50 MB |
+| `distroless/java` | Java apps | 190 MB |
+
+---
+
+## 📍 Slide 34 – 📊 Image Size Comparison
+
+## 📈 Same App, Different Images
+
+| 🏗️ Build Strategy | 💾 Image Size | 🔐 Security |
+|-------------------|--------------|-------------|
+| `FROM python:3.12` | 1.0 GB | 😰 Large attack surface |
+| `FROM python:3.12-slim` | 150 MB | 😊 Better |
+| Multi-stage + slim | 100 MB | 😄 Good |
+| Multi-stage + alpine | 50 MB | 😄 Good |
+| Multi-stage + distroless | 20 MB | 🔐 Excellent |
+| `FROM scratch` (Go) | 5 MB | 🔐 Maximum |
+
+```mermaid
+flowchart LR
+  Full[📦 1 GB] --> Slim[📦 150 MB]
+  Slim --> Multi[📦 50 MB]
+  Multi --> Distroless[📦 20 MB]
+  Distroless --> Scratch[📦 5 MB]
+```
+
+**🎯 Goal:** As small as possible while functional
+
+---
+
+## 📍 Slide 35 – 🌐 Docker Hub & Registries
+
+## 📦 Publishing Your Images
+
+```mermaid
+flowchart LR
+  Build[🔨 Build] --> Tag[🏷️ Tag]
+  Tag --> Push[📤 Push]
+  Push --> Registry[🌐 Docker Hub]
+  Registry --> Pull[📥 Pull]
+  Pull --> Run[🏃 Run]
+```
+
+**🔧 Workflow:**
+```bash
+# 🔨 Build image
+docker build -t myapp:1.0 .
+
+# 🏷️ Tag for registry
+docker tag myapp:1.0 username/myapp:1.0
+
+# 🔐 Login to Docker Hub
+docker login
+
+# 📤 Push to registry
+docker push username/myapp:1.0
+```
+
+**📦 Registries:**
+* 🐳 Docker Hub — public/private
+* ☁️ AWS ECR — AWS integrated
+* 🌐 GCP Artifact Registry (successor to GCR) — Google integrated
+* 🦊 GitLab Registry — GitLab integrated
+
+---
+
+## 📍 Slide 36 – 🏢 Section 5: Real World Usage
+
+## 📅 Docker in Production
+
+**🔨 Build Phase:**
+* 📝 Dockerfile in repo
+* 🤖 CI builds image on every commit
+* 🏷️ Tag with git SHA or semantic version
+* 📤 Push to registry
+
+**🚀 Deploy Phase:**
+* 📥 Pull image to servers
+* 🏃 Run containers
+* 📊 Monitor health
+* 🔄 Rolling updates
+
+```mermaid
+flowchart LR
+  Code[📝 Code] --> CI[🤖 CI Build]
+  CI --> Registry[🌐 Registry]
+  Registry --> K8s[☸️ Kubernetes]
+  K8s --> Prod[🌐 Production]
+```
+
+---
+
+## 📍 Slide 37 – 🏷️ Tagging Strategies
+
+| 🏷️ Strategy | 📝 Example | 🎯 Use Case |
+|-------------|-----------|-------------|
+| **Semantic** | `myapp:1.2.3` | Releases |
+| **Git SHA** | `myapp:a1b2c3d` | Traceability |
+| **Branch** | `myapp:develop` | Dev environments |
+| **Latest** | `myapp:latest` | ⚠️ Avoid in prod! |
+| **Date** | `myapp:2024-01-15` | Daily builds |
+
+**⚠️ Never use `latest` in production:**
+* 🤷 Which version is "latest"?
+* 🔄 Changes without notice
+* 🐛 Can't rollback reliably
+
+**✅ Best Practice:**
+```bash
+# 🏷️ Immutable tags
+docker tag myapp:1.0.0 registry/myapp:1.0.0
+docker tag myapp:1.0.0 registry/myapp:sha-a1b2c3d
+```
+
+---
+
+## 📍 Slide 38 – 🔐 Security Best Practices
+
+```mermaid
+flowchart TD
+  Scan[🔍 Scan Images] --> Base[📦 Minimal Base]
+  Base --> User[👤 Non-root User]
+  User --> Secrets[🔐 No Secrets in Image]
+  Secrets --> Update[🔄 Update Regularly]
+  Update --> Sign[✍️ Sign Images]
+```
+
+**🔐 Security Checklist:**
+* ✅ Run as non-root user (`USER appuser`)
+* ✅ Use minimal base images (slim, distroless)
+* ✅ Scan for vulnerabilities (Trivy, Snyk)
+* ✅ Never store secrets in images
+* ✅ Pin base image versions
+* ✅ Update base images regularly
+
+**🛠️ Scanning Tools:**
+* 🔍 **Trivy** — open source, fast
+* 🔍 **Snyk** — developer-friendly
+* 🔍 **Docker Scout** — built into Docker
+
+---
+
+## 📍 Slide 39 – 📈 Career Skills
+
+```mermaid
+flowchart LR
+  Docker[🐳 Docker Basics] --> Compose[📦 Docker Compose]
+  Compose --> K8s[☸️ Kubernetes]
+  K8s --> GitOps[🔄 GitOps]
+  GitOps --> Platform[🏗️ Platform Engineering]
+```
+
+**🛠️ Docker Skills Progression:**
+* 🐳 **Level 1**: Write Dockerfiles, build/run containers
+* 📦 **Level 2**: Multi-stage builds, optimization
+* 🔐 **Level 3**: Security hardening, distroless
+* 📊 **Level 4**: Registry management, scanning
+* ☸️ **Level 5**: Container orchestration (K8s)
+
+**📊 Job Market (2024):**
+* 🐳 Docker required in **80%** of DevOps jobs
+* ☸️ Kubernetes in **65%** of container jobs
+* 💰 Container skills = **+15-20%** salary
+
+---
+
+## 📍 Slide 40 – 🌍 Real Company Examples
+
+**🎬 Netflix:**
+* 🐳 Millions of containers daily
+* 📦 Custom base images (hardened)
+* 🔄 Immutable deployments
+
+**🛒 Shopify:**
+* 🐳 Containerized entire platform
+* ⚡ Deploy 80x/day
+* 📦 Standardized Dockerfiles
+
+**🚗 Uber:**
+* 🐳 4,000+ microservices in containers
+* 🔐 Strict security policies
+* 📊 Custom image scanning
+
+**📊 Common Patterns:**
+* ✅ Standardized base images
+* ✅ Automated security scanning
+* ✅ Multi-stage builds everywhere
+* ✅ No root containers
+
+---
+
+## 📍 Slide 41 – 🎯 Section 6: Reflection
+
+## 📝 Key Takeaways
+
+1. 🐳 **Containers = lightweight, portable app packaging**
+2. 📝 **Dockerfile order matters** — dependencies before code
+3. 👤 **Always run as non-root** — security first
+4. 🏗️ **Multi-stage builds** — separate build from runtime
+5. 📦 **Smaller is better** — less attack surface, faster deploys
+
+> 💡 A good Dockerfile is secure, optimized, and maintainable.
+
+---
+
+## 📍 Slide 42 – 🧠 The Mindset Shift
+
+| 😰 Old Mindset | 🐳 Container Mindset |
+|---------------|---------------------|
+| 🖥️ "Configure servers manually" | 📝 "Define in Dockerfile" |
+| 🔧 "Install dependencies on host" | 📦 "Bundle in container" |
+| 👑 "Run as root, it's easier" | 👤 "Run as non-root always" |
+| 💾 "Bigger image = more features" | ⚡ "Smaller = faster & safer" |
+| 🏷️ "Just use :latest" | 🔖 "Pin versions always" |
+
+> ❓ Which mindset will you adopt?
+
+---
+
+## 📍 Slide 43 – ✅ Your Progress
+
+## 🎓 What You Now Understand
+
+* ✅ Why containers beat VMs for app deployment
+* ✅ Docker architecture: images, containers, registries
+* ✅ How to write optimized Dockerfiles
+* ✅ Security: rootless containers, minimal images
+* ✅ Multi-stage builds for smaller images
+* ✅ Docker Hub publishing workflow
+
+> 🚀 **You're ready for Lab 2!**
+
+---
+
+## 📍 Slide 44 – 📝 QUIZ — DEVOPS_L2_POST
+
+---
+
+## 📍 Slide 45 – 🚀 What Comes Next
+
+## 📚 Lab 2: Containerize Your App
+
+* 🐳 Write Dockerfile for your Python app
+* 👤 Implement non-root user
+* 📦 Optimize with layer ordering
+* 🌐 Push to Docker Hub
+* 🏆 Bonus: Multi-stage build for Go app
+
+**🔮 Future Lectures:**
+* 📦 **Lecture 3**: CI/CD with GitHub Actions
+* ☸️ **Lecture 9**: Kubernetes deployment
+* 🔄 **Lecture 13**: GitOps with ArgoCD
+
+```mermaid
+flowchart LR
+  You[👤 You] --> Docker[🐳 Docker Skills]
+  Docker --> K8s[☸️ Kubernetes]
+  K8s --> GitOps[🔄 GitOps]
+  GitOps --> Career[🚀 DevOps Career]
+```
+
+**👋 See you in the lab!**
+
+---
+
+## 📚 Resources & Further Reading
+
+**📕 Books:**
+* 📖 *Docker Deep Dive* — Nigel Poulton
+* 📖 *Container Security* — Liz Rice
+* 📖 *Docker in Action* — Jeff Nickoloff
+
+**🔗 Links:**
+* 🌐 [Dockerfile Best Practices](https://docs.docker.com/develop/develop-images/dockerfile_best-practices/)
+* 🌐 [Distroless Images](https://github.com/GoogleContainerTools/distroless)
+* 🌐 [Docker Security](https://docs.docker.com/engine/security/)
+* 🌐 [Multi-Stage Builds](https://docs.docker.com/build/building/multi-stage/)
+
+**🛠️ Tools:**
+* 🔍 [Hadolint](https://github.com/hadolint/hadolint) — Dockerfile linter
+* 🔍 [Dive](https://github.com/wagoodman/dive) — Explore image layers
+* 🔍 [Trivy](https://github.com/aquasecurity/trivy) — Security scanner
+
+---
diff --git a/lectures/lec3.md b/lectures/lec3.md
new file mode 100644
index 0000000000..9afebb8b15
--- /dev/null
+++ b/lectures/lec3.md
@@ -0,0 +1,978 @@
+# 📌 Lecture 3 — Continuous Integration: Automate Testing & Build Confidence
+
+## 📍 Slide 1 – 🤖 Welcome to CI/CD
+
+* 🐛 **Manual testing** = slow, error-prone, doesn't scale
+* 🤖 **Continuous Integration** = automate testing, building, and validation
+* ✅ **Goal**: Catch bugs before they reach production
+* 🚀 This lecture: Build your first CI/CD pipeline with GitHub Actions
+
+```mermaid
+flowchart LR
+  Manual[😰 Manual Testing] -->|CI/CD| Auto[🤖 Automated Pipeline]
+  Auto --> Confidence[💪 Deploy with Confidence]
+```
+
+---
+
+## 📍 Slide 2 – 🎯 Learning Outcomes
+
+* ✅ Understand CI/CD principles and benefits
+* ✅ Write effective unit tests
+* ✅ Build GitHub Actions workflows
+* ✅ Implement security scanning with Snyk
+* ✅ Apply CI/CD best practices (caching, versioning)
+
+**🎓 By the end of this lecture:**
+
+| # | 🎯 Outcome |
+|---|-----------|
+| 1 | 🧠 Explain CI/CD and why it matters |
+| 2 | 🧪 Write meaningful unit tests |
+| 3 | ⚙️ Create GitHub Actions workflows |
+| 4 | 🔐 Integrate security scanning |
+| 5 | 📦 Automate Docker builds & publishing |
+
+---
+
+## 📍 Slide 3 – 📋 Lecture Overview
+
+* 📚 **CI/CD fundamentals** — what, why, how
+* 🧪 **Testing strategies** — unit, integration, coverage
+* ⚙️ **GitHub Actions** — YAML workflows, actions marketplace
+* 🔐 **Security** — Snyk vulnerability scanning
+* 🚀 **Automation** — Docker builds, versioning, caching
+
+**⏱️ Lecture Structure:**
+```
+Section 0: Introduction           → 📝 PRE Quiz
+Section 1: The Testing Problem
+Section 2: CI/CD Fundamentals
+Section 3: GitHub Actions Hands-on → 📝 MID Quiz
+Section 4: Advanced CI Patterns
+Section 5: Production Practices
+Section 6: Reflection             → 📝 POST Quiz
+```
+
+---
+
+## 📍 Slide 4 – ❓ The Big Question
+
+* 📊 **85%** of software bugs are found in production (2024)
+* ⏱️ Average cost to fix a production bug: **100x** more than fixing it during development
+* 🚀 Teams with good CI deploy **46x** more frequently
+
+> 💬 *"If it hurts, do it more often"* — Continuous Delivery principle
+
+**🤔 Think about it:**
+* How do you know your code works before deploying?
+* What happens when someone breaks the main branch?
+* How many bugs could be caught automatically?
+
+---
+
+## 📍 Slide 5 – 📝 QUIZ — DEVOPS_L3_PRE
+
+---
+
+## 📍 Slide 6 – 🔥 Section 1: The Testing Problem
+
+* 👨‍💻 **Developer**: "It works on my machine!"
+* 🐛 **Production**: 500 errors, users complaining
+* 😰 **The gap**: No automated testing or validation
+* 💥 **Result**: Bugs slip through, confidence is low
+
+```mermaid
+flowchart LR
+  Dev[👨‍💻 Dev: Works!] -->|No Tests| Prod[🌐 Production]
+  Prod --> Bug[🐛 Bug Found]
+  Bug --> Fire[🔥 Firefighting]
+```
+
+---
+
+## 📍 Slide 7 – 🧪 Manual Testing Hell
+
+* 📋 **Manual checklist**: 50 steps to test before deploy
+* ⏱️ **Time**: 2 hours per test cycle
+* 😴 **Human error**: Forgot to test one endpoint
+* 🔄 **Frequency**: Only before big releases (too painful)
+
+```mermaid
+flowchart TD
+  Code[📝 Write Code] --> Manual[📋 Manual Testing]
+  Manual --> Bug[🐛 Found Bug]
+  Bug --> Fix[🔧 Fix Code]
+  Fix --> Manual
+  Manual --> Deploy[😮‍💨 Finally Deploy]
+```
+
+**😰 Problems:**
+* 🐌 Slow feedback loop
+* 🎰 Testing is inconsistent
+* 🧠 Requires a human to remember all steps
+* 💀 Nobody wants to test
+
+---
+
+## 📍 Slide 8 – 💥 The Integration Problem
+
+* 👥 **Multiple developers** pushing to main branch
+* 🔀 **Merge conflicts** caught too late
+* 💥 **Breaking changes** not detected
+* 🤷 **"Who broke the build?"** — the blame game
+
+```mermaid
+flowchart LR
+  Dev1[👨‍💻 Dev 1] -->|Push| Main[🌳 Main Branch]
+  Dev2[👩‍💻 Dev 2] -->|Push| Main
+  Dev3[👨‍💻 Dev 3] -->|Push| Main
+  Main --> Break[💥 Build Broken]
+```
+
+> 🤔 **Think:** How do we prevent this?
+
+---
+
+## 📍 Slide 9 – 🔐 The Security Gap
+
+* 📦 **Dependencies** with known vulnerabilities
+* 🔓 **Secrets** accidentally committed
+* 🚨 **CVEs** discovered after deployment
+* 🤷 **Nobody checked** before merging
+
+**📊 Real Stats:**
+* 🔍 **84%** of codebases have vulnerable dependencies
+* ⏱️ Average time to detect vulnerability: **54 days**
+* 💰 Average breach cost: **$4.45 million**
+
+---
+
+## 📍 Slide 10 – 💸 The Cost of No CI
+
+| 🔥 Problem | 💥 Impact |
+|------------|-----------|
+| 🐛 Bugs in production | Customer churn, reputation damage |
+| ⏱️ Slow feedback | Wasted development time |
+| 😰 Fear of deployment | Infrequent releases |
+| 🔒 Security vulnerabilities | Data breaches, compliance issues |
+
+**📈 Real Numbers:**
+* 🐛 Prod bug fix cost: **$10,000 - $100,000**
+* 🕒 Time to detect + fix: **4-8 hours**
+* 🏢 Without CI: Deploy **monthly**
+* 🚀 With CI: Deploy **daily**
+
+---
+
+## 📍 Slide 11 – 💡 Section 2: CI/CD Fundamentals
+
+* 🤖 **Continuous Integration (CI)** = automatically test every change
+* 🚀 **Continuous Delivery (CD)** = always ready to deploy
+* 📦 **Continuous Deployment** = automatically deploy to production
+* 🎯 **Goal**: Fast, reliable, automated software delivery
+
+```mermaid
+flowchart LR
+  CI[🤖 CI: Test] --> CD[📦 CD: Package]
+  CD --> Deploy[🚀 Deploy]
+```
+
+**📖 Definitions:**
+> *CI: Developers integrate code into a shared repository frequently. Each integration is verified by an automated build and tests.*<br/>
+> *CD: Software can be released to production at any time.*
+
+---
+
+## 📍 Slide 12 – 🔄 The CI/CD Pipeline
+
+```mermaid
+flowchart LR
+  Commit[📝 Commit] --> Trigger[⚡ Trigger CI]
+  Trigger --> Checkout[📥 Checkout Code]
+  Checkout --> Build[🔨 Build]
+  Build --> Test[🧪 Test]
+  Test --> Lint[🔍 Lint]
+  Lint --> Scan[🔐 Security Scan]
+  Scan --> Package[📦 Package]
+  Package --> Publish[🚀 Publish]
+```
+
+**🔧 Stages:**
+1. 📝 **Commit** — Developer pushes code
+2. ⚡ **Trigger** — CI system detects change
+3. 🔨 **Build** — Compile/prepare code
+4. 🧪 **Test** — Run automated tests
+5. 🔍 **Lint** — Check code quality
+6. 🔐 **Scan** — Security vulnerabilities
+7. 📦 **Package** — Build artifacts (Docker image)
+8. 🚀 **Publish** — Push to registry
+
+---
+
+## 📍 Slide 13 – ✅ CI/CD Benefits
+
+| 🎯 Benefit | 📊 Impact |
+|-----------|----------|
+| ⚡ **Fast Feedback** | Know in 5 min if code works |
+| 🐛 **Early Bug Detection** | Catch before production |
+| 🔒 **Security** | Automated vulnerability scanning |
+| 📦 **Consistent Builds** | Same process every time |
+| 💪 **Confidence** | Deploy without fear |
+| 🚀 **Faster Releases** | Deploy multiple times per day |
+
+**📈 DORA Metrics (Elite Performers):**
+* 📦 Deploy frequency: **Multiple times/day**
+* ⏱️ Lead time: **< 1 hour**
+* 🔧 MTTR: **< 1 hour**
+* ❌ Change failure rate: **< 15%**
+
+---
+
+## 📍 Slide 14 – 🧪 Testing Pyramid
+
+```mermaid
+flowchart TD
+  subgraph Pyramid[🔺 Testing Pyramid]
+    E2E[🌐 E2E Tests<br/>Few, Slow, Expensive]
+    INT[🔗 Integration Tests<br/>Some, Moderate]
+    UNIT[🧪 Unit Tests<br/>Many, Fast, Cheap]
+  end
+  E2E --> INT --> UNIT
+```
+
+**🎯 Test Types:**
+* 🧪 **Unit Tests** (80%) — Test individual functions
+* 🔗 **Integration Tests** (15%) — Test components together
+* 🌐 **End-to-End Tests** (5%) — Test full user flows
+
+**💡 Why the pyramid?**
+* ✅ Unit tests: Fast (ms), cheap, catch most bugs
+* ✅ Integration: Slower (seconds), catch interface bugs
+* ⚠️ E2E: Slowest (minutes), brittle, expensive
+
+---
+
+## 📍 Slide 15 – ⚡ Before vs After CI/CD
+
+| 😰 Before CI/CD | 🚀 After CI/CD |
+|-----------------|----------------|
+| 📋 Manual testing checklist | 🤖 Automated test suite |
+| 🎰 "Fingers crossed" deploys | ✅ Confident deployments |
+| 🐛 Bugs found in production | 🧪 Bugs caught in CI |
+| ⏱️ 2 hour test cycle | ⚡ 5 minute feedback |
+| 😱 Deploy monthly | 🚀 Deploy daily |
+| 🤷 "Who broke it?" | 📊 Git bisect + logs |
+
+> 🤔 Which column is your current process?
+
+---
+
+## 📍 Slide 16 – 🎮 Section 3: GitHub Actions Hands-On
+
+## 🕹️ Lab Preview: Build Your CI Pipeline
+
+* 🏢 **Scenario**: You have a Python Flask app
+* 🎯 **Goal**: Automate testing and Docker builds
+* 📋 **Requirements**: Tests, lint, security scan, publish
+
+**❓ How do we automate all this?**
+
+> 🤖 **GitHub Actions** to the rescue!
+
+🎮 **Let's build it step by step.**
+
+---
+
+## 📍 Slide 17 – 💥 Scenario 1: No Tests
+
+**😰 The Problem:**
+```python
+# app.py
+@app.route('/')
+def home():
+    return {"message": "Hello", "hostname": os.getenv("HOSTNAME")}
+
+# 🚫 No tests!
+```
+
+* 📝 Code looks fine
+* 💥 Deploy → crashes because `HOSTNAME` is None
+* 🐛 Users see 500 errors
+* 😱 Rollback emergency
+
+> ❓ **How do we catch this before deploy?**
+
+---
+
+## 📍 Slide 18 – ✅ Solution: Unit Testing
+
+## 🛠️ Fix: Write Tests First
+
+```python
+# tests/test_app.py
+import pytest
+from app import app
+
+def test_home_endpoint():
+    """Test that home returns expected structure"""
+    client = app.test_client()
+    response = client.get('/')
+
+    assert response.status_code == 200
+    data = response.get_json()
+    assert "message" in data
+    assert "hostname" in data
+    assert isinstance(data["message"], str)
+
+def test_health_endpoint():
+    """Test health check"""
+    client = app.test_client()
+    response = client.get('/health')
+
+    assert response.status_code == 200
+    assert response.get_json()["status"] == "healthy"
+```
+
+**🎯 Result:** Tests catch the bug before deploy!
+
+---
+
+## 📍 Slide 19 – 🧪 Testing Frameworks
+
+## Python Testing Options
+
+| Framework | 🎯 Pros | ⚠️ Cons |
+|-----------|--------|--------|
+| **pytest** | Simple, powerful, fixtures | Extra dependency |
+| **unittest** | Built-in, no dependencies | Verbose, old-style |
+
+```bash
+# 🧪 pytest (recommended)
+pip install pytest
+pytest tests/
+
+# 🧪 unittest (built-in)
+python -m unittest discover tests/
+```
+
+**💡 Why pytest?**
+* ✅ Simple syntax (`assert` instead of `self.assertEqual`)
+* ✅ Powerful fixtures (setup/teardown)
+* ✅ Great plugins (coverage, parallel, etc.)
+* ✅ Industry standard
+
+---
+
+## 📍 Slide 20 – 📝 Scenario 2: Manual Docker Builds
+
+**😰 The Problem:**
+```bash
+# 🐌 Manual process every time
+docker build -t myapp:latest .
+docker tag myapp:latest username/myapp:v1.2.3
+docker login
+docker push username/myapp:v1.2.3
+docker push username/myapp:latest
+
+# 😱 Forgot to update version tag!
+# 💀 Built from wrong branch!
+```
+
+* ⏱️ Takes 10 minutes
+* 🎰 Inconsistent (human error)
+* 📋 No validation before build
+* 🤷 Can't track what version is deployed
+
+---
+
+## 📍 Slide 21 – ✅ Solution: GitHub Actions CI/CD
+
+## 🛠️ Fix: Automate Everything
+
+```yaml
+# .github/workflows/python-ci.yml
+name: Python CI
+
+on:
+  push:
+    branches: [ main ]
+  pull_request:
+
+jobs:
+  test:
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v4
+
+      - uses: actions/setup-python@v5
+        with:
+          python-version: '3.12'
+
+      - name: Install dependencies
+        run: |
+          pip install -r requirements.txt
+          pip install pytest flake8
+
+      - name: Lint
+        run: flake8 app.py
+
+      - name: Test
+        run: pytest tests/
+```
+
+**🎯 Result:** Every commit automatically tested!
+
+---
+
+## 📍 Slide 22 – 🐳 Docker Build Automation
+
+```yaml
+  docker:
+    needs: test  # ✅ Only run if tests pass
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v4
+
+      - name: Login to Docker Hub
+        uses: docker/login-action@v3
+        with:
+          username: ${{ secrets.DOCKER_USERNAME }}
+          password: ${{ secrets.DOCKER_TOKEN }}
+
+      - name: Build and push
+        uses: docker/build-push-action@v5
+        with:
+          context: ./app_python
+          push: true
+          tags: |
+            ${{ secrets.DOCKER_USERNAME }}/myapp:latest
+            ${{ secrets.DOCKER_USERNAME }}/myapp:${{ github.sha }}
+```
+
+**🔐 Security Note:** Never hardcode credentials!
+
+---
+
+## 📍 Slide 23 – 🔓 Scenario 3: Vulnerable Dependencies
+
+**😰 The Problem:**
+```bash
+# requirements.txt
+flask==2.0.1  # 💀 Known CVE-2023-30861
+requests==2.25.0  # 🔓 Security vulnerability
+
+# 🤷 Nobody checked before deploying
+```
+
+* 🔍 **84%** of apps have vulnerable dependencies
+* ⏱️ Takes **weeks** to discover
+* 💀 Already in production when found
+
+**📊 Real Example:**
+* 📦 Log4Shell (CVE-2021-44228, 2021) — **35,000+** Java packages affected
+* 💰 Cost to remediate: **Billions of dollars**
+
+---
+
+## 📍 Slide 24 – ✅ Solution: Snyk Security Scanning
+
+## 🛠️ Fix: Automated Vulnerability Scanning
+
+```yaml
+  security:
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v4
+
+      - name: Run Snyk
+        uses: snyk/actions/python-3.10@master
+        env:
+          SNYK_TOKEN: ${{ secrets.SNYK_TOKEN }}
+        with:
+          args: --severity-threshold=high
+```
+
+**🎯 What Snyk Does:**
+* 🔍 Scans dependencies for known CVEs
+* 📊 Reports severity (low/medium/high/critical)
+* 🔧 Suggests fixes
+* ❌ Fails build if high or critical vulnerabilities are found (`--severity-threshold=high`)
+
+**🔐 Result:** Catch vulnerabilities before production!
+
+---
+
+## 📍 Slide 25 – 🐌 Scenario 4: Slow CI Builds
+
+**😰 The Problem:**
+```
+[Run 1] Installing dependencies... 2 minutes
+[Run 2] Installing dependencies... 2 minutes
+[Run 3] Installing dependencies... 2 minutes
+# 💸 Wasting 6 minutes downloading same packages!
+```
+
+* ⏱️ Each run: **5-10 minutes**
+* 🔄 Re-downloading same dependencies
+* 💰 Wasting CI minutes (costs money!)
+* 😴 Slow feedback loop
+
+---
+
+## 📍 Slide 26 – ✅ Solution: Dependency Caching
+
+## 🛠️ Fix: Cache Dependencies
+
+```yaml
+- uses: actions/setup-python@v5
+  with:
+    python-version: '3.12'
+    cache: 'pip'  # ✅ Enable caching
+    cache-dependency-path: 'requirements.txt'
+
+# Alternative with explicit cache
+- uses: actions/cache@v4
+  with:
+    path: ~/.cache/pip
+    key: ${{ runner.os }}-pip-${{ hashFiles('requirements.txt') }}
+```
+
+**📊 Performance Impact:**
+* ⏱️ **Before caching**: 5 minutes
+* ⚡ **After caching**: 30 seconds
+* 🚀 **10x faster!**
+
+**💡 Cache Key Strategy:**
+* 🔑 Key includes `requirements.txt` hash
+* 🔄 Cache invalidates when dependencies change
+* ✅ Fresh install when needed, cached otherwise
+
+---
+
+## 📍 Slide 27 – 📝 QUIZ — DEVOPS_L3_MID
+
+---
+
+## 📍 Slide 28 – 🏷️ Section 4: Versioning Strategies
+
+## 📦 How to Version Your Images?
+
+**Two main approaches:**
+
+**🔢 Semantic Versioning (SemVer):**
+* Format: `MAJOR.MINOR.PATCH` (e.g., `1.2.3`)
+* 🎯 Use when: Breaking changes matter
+* 📚 Example: Libraries, APIs
+
+**📅 Calendar Versioning (CalVer):**
+* Format: `YYYY.MM.DD` (e.g., `2024.01.15`)
+* 🎯 Use when: Continuous deployment
+* 🚀 Example: Web services, SaaS
+
+```mermaid
+flowchart LR
+  Code[📝 Code] --> SemVer[🔢 v1.2.3]
+  Code --> CalVer[📅 2024.01]
+  SemVer --> Lib[📚 Library]
+  CalVer --> Service[🌐 Service]
+```
+
+---
+
+## 📍 Slide 29 – 🔢 Semantic Versioning (SemVer)
+
+## v MAJOR.MINOR.PATCH
+
+| Version | 🎯 When to Bump |
+|---------|----------------|
+| **MAJOR** (v2.0.0) | Breaking changes (API changed) |
+| **MINOR** (v1.1.0) | New features (backward-compatible) |
+| **PATCH** (v1.0.1) | Bug fixes (backward-compatible) |
+
+```yaml
+# 🏷️ Multiple tags per release
+tags: |
+  username/app:1.2.3
+  username/app:1.2
+  username/app:1
+  username/app:latest
+```
+
+**✅ Pros:**
+* 📖 Clear breaking change signals
+* 🎯 Industry standard for libraries
+* 🔄 Users can pin to major version
+
+**⚠️ Cons:**
+* 🤔 Requires discipline
+* 📋 Need to track what's breaking vs feature
+
+---
+
+## 📍 Slide 30 – 📅 Calendar Versioning (CalVer)
+
+## YYYY.MM.DD or YYYY.MM
+
+| Format | 📝 Example | 🎯 Use Case |
+|--------|-----------|-------------|
+| `YYYY.MM.DD` | `2024.01.15` | Daily releases |
+| `YYYY.MM.MICRO` | `2024.01.3` | Monthly + patch |
+| `YYYY.0M` | `2024.01` | Monthly releases |
+
+```yaml
+# 📅 Generate version from date
+- name: Generate version
+  run: echo "VERSION=$(date +%Y.%m.%d)" >> $GITHUB_ENV
+
+tags: |
+  username/app:2024.01.15
+  username/app:2024.01
+  username/app:latest
+```
+
+**✅ Pros:**
+* 📆 No ambiguity (date is date)
+* 🚀 Perfect for continuous deployment
+* 🧠 Easy to remember
+
+**⚠️ Cons:**
+* 🤷 Doesn't indicate breaking changes
+
+---
+
+## 📍 Slide 31 – 🔀 Matrix Builds
+
+## Test Multiple Versions
+
+```yaml
+jobs:
+  test:
+    runs-on: ubuntu-latest
+    strategy:
+      matrix:
+        python-version: ['3.11', '3.12', '3.13']
+
+    steps:
+      - uses: actions/setup-python@v5
+        with:
+          python-version: ${{ matrix.python-version }}
+
+      - run: pytest tests/
+```
+
+**🎯 What This Does:**
+* 🔄 Runs tests **3 times** (one per Python version)
+* ⚡ Runs in **parallel**
+* ✅ Ensures compatibility across versions
+
+```mermaid
+flowchart LR
+  Test[🧪 Tests] --> Py311[🐍 Python 3.11]
+  Test --> Py312[🐍 Python 3.12]
+  Test --> Py313[🐍 Python 3.13]
+```
+
+---
+
+## 📍 Slide 32 – 📂 Path Filters (Monorepo)
+
+## Only Run CI for Changed Apps
+
+```yaml
+# python-ci.yml (its own workflow file): only runs when Python code changes
+on:
+  push:
+    paths:
+      - 'app_python/**'
+      - '.github/workflows/python-ci.yml'
+
+# go-ci.yml (a separate workflow file): only runs when Go code changes
+on:
+  push:
+    paths:
+      - 'app_go/**'
+      - '.github/workflows/go-ci.yml'
+```
+
+**🎯 Benefits:**
+* ⚡ Faster CI (don't run unnecessary builds)
+* 💰 Save CI minutes
+* 🔕 Less noise (only relevant notifications)
+
+**📊 Impact:**
+* 🐌 Without filters: Every commit runs **all** CI
+* 🚀 With filters: Only **affected** apps run
+
+---
+
+## 📍 Slide 33 – 📊 Test Coverage
+
+## Measure What's Tested
+
+```yaml
+- name: Run tests with coverage
+  run: |
+    pip install pytest-cov
+    pytest --cov=app_python --cov-report=xml --cov-report=term
+
+- name: Upload to Codecov
+  uses: codecov/codecov-action@v4
+  with:
+    file: ./coverage.xml
+```
+
+**📊 Coverage Badge:**
+```markdown
+![Coverage](https://codecov.io/gh/user/repo/branch/main/graph/badge.svg)
+```
+
+**🎯 What's Good Coverage?**
+* 🥉 **60-70%** — Okay, could be better
+* 🥈 **70-85%** — Good, most code tested
+* 🥇 **85-95%** — Excellent coverage
+* ⚠️ **100%** — Usually overkill (diminishing returns)
+
+---
+
+## 📍 Slide 34 – ✅ CI Best Practices
+
+| 🎯 Practice | 💡 Why It Matters |
+|------------|------------------|
+| ⚡ **Fail Fast** | Stop on first failure, save time |
+| 🔗 **Job Dependencies** | Don't push if tests fail |
+| 🔒 **Secrets in Vault** | Never hardcode credentials |
+| 📦 **Cache Dependencies** | 10x faster builds |
+| 🔍 **Security Scanning** | Catch CVEs early |
+| 📊 **Status Badges** | Visibility into health |
+| 🎯 **Branch Protection** | Require CI before merge |
+| ♻️ **Concurrency Control** | Cancel outdated runs |
+
+**🔐 Security:**
+* ✅ Use `secrets.*` for sensitive data
+* ✅ Minimum permissions (`permissions:`)
+* ✅ Pin action versions (`actions/checkout@v4`)
+
+---
+
+## 📍 Slide 35 – 🌐 GitHub Actions Marketplace
+
+## Reusable Actions
+
+```mermaid
+flowchart LR
+  Marketplace[🏪 Actions Marketplace] --> Setup[⚙️ Setup Actions]
+  Marketplace --> Build[🔨 Build Actions]
+  Marketplace --> Deploy[🚀 Deploy Actions]
+  Marketplace --> Security[🔐 Security Actions]
+```
+
+**🔥 Popular Actions:**
+* ⚙️ `actions/checkout@v4` — Clone repo
+* 🐍 `actions/setup-python@v5` — Setup Python
+* 🐳 `docker/build-push-action@v5` — Build Docker
+* 🔐 `snyk/actions/python@master` — Security scan
+* 📊 `codecov/codecov-action@v4` — Coverage
+
+**🔍 Find Actions:**
+* 🌐 [github.com/marketplace](https://github.com/marketplace?type=actions)
+* ⭐ Check stars/downloads
+* 📖 Read documentation
+* 🔒 Verify source/security
+
+---
+
+## 📍 Slide 36 – 🏢 Section 5: Production CI/CD
+
+## Real-World CI Workflows
+
+**🎬 Netflix:**
+* 🚀 **3000+** builds per day
+* 🔄 Full CI pipeline in **<10 minutes**
+* 🎯 A/B test deployments
+
+**🛒 Shopify:**
+* ⚡ Deploy **80+ times per day**
+* 🤖 Auto-rollback on failure
+* 📊 Real-time metrics in CI
+
+**🔍 Google:**
+* 🏗️ **Monorepo** with 2 billion LOC
+* 🧪 **100+ million tests** daily
+* 📦 Bazel build system
+
+---
+
+## 📍 Slide 37 – 🚦 Branch Protection Rules
+
+## Require CI Before Merge
+
+```mermaid
+flowchart LR
+  PR[📝 Pull Request] --> CI[🤖 CI Runs]
+  CI -->|✅ Pass| Merge[✅ Can Merge]
+  CI -->|❌ Fail| Block[🚫 Blocked]
+```
+
+**⚙️ GitHub Settings:**
+* ✅ Require status checks to pass
+* ✅ Require branches to be up to date
+* ✅ Require review from code owners
+* 🔒 Prevent direct push to main
+
+**🎯 Result:**
+* 🚫 No broken code in main branch
+* ✅ Every change is tested
+* 📊 Full history of CI results
+
+---
+
+## 📍 Slide 38 – 🔄 GitOps Preview
+
+## From CI to CD
+
+```mermaid
+flowchart LR
+  CI[🤖 CI: Test & Build] --> Push[📦 Push Image]
+  Push --> ArgoCD[🔄 ArgoCD Detects]
+  ArgoCD --> Deploy[🚀 Auto Deploy]
+  Deploy --> K8s[☸️ Kubernetes]
+```
+
+**🔮 Coming Up:**
+* 📦 **Lab 13**: ArgoCD deploys what CI builds
+* ☸️ **K8s**: Orchestrate containers
+* 🔄 **GitOps**: Git as source of truth
+* 🚀 **Full automation**: Commit → Production
+
+---
+
+## 📍 Slide 39 – 💡 CI/CD Anti-Patterns
+
+| ❌ Anti-Pattern | ✅ Better Approach |
+|----------------|-------------------|
+| 🎰 "It works on my machine" | 🧪 Automated tests catch issues |
+| 📋 Manual deployment checklist | 🤖 Automated pipeline |
+| 🤷 No tests, just deploy | 🧪 Comprehensive test suite |
+| 💀 Long-lived feature branches | 🔄 Trunk-based development |
+| 🐌 Slow CI (>30 min) | ⚡ Optimize, parallelize, cache |
+| 🔓 Secrets in code | 🔒 Environment variables |
+
+---
+
+## 📍 Slide 40 – 📈 CI Metrics to Track
+
+| 📊 Metric | 🎯 Target |
+|-----------|----------|
+| ⏱️ **Build Time** | < 10 minutes |
+| ✅ **Success Rate** | > 95% |
+| 🐛 **Bugs Caught in CI** | Maximize |
+| 📦 **Deploy Frequency** | Multiple/day |
+| 🔧 **Time to Fix Broken Build** | < 10 minutes |
+| 📊 **Test Coverage** | > 80% |
+
+```mermaid
+flowchart LR
+  Fast[⚡ Fast CI] --> Deploy[🚀 Deploy Often]
+  Deploy --> Confidence[💪 High Confidence]
+  Confidence --> Fast
+```
+
+---
+
+## 📍 Slide 41 – 🎯 Section 6: Reflection
+
+## 📝 Key Takeaways
+
+1. 🤖 **CI automates testing** — catch bugs before production
+2. 🧪 **Unit tests are essential** — fast feedback loop
+3. ⚙️ **GitHub Actions** — powerful, free CI/CD platform
+4. 🔐 **Security scanning** — integrate Snyk, scan dependencies
+5. 📦 **Versioning matters** — SemVer or CalVer, be consistent
+
+> 💡 CI isn't just about automation — it's about building confidence.
+
+---
+
+## 📍 Slide 42 – 🧠 The Mindset Shift
+
+| 😰 Old Mindset | 🚀 CI/CD Mindset |
+|---------------|------------------|
+| 📋 "Test before release" | 🧪 "Test every commit" |
+| 🤞 "Hope it works" | ✅ "Know it works" |
+| 🎰 Manual deployments | 🤖 Automated pipelines |
+| 😱 "Who broke it?" | 📊 "CI caught it" |
+| 🐌 Deploy monthly | 🚀 Deploy daily |
+| 🔍 Find bugs in prod | 🧪 Catch bugs in CI |
+
+> ❓ Which mindset will you adopt?
+
+---
+
+## 📍 Slide 43 – ✅ Your Progress
+
+## 🎓 What You Now Understand
+
+* ✅ Why CI/CD is critical for modern development
+* ✅ How to write effective unit tests
+* ✅ GitHub Actions workflow syntax
+* ✅ Security scanning with Snyk
+* ✅ Versioning strategies (SemVer vs CalVer)
+* ✅ CI best practices (caching, matrix builds, path filters)
+
+> 🚀 **You're ready for Lab 3!**
+
+---
+
+## 📍 Slide 44 – 📝 QUIZ — DEVOPS_L3_POST
+
+---
+
+## 📍 Slide 45 – 🚀 What Comes Next
+
+## 📚 Lab 3: Build Your CI Pipeline
+
+* 🧪 Write unit tests for your Flask app
+* ⚙️ Create GitHub Actions workflow
+* 🔐 Integrate Snyk security scanning
+* 📦 Automate Docker builds and versioning
+* ⚡ Apply caching and best practices
+* 🏆 Bonus: Multi-app CI with path filters
+
+**🔮 Future Lectures:**
+* 📦 **Lecture 7**: Monitoring & Observability
+* ☸️ **Lecture 9**: Kubernetes Deployment
+* 🔄 **Lecture 13**: GitOps with ArgoCD
+
+```mermaid
+flowchart LR
+  You[👤 You] --> Tests[🧪 Write Tests]
+  Tests --> CI[🤖 GitHub Actions]
+  CI --> Automation[⚡ Full Automation]
+  Automation --> Career[🚀 DevOps Skills]
+```
+
+**👋 See you in the lab!**
+
+---
+
+## 📚 Resources & Further Reading
+
+**📕 Books:**
+* 📖 *Continuous Delivery* — Jez Humble & David Farley
+* 📖 *The DevOps Handbook* — Gene Kim et al.
+* 📖 *Accelerate* — Nicole Forsgren, Jez Humble & Gene Kim
+
+**🔗 Links:**
+* 🌐 [GitHub Actions Docs](https://docs.github.com/en/actions)
+* 🌐 [Pytest Documentation](https://docs.pytest.org/)
+* 🌐 [Snyk Security](https://snyk.io/)
+* 🌐 [SemVer](https://semver.org/)
+* 🌐 [CalVer](https://calver.org/)
+
+**🛠️ Tools:**
+* 🔍 [act](https://github.com/nektos/act) — Run GitHub Actions locally
+* 🔍 [actionlint](https://github.com/rhysd/actionlint) — Lint workflows
+* 📊 [Codecov](https://codecov.io/) — Coverage tracking
+
+---
diff --git a/lectures/lec4.md b/lectures/lec4.md
new file mode 100644
index 0000000000..acfe810526
--- /dev/null
+++ b/lectures/lec4.md
@@ -0,0 +1,801 @@
+# 📌 Lecture 4 — Infrastructure as Code: From Snowflakes to Cattle
+
+## 📍 Slide 1 – 🚀 Welcome to Infrastructure as Code
+
+* 🌍 **Infrastructure used to be physical** — racks, cables, manual configuration
+* 😰 Manual setup leads to inconsistency, drift, and undocumented "snowflakes"
+* 🏗️ **Infrastructure as Code (IaC)** treats infrastructure like software
+* 🎯 This lecture: learn to define, version, and automate your infrastructure
+
+```mermaid
+flowchart LR
+  Manual[🔧 Manual Setup] -->|IaC| Code[📝 Code-Defined]
+  Code --> Reproducible[🔄 Reproducible Infrastructure]
+```
+
+---
+
+## 📍 Slide 2 – 🎯 What You Will Learn
+
+* ✅ Understand Infrastructure as Code principles
+* ✅ Compare declarative vs imperative IaC approaches
+* ✅ Apply Terraform workflows to real cloud infrastructure
+* ✅ Manage infrastructure state securely
+
+**🎓 Learning Outcomes:**
+| # | Outcome |
+|---|---------|
+| 1 | 🧠 Define IaC and explain its benefits |
+| 2 | 🔍 Distinguish between Terraform and Pulumi |
+| 3 | 🛠️ Write basic Terraform configurations |
+| 4 | 🗺️ Understand state management and security |
+
+---
+
+## 📍 Slide 3 – 📋 How This Lecture Works
+
+* 📚 **Concepts + Code examples** — hands-on focus
+* 🎮 **Real-world scenarios** — cloud provisioning challenges
+* 📝 **3 quiz checkpoints**: PRE / MID / POST
+* 🛠️ **Tool comparison**: Terraform vs Pulumi
+
+**⏱️ Lecture Structure:**
+```
+Section 0: Introduction (now)     → 📝 PRE Quiz
+Section 1: The Infrastructure Problem
+Section 2: IaC Fundamentals
+Section 3: Terraform Deep Dive    → 📝 MID Quiz
+Section 4: State & Security
+Section 5: Real World IaC
+Section 6: Reflection             → 📝 POST Quiz
+```
+
+---
+
+## 📍 Slide 4 – ❓ The Big Question
+
+* 📊 **73%** of organizations report configuration drift as a major issue
+* ⏱️ Average time to provision a server manually: **hours to days**
+* 💥 Most outages caused by **configuration changes**
+
+> 💬 *"It works in staging but not production"* — Every ops engineer, ever
+
+**🤔 Think about it:**
+* How do you recreate your production environment?
+* What happens when the person who set it up leaves?
+* Can you spin up a new environment in minutes?
+
+---
+
+## 📍 Slide 5 – 📝 QUIZ — DEVOPS_L4_PRE
+
+---
+
+## 📍 Slide 6 – 🔥 Section 1: The Infrastructure Problem
+
+* 🐶 **Pet Servers** = unique, hand-crafted, irreplaceable
+* 🔧 Manual configuration via SSH and console clicks
+* 📋 Documentation gets outdated immediately
+* 💥 Result: **snowflake infrastructure** — no two servers are the same
+
+```mermaid
+flowchart LR
+  Server1[🖥️ Server 1: Ubuntu 20 + patches]
+  Server2[🖥️ Server 2: Ubuntu 22 + different patches]
+  Server3[🖥️ Server 3: ???]
+  Server1 --> Chaos[😱 Configuration Chaos]
+  Server2 --> Chaos
+  Server3 --> Chaos
+```
+
+---
+
+## 📍 Slide 7 – 🐶 Pets vs Cattle
+
+* 🐶 **Pets**: Named servers, nursed back to health when sick
+* 🐄 **Cattle**: Numbered, identical, replaced when broken
+* 🌍 Cloud-native = cattle mindset
+
+```mermaid
+flowchart TD
+  subgraph Pets["🐶 Pets"]
+    P1[web-prod-01]
+    P2[db-master]
+    P3[app-legacy]
+  end
+  subgraph Cattle["🐄 Cattle"]
+    C1[instance-001]
+    C2[instance-002]
+    C3[instance-003]
+  end
+  Pets -->|😰 Unique, fragile| Problem[Hard to scale]
+  Cattle -->|🔄 Identical, disposable| Solution[Easy to scale]
+```
+
+> 🤔 **Think:** Are your servers pets or cattle?
+
+---
+
+## 📍 Slide 8 – 😱 Configuration Drift
+
+* 📅 Server configured once, modified many times
+* 🔧 "Quick fixes" applied directly in production
+* 📋 No record of what changed
+* 💀 Disaster recovery = guesswork
+
+```mermaid
+flowchart TD
+  Initial[✅ Initial Setup] --> Month1[📅 Month 1: Hotfix applied]
+  Month1 --> Month3[📅 Month 3: Security patch]
+  Month3 --> Month6[📅 Month 6: Unknown changes]
+  Month6 --> Drift[😱 Configuration Drift]
+  Drift --> Unknown[❓ What's actually running?]
+```
+
+**📊 The Numbers:**
+* 🔍 **65%** of downtime caused by configuration issues
+* ⏱️ Average recovery time: **4+ hours**
+* 💰 Cost per hour of downtime: **$300,000** (enterprise)
+
+---
+
+## 📍 Slide 9 – 😨 The Bus Factor
+
+* 👤 One person knows how the infrastructure works
+* 🚌 They leave, get sick, or go on vacation
+* 🙈 Nobody can recreate or fix the environment
+* 💀 Business continuity at risk
+
+> ⚠️ **Bus Factor = 1** means your infrastructure is fragile
+
+**😰 Signs of Low Bus Factor:**
+* 🔇 "Ask John, he set that up"
+* 📝 Documentation is outdated or missing
+* 🐌 Changes require specific people
+* 🚪 Knowledge walks out the door
+
+**💬 Discussion:** What's your infrastructure bus factor?
+
+---
+
+## 📍 Slide 10 – 💸 The Cost of Manual Infrastructure
+
+| 🔥 Problem | 💥 Impact |
+|------------|-----------|
+| 🐢 Slow provisioning | Days to spin up new environments |
+| 📋 Manual processes | Human error, inconsistency |
+| 👉 No audit trail | Compliance violations |
+| 🙈 Configuration drift | Unpredictable behavior |
+
+**📈 Real Numbers:**
+* 🏢 **Manual provisioning**: 2-4 hours per server
+* 🚀 **With IaC**: 2-4 minutes per server
+* 🔄 **Environment recreation**: hours vs seconds
+
+**💰 Time Cost:**
+* 👨‍💻 Engineer time: **$75-150/hour**
+* 🖥️ 10 servers manually: **$1,500-6,000**
+* 🤖 10 servers with IaC: **$25-100**
+
+---
+
+## 📍 Slide 11 – 💡 Section 2: What Infrastructure as Code Is
+
+* 📝 **IaC** = defining infrastructure in version-controlled files
+* 🔄 Infrastructure becomes **reproducible** and **auditable**
+* 🚫 No more clicking through consoles
+* 🎯 Same infrastructure, every time
+
+```mermaid
+flowchart LR
+  Code[📝 Code] -->|🔄 Apply| Cloud[☁️ Cloud]
+  Cloud --> Infra[🏗️ Infrastructure]
+  Code -->|📜 Git| Version[Version Control]
+```
+
+**📖 Definition:**
+> *Infrastructure as Code is the practice of managing and provisioning infrastructure through machine-readable configuration files rather than through manual processes or interactive tools.*
+
+---
+
+## 📍 Slide 12 – 🚫 What IaC is NOT
+
+| ❌ Myth | ✅ Reality |
+|---------|-----------|
+| "Just automation scripts" | 📝 Declarative desired state |
+| "Only for cloud" | 🖥️ Works for any infrastructure |
+| "Replaces ops people" | 🤝 Empowers ops teams |
+| "Too complex for small teams" | 🎯 Benefits scale to any size |
+| "One-time setup" | 🔄 Continuous lifecycle management |
+
+> 🔥 **Hot take:** If you can't recreate your infrastructure from code, you don't have IaC.
+
+**🎯 IaC is about:**
+* 🧠 Declarative definitions
+* 🤝 Team collaboration on infrastructure
+* 🔄 Repeatable, consistent environments
+* 📊 Audit trails and compliance
+
+---
+
+## 📍 Slide 13 – 🔀 Declarative vs Imperative
+
+```mermaid
+flowchart TD
+  subgraph Declarative
+    D1[📝 Define desired state]
+    D2[🤖 Tool figures out how]
+    D1 --> D2
+  end
+  subgraph Imperative
+    I1[📝 Define exact steps]
+    I2[🔧 Execute step by step]
+    I1 --> I2
+  end
+```
+
+| 📋 Aspect | 🌍 Declarative | 🔧 Imperative |
+|-----------|---------------|---------------|
+| 📝 What you write | Desired end state | Exact steps |
+| 🛠️ Tool | Terraform, CloudFormation | Pulumi, Scripts |
+| 🔄 Idempotency | Built-in | You implement |
+| 📚 Example | "3 VMs exist" | "Create VM 1, 2, 3" |
+
+**📚 Source:** Terraform documentation
+
+---
+
+## 📍 Slide 14 – 🛠️ IaC Tool Landscape
+
+```mermaid
+graph TD
+  IaC[🏗️ Infrastructure as Code]
+  IaC --> Prov[📦 Provisioning]
+  IaC --> Config[⚙️ Configuration]
+  Prov --> Terraform[🌍 Terraform]
+  Prov --> Pulumi[📦 Pulumi]
+  Prov --> Cloud[☁️ CloudFormation/ARM]
+  Config --> Ansible[🔧 Ansible]
+  Config --> Chef[👨‍🍳 Chef]
+  Config --> Puppet[🎭 Puppet]
+```
+
+| 🛠️ Tool | 🎯 Focus | 📝 Language |
+|---------|---------|------------|
+| 🌍 **Terraform** | Provisioning | HCL (declarative) |
+| 📦 **Pulumi** | Provisioning | Python, TS, Go |
+| 🔧 **Ansible** | Configuration | YAML |
+| ☁️ **CloudFormation** | AWS only | YAML/JSON |
+
+---
+
+## 📍 Slide 15 – ⚡ Before vs After IaC
+
+| 😰 Before | 🚀 After |
+|----------|---------|
+| 📅 Days to provision | ⚡ Minutes to provision |
+| 📋 Manual documentation | 📝 Code IS documentation |
+| 👉 "Who changed that?" | 📜 Git history shows all |
+| 😨 Fear of recreation | 💪 Confident rebuilds |
+| 🐶 Unique snowflakes | 🐄 Identical cattle |
+| 🙅 "Don't touch prod" | 🔄 Infrastructure is disposable |
+
+> 🤔 How confident are you in recreating your infrastructure?
+
+---
+
+## 📍 Slide 16 – 🎮 Section 3: Terraform Deep Dive
+
+## 🌍 Why Terraform?
+
+* 🌐 **Multi-cloud**: AWS, GCP, Azure, Yandex, and 3000+ providers
+* 📝 **HCL**: Human-readable configuration language
+* 🔄 **State management**: Tracks what exists
+* 🏢 **Industry standard**: Most widely adopted IaC tool
+
+**🎮 Let's build infrastructure.**
+
+---
+
+## 📍 Slide 17 – 📝 Terraform Workflow
+
+```mermaid
+flowchart LR
+  Write[📝 Write] --> Init[🔧 Init]
+  Init --> Plan[📋 Plan]
+  Plan --> Apply[🚀 Apply]
+  Apply --> Destroy[💥 Destroy]
+```
+
+* 📝 **Write**: Define resources in `.tf` files
+* 🔧 **Init**: Download provider plugins
+* 📋 **Plan**: Preview changes (dry run)
+* 🚀 **Apply**: Create/update infrastructure
+* 💥 **Destroy**: Remove all resources
+
+**🛠️ Commands:**
+```bash
+terraform init      # Download providers
+terraform plan      # Preview changes
+terraform apply     # Apply changes
+terraform destroy   # Remove everything
+```
+
+---
+
+## 📍 Slide 18 – 🧱 Terraform Building Blocks
+
+```mermaid
+flowchart TD
+  Config[📁 Configuration]
+  Config --> Provider[☁️ Provider]
+  Config --> Resource[🏗️ Resource]
+  Config --> Variable[📊 Variable]
+  Config --> Output[📤 Output]
+  Config --> Data[🔍 Data Source]
+```
+
+* ☁️ **Provider**: Cloud API connection (AWS, GCP, Yandex)
+* 🏗️ **Resource**: Infrastructure component (VM, network, firewall)
+* 📊 **Variable**: Configurable inputs
+* 📤 **Output**: Values to display/export
+* 🔍 **Data Source**: Query existing infrastructure
+
+---
+
+## 📍 Slide 19 – 💻 Terraform Example: VM Creation
+
+```hcl
+# ☁️ Provider configuration
+provider "yandex" {
+  zone = "ru-central1-a"
+}
+
+# 🏗️ Virtual machine resource
+resource "yandex_compute_instance" "web" {
+  name        = "web-server"
+  platform_id = "standard-v2"
+
+  resources {
+    cores  = 2
+    memory = 2
+  }
+
+  boot_disk {
+    initialize_params {
+      image_id = "fd8vmcue7aajqdge3bp0"  # Ubuntu 22.04
+    }
+  }
+}
+```
+
+**🎯 Result:** One command creates a VM in the cloud
+
+---
+
+## 📍 Slide 20 – 📊 Variables and Outputs
+
+```hcl
+# 📊 Input variables
+variable "instance_count" {
+  description = "Number of VMs to create"
+  type        = number
+  default     = 1
+}
+
+variable "environment" {
+  description = "Environment name"
+  type        = string
+}
+
+# 📤 Output values
+output "vm_ip" {
+  description = "Public IP of the VM"
+  value       = yandex_compute_instance.web.network_interface.0.nat_ip_address
+}
+```
+
+**🛠️ Usage:**
+```bash
+terraform apply -var="instance_count=3" -var="environment=prod"
+```
+
+---
+
+## 📍 Slide 21 – 🔄 Terraform Plan
+
+```mermaid
+flowchart LR
+  Code[📝 Config] --> Plan[📋 terraform plan]
+  State[📦 State] --> Plan
+  Plan --> Diff[🔍 Difference]
+  Diff --> Preview[👀 What will change?]
+```
+
+**📋 Plan Output Example:**
+```
+# yandex_compute_instance.web will be created
++ resource "yandex_compute_instance" "web" {
+    + name        = "web-server"
+    + platform_id = "standard-v2"
+    + status      = (known after apply)
+
+    + resources {
+        + cores  = 2
+        + memory = 2
+      }
+  }
+
+Plan: 1 to add, 0 to change, 0 to destroy.
+```
+
+**🎯 Always review the plan before applying!**
+
+---
+
+## 📍 Slide 22 – 📦 Pulumi Alternative
+
+```mermaid
+flowchart LR
+  Terraform[🌍 Terraform] -->|HCL| Declarative[📝 Declarative]
+  Pulumi[📦 Pulumi] -->|Python/TS/Go| Imperative[💻 Imperative]
+```
+
+**📦 Pulumi Python Example:**
+```python
+import pulumi
+import pulumi_yandex as yandex
+
+# 🏗️ Create VM using Python
+vm = yandex.ComputeInstance("web",
+    name="web-server",
+    platform_id="standard-v2",
+    resources=yandex.ComputeInstanceResourcesArgs(
+        cores=2,
+        memory=2,
+    ))
+
+# 📤 Export IP address
+pulumi.export("ip", vm.network_interfaces[0].nat_ip_address)
+```
+
+**🎯 Same result, real programming language**
+
+---
+
+## 📍 Slide 23 – ⚖️ Terraform vs Pulumi
+
+| 📋 Aspect | 🌍 Terraform | 📦 Pulumi |
+|-----------|-------------|----------|
+| 📝 Language | HCL (domain-specific) | Python, TS, Go, C# |
+| 📚 Learning curve | New syntax to learn | Familiar languages |
+| 🔄 Logic | Limited (count, for_each) | Full programming |
+| 🧪 Testing | External tools | Native unit tests |
+| 📦 State | Local or S3 | Pulumi Cloud (free tier) |
+| 🔐 Secrets | Plain in state | Encrypted by default |
+
+> ❓ **When to use which?**
+> * 🌍 **Terraform**: Larger community, more examples, declarative simplicity
+> * 📦 **Pulumi**: Complex logic, existing codebase, testing requirements
+
+---
+
+## 📍 Slide 24 – 🔐 Security Best Practices
+
+```hcl
+# ❌ NEVER do this
+provider "aws" {
+  access_key = "AKIAIOSFODNN7EXAMPLE"    # 💀 Hardcoded secret!
+  secret_key = "wJalrXUtnFEMI/..."       # 💀 Hardcoded secret!
+}
+
+# ✅ Use environment variables
+# export AWS_ACCESS_KEY_ID="..."
+# export AWS_SECRET_ACCESS_KEY="..."
+provider "aws" {
+  # Automatically uses env vars
+}
+```
+
+**🔐 Security Rules:**
+* 🚫 Never commit secrets to Git
+* 📁 Use `.gitignore` for state and tfvars
+* 🔑 Use environment variables or secret managers
+* 🔒 Encrypt state file at rest
+
+---
+
+## 📍 Slide 25 – 📝 QUIZ — DEVOPS_L4_MID
+
+---
+
+## 📍 Slide 26 – 📦 Section 4: State Management
+
+## 🗃️ What is Terraform State?
+
+* 📝 Maps configuration to real-world resources
+* 🔍 Tracks what Terraform manages
+* 🔄 Determines what changes are needed
+* ⚠️ Contains sensitive data
+
+```mermaid
+flowchart LR
+  Config[📝 Config Files] --> TF[🌍 Terraform]
+  State[📦 State File] --> TF
+  TF --> Cloud[☁️ Real Infrastructure]
+  Cloud --> State
+```
+
+---
+
+## 📍 Slide 27 – 📁 State File Contents
+
+```json
+{
+  "version": 4,
+  "terraform_version": "1.9.0",
+  "resources": [
+    {
+      "type": "yandex_compute_instance",
+      "name": "web",
+      "instances": [
+        {
+          "attributes": {
+            "id": "fhm1234567890",
+            "name": "web-server",
+            "network_interface": [
+              {
+                "ip_address": "192.168.1.10",
+                "nat_ip_address": "51.250.1.100"
+              }
+            ]
+          }
+        }
+      ]
+    }
+  ]
+}
+```
+
+**⚠️ Never edit state manually!**
+
+---
+
+## 📍 Slide 28 – 🌐 Remote State
+
+```mermaid
+flowchart TD
+  Dev1[👨‍💻 Developer 1] --> Remote[🌐 Remote State]
+  Dev2[👨‍💻 Developer 2] --> Remote
+  Dev3[👨‍💻 Developer 3] --> Remote
+  Remote --> Cloud[☁️ Cloud Infrastructure]
+```
+
+**🌐 Remote State Benefits:**
+* 🤝 Team collaboration
+* 🔒 Locking prevents conflicts
+* 🔐 Encrypted at rest
+* 📜 Versioning and backup
+
+**📦 Backend Options:**
+* ☁️ **S3/GCS**: Object storage
+* 🏢 **Terraform Cloud**: HashiCorp managed
+* 🔐 **Consul**: HashiCorp key-value store with state locking
+
+---
+
+## 📍 Slide 29 – 📊 IaC Metrics
+
+| 📊 Metric | 📏 Measures | 🏆 Target |
+|-----------|------------|---------|
+| ⏱️ **Provisioning Time** | Time to create env | < 15 minutes |
+| 🔄 **Environment Parity** | Dev = Staging = Prod | 100% |
+| ❌ **Drift Detection** | Config drift incidents | 0 per month |
+| 📜 **Audit Compliance** | Changes tracked in Git | 100% |
+
+> 📚 These metrics indicate IaC maturity.
+
+**🤔 Question:** How long does it take to spin up a new environment?
+
+---
+
+## 📍 Slide 30 – 🌊 From Snowflakes to Cattle
+
+```mermaid
+flowchart LR
+  subgraph Snowflakes["😱 Snowflakes"]
+    Manual[🔧 Manual Setup]
+    Unique[❄️ Unique Servers]
+    Drift[📋 Configuration Drift]
+  end
+  subgraph Cattle["🐄 Cattle"]
+    Code[📝 Code-Defined]
+    Identical[🔄 Identical Servers]
+    Reproducible[✅ Reproducible]
+  end
+  Snowflakes -->|🚀 IaC| Cattle
+```
+
+**🎯 Goal State:**
+* ⚡ Any environment recreatable in minutes
+* 🔄 All changes through code review
+* 📈 Teams deploy infrastructure confidently
+
+---
+
+## 📍 Slide 31 – 🏢 Section 5: IaC in Real Life
+
+## 📅 A Day with IaC
+
+**☀️ Morning:**
+* 📊 Review infrastructure PR
+* 👀 Check `terraform plan` output
+* ✅ Approve and merge
+
+**🌤️ Afternoon:**
+* 🚨 Need new test environment
+* 🔧 Copy `terraform.tfvars`
+* 🚀 `terraform apply` — **done in 10 minutes**
+
+**🌙 Evening:**
+* 🗑️ `terraform destroy` test environment
+* 💰 No resources running overnight
+
+---
+
+## 📍 Slide 32 – 👥 IaC Team Workflow
+
+| 👤 Role | 🎯 IaC Responsibility |
+|---------|----------------------|
+| 🔧 **DevOps/Platform** | Write and maintain IaC modules |
+| 👨‍💻 **Developer** | Use modules, request infrastructure |
+| 🛡️ **Security** | Review IaC for compliance |
+| 📊 **FinOps** | Monitor infrastructure costs |
+
+**🔗 Common Workflow:**
+* 📝 Create branch with IaC changes
+* 🔍 CI runs `terraform plan`
+* 👀 Team reviews the plan
+* ✅ Merge triggers `terraform apply`
+
+---
+
+## 📍 Slide 33 – 🤝 GitOps for Infrastructure
+
+```mermaid
+flowchart TD
+  Dev[👨‍💻 Developer] -->|📝 PR| Git[🐙 Git Repository]
+  Git -->|🔄 CI/CD| Plan[📋 Terraform Plan]
+  Plan -->|👀 Review| Approve[✅ Approve]
+  Approve -->|🚀 Merge| Apply[🌍 Terraform Apply]
+  Apply --> Cloud[☁️ Infrastructure]
+```
+
+**🤝 GitOps Practices:**
+* 📟 All changes through pull requests
+* 📝 Plan output in PR comments
+* 👥 Required approvals
+* 🔒 Protected main branch
+
+---
+
+## 📍 Slide 34 – 📈 Career Path: IaC Skills
+
+```mermaid
+flowchart LR
+  Junior[🌱 Junior: Basic Terraform] --> Mid[💼 Mid: Modules & CI/CD]
+  Mid --> Senior[⭐ Senior: Multi-cloud & Architecture]
+  Senior --> Principal[🏆 Principal: Platform Strategy]
+```
+
+**🛠️ Skills to Build:**
+* 🌍 Terraform HCL fluency
+* ☁️ Cloud provider APIs
+* 🔐 Security best practices
+* 📦 Module design
+* 🔄 CI/CD integration
+
+---
+
+## 📍 Slide 35 – 🌍 Real Company Examples
+
+**🏢 HashiCorp Customers:**
+* 🏦 **Stripe**: Terraform for AWS infrastructure
+* 🎮 **Riot Games**: Multi-cloud with Terraform
+* 🛒 **Shopify**: Thousands of resources managed
+
+**☁️ Cloud Native:**
+* 🔍 **Google**: Uses Terraform internally
+* 📦 **Spotify**: IaC for Kubernetes infrastructure
+* 🎬 **Netflix**: Custom tooling built on IaC principles
+
+**📊 Stats:**
+* 🌍 **2M+** Terraform users worldwide
+* 📦 **3000+** providers available
+* 🏢 **Fortune 500**: 85% use IaC
+
+---
+
+## 📍 Slide 36 – 🎯 Section 6: Reflection
+
+## 📝 Key Takeaways
+
+1. 🏗️ **IaC = Infrastructure defined in code**
+2. 🐄 **Cattle not pets** — servers are disposable
+3. 📝 **Version control everything** — Git for infrastructure
+4. 📋 **Plan before apply** — always review changes
+5. 🔐 **Never commit secrets** — use environment variables
+
+> 💡 If you can't recreate it from code, it's not really infrastructure as code.
+
+---
+
+## 📍 Slide 37 – 🧠 The Mindset Shift
+
+| 😰 Old Mindset | 🚀 IaC Mindset |
+|---------------|------------------|
+| 🙅 "SSH and fix it" | 📝 "Change the code" |
+| 🚫 "Don't touch that server" | 💪 "Destroy and recreate" |
+| 👉 "Who set this up?" | 📜 "Git blame shows history" |
+| 😨 "Manual is faster" | ⚡ "Automation is faster at scale" |
+| 💻 "Works on my cloud" | 🌍 "Works on any cloud" |
+
+> ❓ Which mindset describes your team?
+
+---
+
+## 📍 Slide 38 – ✅ Your Progress
+
+## 🎓 What You Now Understand
+
+* ✅ Why IaC is essential for modern infrastructure
+* ✅ The difference between declarative and imperative
+* ✅ How Terraform and Pulumi work
+* ✅ State management and security practices
+* ✅ Real-world IaC workflows
+
+> 🚀 **You're ready for Lab 4: Terraform & Pulumi**
+
+---
+
+## 📍 Slide 39 – 📝 QUIZ — DEVOPS_L4_POST
+
+---
+
+## 📍 Slide 40 – 🚀 What Comes Next
+
+## 📚 Next Lecture: Configuration Management with Ansible
+
+* 🔧 Ansible fundamentals
+* 📦 Roles and playbooks
+* 🤖 Automating server configuration
+* 💻 Hands-on: Deploying Docker with Ansible
+
+**🎉 Your IaC journey begins.**
+
+> 🐄 From snowflakes to cattle — one terraform apply at a time.
+
+```mermaid
+flowchart LR
+  You[👤 You] --> IaC[🏗️ IaC Skills]
+  IaC --> Reproducible[🔄 Reproducible Infra]
+  Reproducible --> Career[🚀 Career Growth]
+```
+
+**👋 See you in the next lecture!**
+
+---
+
+## 📚 Resources & Further Reading
+
+**📕 Books:**
+* 📖 *Terraform: Up & Running* — Yevgeniy Brikman
+* 📖 *Infrastructure as Code* — Kief Morris
+* 📖 *The DevOps Handbook* — Gene Kim et al.
+
+**🔗 Links:**
+* 🌐 [Terraform Documentation](https://developer.hashicorp.com/terraform/docs)
+* 🌐 [Pulumi Documentation](https://www.pulumi.com/docs/)
+* 🌐 [Terraform Registry](https://registry.terraform.io/)
+
+---
diff --git a/lectures/lec5.md b/lectures/lec5.md
new file mode 100644
index 0000000000..5bcfba6c1a
--- /dev/null
+++ b/lectures/lec5.md
@@ -0,0 +1,824 @@
+# 📌 Lecture 5 — Configuration Management: Ansible Fundamentals
+
+## 📍 Slide 1 – 🚀 Welcome to Configuration Management
+
+* 🌍 **Infrastructure is provisioned** — but what about configuring it?
+* 😰 Manual server setup leads to inconsistency and errors
+* 🔧 **Ansible automates configuration** — repeatable, reliable, documented
+* 🎯 This lecture: master Ansible roles, playbooks, and best practices
+
+```mermaid
+flowchart LR
+  Provision[🏗️ Terraform: Create VMs] --> Configure[🔧 Ansible: Configure VMs]
+  Configure --> Ready[✅ Ready to Run Apps]
+```
+
+---
+
+## 📍 Slide 2 – 🎯 What You Will Learn
+
+* ✅ Understand Ansible architecture and concepts
+* ✅ Write idempotent playbooks and roles
+* ✅ Secure credentials with Ansible Vault
+* ✅ Apply configuration management best practices
+
+**🎓 Learning Outcomes:**
+| # | Outcome |
+|---|---------|
+| 1 | 🧠 Explain Ansible's agentless architecture |
+| 2 | 🔍 Create reusable roles for configuration |
+| 3 | 🛠️ Write idempotent tasks and handlers |
+| 4 | 🗺️ Secure secrets with Ansible Vault |
+
+---
+
+## 📍 Slide 3 – 📋 How This Lecture Works
+
+* 📚 **Concepts + YAML examples** — hands-on learning
+* 🎮 **Real-world scenarios** — server configuration challenges
+* 📝 **3 quiz checkpoints**: PRE / MID / POST
+* 🛠️ **Best practices**: roles, handlers, idempotency
+
+**⏱️ Lecture Structure:**
+```
+Section 0: Introduction (now)     → 📝 PRE Quiz
+Section 1: The Configuration Problem
+Section 2: Ansible Fundamentals
+Section 3: Roles & Playbooks      → 📝 MID Quiz
+Section 4: Idempotency & Handlers
+Section 5: Real World Ansible
+Section 6: Reflection             → 📝 POST Quiz
+```
+
+---
+
+## 📍 Slide 4 – ❓ The Big Question
+
+* 📊 **94%** of organizations experienced security incidents from misconfigurations
+* ⏱️ Average time to configure a server manually: **2-4 hours**
+* 💥 Most configuration drift goes **undetected for months**
+
+> 💬 *"I installed it the same way... I think"* — Every sysadmin, ever
+
+**🤔 Think about it:**
+* How do you ensure 100 servers have identical configs?
+* What happens when you need to update a package on all servers?
+* Can you prove compliance across your infrastructure?
+
+---
+
+## 📍 Slide 5 – 📝 QUIZ — DEVOPS_L5_PRE
+
+---
+
+## 📍 Slide 6 – 🔥 Section 1: The Configuration Problem
+
+* 🔧 **Manual configuration** = SSH into each server
+* 📋 Run commands, edit files, install packages
+* 📝 Document steps (that nobody reads)
+* 💥 Result: **no two servers are identical**
+
+```mermaid
+flowchart LR
+  Admin[👤 Admin] -->|SSH| Server1[🖥️ Server 1]
+  Admin -->|SSH| Server2[🖥️ Server 2]
+  Admin -->|SSH| Server3[🖥️ Server 3]
+  Server1 --> Drift1[📋 Config A]
+  Server2 --> Drift2[📋 Config B]
+  Server3 --> Drift3[📋 Config ???]
+```
+
+---
+
+## 📍 Slide 7 – 🐚 Shell Script Approach
+
+* 📝 Write bash scripts to automate
+* 🔄 Run scripts on each server
+* ⚠️ Problem: Scripts aren't idempotent
+
+```bash
+#!/bin/bash
+# 😰 What happens if you run this twice?
+apt-get update
+apt-get install -y nginx
+echo "Welcome" > /var/www/html/index.html
+systemctl start nginx
+```
+
+**💥 Issues:**
+* 🔄 Re-running may cause errors
+* 😰 No rollback mechanism
+* 📋 No state tracking
+* 🔗 No dependency management
+
+> 🤔 **Think:** What if nginx is already installed?
+
+---
+
+## 📍 Slide 8 – 😱 Configuration Management Challenges
+
+* 📅 100 servers need the same update
+* 🔧 Some servers have different OS versions
+* 📋 Some packages conflict with others
+* 💀 One mistake = hours of cleanup
+
+```mermaid
+flowchart TD
+  Update[📦 Update Required] --> S1[🖥️ Server 1: Ubuntu 20]
+  Update --> S2[🖥️ Server 2: Ubuntu 22]
+  Update --> S3[🖥️ Server 3: Ubuntu 24]
+  S1 --> Problem1[😰 Different package versions]
+  S2 --> Problem2[😰 Different dependencies]
+  S3 --> Problem3[😰 Different configs needed]
+```
+
+**📊 The Numbers:**
+* 🔍 **85%** of breaches involve misconfiguration
+* ⏱️ Manual update of 100 servers: **days**
+* 💰 Cost of configuration-related downtime: **$5,600/minute**
+
+---
+
+## 📍 Slide 9 – 😨 Documentation Drift
+
+* 📝 Documentation written once
+* 🔧 Server modified many times
+* 📋 Documentation never updated
+* 💀 Reality ≠ documentation
+
+> ⚠️ **Outdated docs are worse than no docs**
+
+**😰 Signs of Documentation Drift:**
+* 🔇 "The wiki says X but we do Y now"
+* 📝 Multiple conflicting runbooks
+* 🐌 New hires struggle to onboard
+* 🚪 Knowledge leaves with employees
+
+**💬 Discussion:** How current is your documentation?
+
+---
+
+## 📍 Slide 10 – 💸 The Cost of Manual Configuration
+
+| 🔥 Problem | 💥 Impact |
+|------------|-----------|
+| 🐢 Slow updates | Security vulnerabilities linger |
+| 📋 Manual errors | Downtime from typos |
+| 👉 Inconsistency | "Works on server 1 but not 2" |
+| 🙈 No audit trail | Compliance failures |
+
+**📈 Real Numbers:**
+* 🏢 **Manual config time**: 2-4 hours per server
+* 🚀 **With Ansible**: 5-10 minutes per server
+* 🔄 **Scaling**: minutes vs days
+
+**💰 ROI Example:**
+* 👨‍💻 100 servers × 3 hours × $75/hour = **$22,500**
+* 🤖 Ansible: 1 hour setup + seconds to run = **$75**
+
+---
+
+## 📍 Slide 11 – 💡 Section 2: What Ansible Is
+
+* 🔧 **Configuration management tool** — automate server setup
+* 🌐 **Agentless** — uses SSH, no agents to install
+* 📝 **YAML-based** — human-readable playbooks
+* 🔄 **Idempotent** — safe to run multiple times
+
+```mermaid
+flowchart LR
+  Control[💻 Control Node] -->|SSH| Node1[🖥️ Managed Node]
+  Control -->|SSH| Node2[🖥️ Managed Node]
+  Control -->|SSH| Node3[🖥️ Managed Node]
+```
+
+**📖 Definition:**
+> *Ansible is an open-source automation tool for configuration management, application deployment, and task automation using a simple YAML syntax.*
+
+---
+
+## 📍 Slide 12 – 🚫 What Ansible is NOT
+
+| ❌ Myth | ✅ Reality |
+|---------|-----------|
+| "Replaces Terraform" | 🤝 They complement each other |
+| "Requires agents" | 🌐 Agentless, SSH-based |
+| "Only for Linux" | 🪟 Works with Windows too |
+| "Just a scripting tool" | 📦 Full configuration management |
+| "Hard to learn" | 📝 YAML is simple |
+
+> 🔥 **Hot take:** Terraform provisions, Ansible configures. Use both.
+
+**🎯 Ansible is about:**
+* 🧠 Declarative configuration
+* 🤝 Consistent state across servers
+* 🔄 Repeatable automation
+* 📊 Self-documenting infrastructure
+
+---
+
+## 📍 Slide 13 – 🏗️ Ansible Architecture
+
+```mermaid
+flowchart TD
+  Control[💻 Control Node]
+  Control --> Inventory[📋 Inventory]
+  Control --> Playbook[📝 Playbook]
+  Control --> Modules[📦 Modules]
+  Inventory --> Managed[🖥️ Managed Nodes]
+  Playbook --> Managed
+  Modules --> Managed
+```
+
+| 🧱 Component | 🎯 Purpose |
+|-------------|----------|
+| 💻 **Control Node** | Where Ansible runs |
+| 📋 **Inventory** | List of managed servers |
+| 📝 **Playbook** | Automation instructions |
+| 📦 **Modules** | Units of work (apt, copy, service) |
+| 🖥️ **Managed Nodes** | Target servers |
+
+---
+
+## 📍 Slide 14 – 📋 Inventory Basics
+
+```ini
+# inventory/hosts.ini
+[webservers]
+web1 ansible_host=192.168.1.10
+web2 ansible_host=192.168.1.11
+
+[databases]
+db1 ansible_host=192.168.1.20
+
+[all:vars]
+ansible_user=ubuntu
+ansible_python_interpreter=/usr/bin/python3
+```
+
+**🎯 Inventory Features:**
+* 📁 Group servers logically
+* 🔧 Set per-host or per-group variables
+* 🌐 Static files or dynamic discovery
+* 🏷️ Use patterns: `webservers`, `all`, `db*`
+
+---
+
+## 📍 Slide 15 – ⚡ Before vs After Ansible
+
+| 😰 Before | 🚀 After |
+|----------|---------|
+| 📅 SSH into each server | 🤖 One command for all |
+| 📋 Manual steps | 📝 Documented playbooks |
+| 👉 "Run these commands" | ✅ "Desired state defined" |
+| 😨 Fear of updates | 💪 Confident automation |
+| 🐌 Hours per server | ⚡ Seconds per server |
+| 📝 Outdated wiki | 📄 Living documentation |
+
+> 🤔 How much time does your team spend on manual configuration?
+
+---
+
+## 📍 Slide 16 – 🎮 Section 3: Roles & Playbooks
+
+## 📝 Playbook Basics
+
+* 📄 YAML file with automation tasks
+* 🎯 Defines desired state
+* 🔄 Executes on target hosts
+* 📦 Groups related tasks
+
+**🎮 Let's write some Ansible.**
+
+---
+
+## 📍 Slide 17 – 📝 Simple Playbook Example
+
+```yaml
+---
+# playbook.yml
+- name: Configure web servers
+  hosts: webservers
+  become: true  # 🔐 Run as root
+
+  tasks:
+    - name: Update apt cache
+      apt:
+        update_cache: true
+        cache_valid_time: 3600
+
+    - name: Install nginx
+      apt:
+        name: nginx
+        state: present
+
+    - name: Start nginx
+      service:
+        name: nginx
+        state: started
+        enabled: true
+```
+
+**🛠️ Run it:**
+```bash
+ansible-playbook -i inventory/hosts.ini playbook.yml
+```
+
+---
+
+## 📍 Slide 18 – 📦 Why Roles?
+
+```mermaid
+flowchart TD
+  subgraph ❌ Without Roles
+    P1[📝 One huge playbook]
+    P1 --> Problem[😰 Hard to maintain]
+  end
+  subgraph ✅ With Roles
+    R1[📦 common role]
+    R2[📦 docker role]
+    R3[📦 app role]
+    R1 --> Reuse[🔄 Reusable]
+    R2 --> Reuse
+    R3 --> Reuse
+  end
+```
+
+**📦 Role Benefits:**
+* 🔄 **Reusability**: Use across projects
+* 📁 **Organization**: Clear structure
+* 🧪 **Testability**: Test roles independently
+* 🤝 **Sharing**: Ansible Galaxy
+
+---
+
+## 📍 Slide 19 – 📁 Role Structure
+
+```
+roles/
+├── docker/
+│   ├── tasks/
+│   │   └── main.yml      # 🎯 Main tasks
+│   ├── handlers/
+│   │   └── main.yml      # 🔔 Event handlers
+│   ├── defaults/
+│   │   └── main.yml      # 📊 Default variables
+│   ├── templates/
+│   │   └── config.j2     # 📝 Jinja2 templates
+│   └── files/
+│       └── script.sh     # 📄 Static files
+```
+
+**🔑 Key Directories:**
+* 📁 **tasks/**: What to do
+* 📁 **handlers/**: React to changes
+* 📁 **defaults/**: Default values (low priority)
+* 📁 **templates/**: Dynamic file templates
+* 📁 **files/**: Static files to copy
+
+---
+
+## 📍 Slide 20 – 🐳 Docker Role Example
+
+```yaml
+# roles/docker/tasks/main.yml
+---
+- name: Install Docker prerequisites
+  apt:
+    name:
+      - apt-transport-https
+      - ca-certificates
+      - curl
+    state: present
+
+- name: Add Docker GPG key
+  apt_key:
+    url: https://download.docker.com/linux/ubuntu/gpg
+    state: present
+
+- name: Add Docker repository
+  apt_repository:
+    repo: "deb https://download.docker.com/linux/ubuntu {{ ansible_distribution_release }} stable"
+    state: present
+
+- name: Install Docker
+  apt:
+    name: docker-ce
+    state: present
+  notify: restart docker
+```
+
+---
+
+## 📍 Slide 21 – 🔔 Handlers
+
+```yaml
+# roles/docker/handlers/main.yml
+---
+- name: restart docker
+  service:
+    name: docker
+    state: restarted
+```
+
+**🔔 Handler Features:**
+* 🔄 Only run when notified
+* ⏱️ Run once at end of play
+* 🎯 React to configuration changes
+* 💡 Prevent unnecessary restarts
+
+```yaml
+# tasks/main.yml
+- name: Update Docker config
+  template:
+    src: daemon.json.j2
+    dest: /etc/docker/daemon.json
+  notify: restart docker  # 🔔 Trigger handler
+```
+
+---
+
+## 📍 Slide 22 – 📊 Variables & Defaults
+
+```yaml
+# roles/docker/defaults/main.yml
+---
+docker_version: "24.0"
+docker_users:
+  - ubuntu
+docker_log_driver: "json-file"
+docker_log_max_size: "10m"
+```
+
+**📊 Variable Precedence (lowest to highest):**
+1. 📁 Role defaults
+2. 📋 Inventory variables
+3. 📄 Playbook vars
+4. 🔧 Command line (`-e var=value`)
+
+```yaml
+# Using variables in tasks
+- name: Install Docker {{ docker_version }}
+  apt:
+    name: "docker-ce={{ docker_version }}*"
+    state: present
+```
+
+---
+
+## 📍 Slide 23 – 📝 Using Roles in Playbooks
+
+```yaml
+# playbooks/provision.yml
+---
+- name: Provision web servers
+  hosts: webservers
+  become: true
+
+  roles:
+    - common      # 📦 Install common packages
+    - docker      # 🐳 Install Docker
+    - app_deploy  # 🚀 Deploy application
+```
+
+**🎯 Clean and simple!**
+
+```mermaid
+flowchart LR
+  Playbook[📝 Playbook] --> Common[📦 common]
+  Playbook --> Docker[🐳 docker]
+  Playbook --> App[🚀 app_deploy]
+  Common --> Result[✅ Configured Server]
+  Docker --> Result
+  App --> Result
+```
+
+---
+
+## 📍 Slide 24 – 🔐 Ansible Vault
+
+```bash
+# 🔐 Create encrypted file
+ansible-vault create group_vars/all.yml
+
+# 📝 Edit encrypted file
+ansible-vault edit group_vars/all.yml
+
+# 👀 View encrypted file
+ansible-vault view group_vars/all.yml
+```
+
+**🔐 Encrypted Content:**
+```yaml
+---
+# group_vars/all.yml (encrypted)
+dockerhub_username: myuser
+dockerhub_password: super_secret_token
+app_secret_key: very_secret_key_123
+```
+
+**🛠️ Using Vault:**
+```bash
+ansible-playbook playbook.yml --ask-vault-pass
+# Or use password file (gitignored!)
+ansible-playbook playbook.yml --vault-password-file .vault_pass
+```
+
+---
+
+## 📍 Slide 25 – 📝 QUIZ — DEVOPS_L5_MID
+
+---
+
+## 📍 Slide 26 – 🔄 Section 4: Idempotency
+
+## ♾️ What is Idempotency?
+
+* 🔄 Same result whether run once or many times
+* ✅ Safe to re-run playbooks
+* 📊 Converges to desired state
+* 🎯 No unintended side effects
+
+```mermaid
+flowchart LR
+  Run1[🚀 First Run] --> State[✅ Desired State]
+  Run2[🚀 Second Run] --> State
+  Run3[🚀 Third Run] --> State
+```
+
+**🎨 Output Colors:**
+* 🟢 **ok**: Already in desired state
+* 🟡 **changed**: Made a change
+* 🔴 **failed**: Task failed
+* 🔵 **skipped**: Task skipped (shown in cyan)
+
+---
+
+## 📍 Slide 27 – 🔄 Idempotent vs Non-Idempotent
+
+```yaml
+# ❌ Non-idempotent (shell command)
+- name: Add line to file
+  shell: echo "config=value" >> /etc/app.conf
+  # 💥 Adds line EVERY time!
+
+# ✅ Idempotent (lineinfile module)
+- name: Ensure line in file
+  lineinfile:
+    path: /etc/app.conf
+    line: "config=value"
+    state: present
+  # ✅ Only adds if missing!
+```
+
+**📦 Idempotent Modules:**
+| Module | Purpose | Idempotent? |
+|--------|---------|-------------|
+| `apt` | Install packages | ✅ Yes |
+| `service` | Manage services | ✅ Yes |
+| `file` | Manage files | ✅ Yes |
+| `shell` | Run commands | ❌ Usually no |
+| `command` | Run commands | ❌ Usually no |
+
+---
+
+## 📍 Slide 28 – 🧪 Testing Idempotency
+
+```mermaid
+flowchart TD
+  Run1[🚀 First Run] --> Changed[🟡 changed: 15]
+  Run2[🚀 Second Run] --> Ok[🟢 changed: 0]
+  Ok --> Idempotent[✅ Playbook is Idempotent!]
+```
+
+**🧪 Test Process:**
+1. 🚀 Run playbook first time → many changes
+2. 🚀 Run playbook second time → **zero changes**
+3. ✅ If the second run shows `changed=0`, your playbook is idempotent
+
+**📊 Example Output:**
+```
+PLAY RECAP
+server1 : ok=15  changed=0  unreachable=0  failed=0
+```
+
+---
+
+## 📍 Slide 29 – 📊 Configuration Management Metrics
+
+| 📊 Metric | 📏 Measures | 🏆 Target |
+|-----------|------------|---------|
+| ⏱️ **Config Time** | Time to configure server | < 15 minutes |
+| 🔄 **Drift Rate** | Servers with drift | 0% |
+| ✅ **Idempotency** | Re-run changes | 0 changes |
+| 📜 **Compliance** | Servers meeting policy | 100% |
+
+> 📚 These metrics indicate configuration management maturity.
+
+**🤔 Question:** What happens when you re-run your playbooks?
+
+---
+
+## 📍 Slide 30 – 🌊 From Manual to Automated
+
+```mermaid
+flowchart LR
+  subgraph 😱 Manual
+    SSH[🔌 SSH Sessions]
+    Commands[💻 Run Commands]
+    Hope[🙏 Hope It Works]
+  end
+  subgraph 🤖 Automated
+    Playbook[📝 Playbooks]
+    Roles[📦 Roles]
+    Consistent[✅ Consistent]
+  end
+  Manual -->|🚀 Ansible| Automated
+```
+
+**🎯 Automation State:**
+* ⚡ Any server configurable in minutes
+* 🔄 All changes through playbooks
+* 📈 Teams deploy configuration confidently
+
+---
+
+## 📍 Slide 31 – 🏢 Section 5: Ansible in Real Life
+
+## 📅 A Day with Ansible
+
+**☀️ Morning:**
+* 📊 Review Ansible PR for new role
+* 👀 Check syntax with `ansible-lint`
+* ✅ Merge to main branch
+
+**🌤️ Afternoon:**
+* 🚨 Security patch needed
+* 🔧 Update role with new package version
+* 🚀 Run playbook — **all servers patched in 10 minutes**
+
+**🌙 Evening:**
+* 🤖 Scheduled playbook runs
+* 📊 Compliance reports generated
+* 🏠 Go home confident
+
+---
+
+## 📍 Slide 32 – 👥 Team Ansible Workflow
+
+| 👤 Role | 🎯 Ansible Responsibility |
+|---------|----------------------|
+| 🔧 **DevOps** | Write and maintain roles |
+| 👨‍💻 **Developer** | Request configuration changes |
+| 🛡️ **Security** | Review roles for compliance |
+| 📊 **Audit** | Verify configuration state |
+
+**🔗 Common Workflow:**
+* 📝 Create branch with role changes
+* 🔍 CI runs `ansible-lint` and syntax check
+* 👀 Team reviews the changes
+* ✅ Merge triggers playbook run
+
+---
+
+## 📍 Slide 33 – 🤝 Ansible + Terraform
+
+```mermaid
+flowchart LR
+  TF[🌍 Terraform] -->|Creates| VM[🖥️ Virtual Machine]
+  VM -->|IP Address| Ansible[🔧 Ansible]
+  Ansible -->|Configures| Ready[✅ Ready Server]
+```
+
+**🤝 Integration Patterns:**
+* 🌍 Terraform provisions infrastructure
+* 📋 Terraform outputs inventory
+* 🔧 Ansible configures servers
+* 🔄 Both stored in Git
+
+**💡 Best Practice:**
+* 🏗️ Terraform = **what** exists
+* 🔧 Ansible = **how** it's configured
+
+---
+
+## 📍 Slide 34 – 📈 Career Path: Ansible Skills
+
+```mermaid
+flowchart LR
+  Junior[🌱 Junior: Basic Playbooks] --> Mid[💼 Mid: Roles & Vault]
+  Mid --> Senior[⭐ Senior: Dynamic Inventory & CI/CD]
+  Senior --> Principal[🏆 Principal: Enterprise Automation]
+```
+
+**🛠️ Skills to Build:**
+* 📝 YAML and Jinja2 fluency
+* 📦 Role design patterns
+* 🔐 Vault and secrets management
+* 🌐 Dynamic inventory
+* 🔄 CI/CD integration
+
+---
+
+## 📍 Slide 35 – 🌍 Real Company Examples
+
+**🏢 Enterprise Users:**
+* 🏦 **NASA**: Manages thousands of servers
+* 🎮 **EA Games**: Game server configuration
+* 🛒 **Walmart**: Retail infrastructure
+
+**☁️ Cloud Native:**
+* 🔍 **Twitter**: Configuration at scale
+* 📦 **Lyft**: Microservices configuration
+* 🎬 **Apple**: Device management
+
+**📊 Stats:**
+* 🌍 **#1** open-source automation tool
+* 📦 **30,000+** modules available
+* 🏢 **Most used** by Fortune 100
+
+---
+
+## 📍 Slide 36 – 🎯 Section 6: Reflection
+
+## 📝 Key Takeaways
+
+1. 🔧 **Ansible = Agentless configuration management**
+2. 📦 **Roles organize** reusable automation
+3. 🔄 **Idempotency** makes re-runs safe
+4. 🔔 **Handlers** efficiently manage service restarts
+5. 🔐 **Vault encrypts** sensitive data
+
+> 💡 Ansible playbooks are living documentation of your infrastructure.
+
+---
+
+## 📍 Slide 37 – 🧠 The Mindset Shift
+
+| 😰 Old Mindset | 🚀 Ansible Mindset |
+|---------------|------------------|
+| 🙅 "SSH and run commands" | 📝 "Define in playbook" |
+| 🚫 "Each server is unique" | 🔄 "All servers are identical" |
+| 👉 "Document the steps" | 📄 "Code IS documentation" |
+| 😨 "Updates are risky" | 💪 "Updates are automated" |
+| 💻 "Works on my server" | 🌍 "Works on all servers" |
+
+> ❓ Which mindset describes your team?
+
+---
+
+## 📍 Slide 38 – ✅ Your Progress
+
+## 🎓 What You Now Understand
+
+* ✅ Ansible's agentless architecture
+* ✅ How to write playbooks and roles
+* ✅ Why idempotency matters
+* ✅ How handlers improve efficiency
+* ✅ Securing secrets with Vault
+
+> 🚀 **You're ready for Lab 5: Ansible Fundamentals**
+
+---
+
+## 📍 Slide 39 – 📝 QUIZ — DEVOPS_L5_POST
+
+---
+
+## 📍 Slide 40 – 🚀 What Comes Next
+
+## 📚 Next Lecture: Continuous Deployment with Ansible
+
+* 🚀 Application deployment roles
+* 🐳 Docker Compose templates
+* 🏷️ Tags and blocks
+* 💻 Hands-on: Deploying your app with Ansible
+
+**🎉 Your configuration automation journey continues.**
+
+> 🔧 From manual to automated — one playbook at a time.
+
+```mermaid
+flowchart LR
+  You[👤 You] --> Ansible[🔧 Ansible Skills]
+  Ansible --> Automated[🤖 Automated Config]
+  Automated --> Career[🚀 Career Growth]
+```
+
+**👋 See you in the next lecture!**
+
+---
+
+## 📚 Resources & Further Reading
+
+**📕 Books:**
+* 📖 *Ansible: Up & Running* — Lorin Hochstein
+* 📖 *Ansible for DevOps* — Jeff Geerling
+* 📖 *The Practice of Cloud System Administration* — Limoncelli
+
+**🔗 Links:**
+* 🌐 [Ansible Documentation](https://docs.ansible.com/)
+* 🌐 [Ansible Galaxy](https://galaxy.ansible.com/)
+* 🌐 [Ansible Best Practices](https://docs.ansible.com/ansible/latest/tips_tricks/ansible_tips_tricks.html)
+
+---
diff --git a/lectures/lec6.md b/lectures/lec6.md
new file mode 100644
index 0000000000..a78ba20b5b
--- /dev/null
+++ b/lectures/lec6.md
@@ -0,0 +1,887 @@
+# 📌 Lecture 6 — Continuous Deployment: Advanced Ansible
+
+## 📍 Slide 1 – 🚀 Welcome to Continuous Deployment
+
+* 🌍 **Configuration is automated** — but what about deployments?
+* 😰 Manual deployments are slow, error-prone, and risky
+* 🚀 **CI/CD with Ansible** = automated, repeatable, safe deployments
+* 🎯 This lecture: master blocks, tags, Docker Compose, and CI/CD integration
+
+```mermaid
+flowchart LR
+  Code[💻 Code Push] -->|CI/CD| Build[🔨 Build]
+  Build --> Deploy[🚀 Ansible Deploy]
+  Deploy --> Running[✅ Running in Production]
+```
+
+---
+
+## 📍 Slide 2 – 🎯 What You Will Learn
+
+* ✅ Use blocks for error handling and task grouping
+* ✅ Apply tags for selective execution
+* ✅ Deploy applications with Docker Compose templates
+* ✅ Integrate Ansible with GitHub Actions
+
+**🎓 Learning Outcomes:**
+| # | Outcome |
+|---|---------|
+| 1 | 🧠 Implement blocks with rescue and always |
+| 2 | 🔍 Design effective tag strategies |
+| 3 | 🛠️ Template Docker Compose files with Jinja2 |
+| 4 | 🗺️ Automate deployments with CI/CD |
+
+---
+
+## 📍 Slide 3 – 📋 How This Lecture Works
+
+* 📚 **Advanced patterns** — production-ready practices
+* 🎮 **Real-world scenarios** — deployment challenges
+* 📝 **3 quiz checkpoints**: PRE / MID / POST
+* 🛠️ **CI/CD integration**: GitHub Actions + Ansible
+
+**⏱️ Lecture Structure:**
+```
+Section 0: Introduction (now)     → 📝 PRE Quiz
+Section 1: The Deployment Problem
+Section 2: Blocks & Error Handling
+Section 3: Tags & Selective Execution → 📝 MID Quiz
+Section 4: Docker Compose Deployment
+Section 5: CI/CD Integration
+Section 6: Reflection             → 📝 POST Quiz
+```
+
+---
+
+## 📍 Slide 4 – ❓ The Big Question
+
+* 📊 **46%** of organizations deploy weekly or faster
+* ⏱️ Top performers deploy **multiple times per day**
+* 💥 **80%** of outages caused by changes (deploys, configs)
+
+> 💬 *"We deploy on Fridays and pray over the weekend"* — Nobody should say this
+
+**🤔 Think about it:**
+* How often does your team deploy?
+* How long does a deployment take?
+* Can you roll back in under 5 minutes?
+
+---
+
+## 📍 Slide 5 – 📝 QUIZ — DEVOPS_L6_PRE
+
+---
+
+## 📍 Slide 6 – 🔥 Section 1: The Deployment Problem
+
+* 🎰 **Deployments = high-risk events**
+* 📋 Manual steps, checklists, approval gates
+* 🌙 Deploy only during "maintenance windows"
+* 💥 Result: **fear of deploying**
+
+```mermaid
+flowchart LR
+  Ready[✅ Code Ready] --> Wait[📅 Wait for Window]
+  Wait --> Manual[📋 Manual Steps]
+  Manual --> Pray[🙏 Hope It Works]
+  Pray -->|💥 Fail| Rollback[😱 Manual Rollback]
+  Pray -->|✅ Success| Relief[😮‍💨 Temporary Relief]
+```
+
+---
+
+## 📍 Slide 7 – 💥 Deployment Failures
+
+* 🔧 Wrong version deployed
+* 📦 Missing dependencies
+* ⚙️ Configuration mismatch
+* 💀 Partial deployment (some servers updated, some not)
+
+```mermaid
+flowchart TD
+  Deploy[🚀 Deploy Started] --> S1[🖥️ Server 1: ✅ Updated]
+  Deploy --> S2[🖥️ Server 2: ❌ Failed]
+  Deploy --> S3[🖥️ Server 3: 🔄 Pending]
+  S1 --> Inconsistent[😱 Inconsistent State]
+  S2 --> Inconsistent
+  S3 --> Inconsistent
+```
+
+**📊 The Numbers:**
+* 🔍 **60%** of outages caused by bad deployments
+* ⏱️ Average recovery time: **4+ hours**
+* 💰 Cost per hour of downtime: **$300,000+**
+
+---
+
+## 📍 Slide 8 – 😱 Rollback Nightmares
+
+* 📋 "Just revert the code" — but what about:
+  * 💾 Database migrations?
+  * ⚙️ Configuration changes?
+  * 📦 Dependencies?
+* 🙈 No automated rollback = manual scramble
+* 💀 Hours of downtime
+
+> ⚠️ **If you can't roll back quickly, you shouldn't deploy**
+
+**😰 Signs of Rollback Problems:**
+* 🔇 "We've never actually tested rollback"
+* 📝 Rollback requires manual steps
+* 🐌 "Rollback takes longer than fixing forward"
+* 🚪 Nobody knows the rollback procedure
+
+---
+
+## 📍 Slide 9 – 😨 All-or-Nothing Deploys
+
+* 📅 Big-bang releases every few months
+* 🎰 Everything changes at once
+* 📋 Impossible to isolate failures
+* 💀 If it fails, everything fails
+
+> ⚠️ **Large releases = large risk**
+
+**💬 Discussion:** Would you rather deploy 100 changes once or 1 change 100 times?
+
+---
+
+## 📍 Slide 10 – 💸 The Cost of Manual Deployment
+
+| 🔥 Problem | 💥 Impact |
+|------------|-----------|
+| 🐢 Slow deployments | Features delayed |
+| 📋 Manual errors | Outages, rollbacks |
+| 👉 Inconsistent process | "Works for Alice, not Bob" |
+| 🙈 Fear of deploying | Innovation stalls |
+
+**📈 Elite vs Low Performers:**
+| Metric | 🏆 Elite | 😰 Low |
+|--------|---------|-------|
+| Deploy frequency | Multiple/day | Monthly |
+| Lead time | < 1 hour | 1-6 months |
+| Change failure rate | 0-15% | 46-60% |
+| Recovery time | < 1 hour | 1 week+ |
+
+---
+
+## 📍 Slide 11 – 💡 Section 2: Blocks & Error Handling
+
+* 🧱 **Blocks** = group related tasks
+* 🔄 **Rescue** = handle failures
+* ✅ **Always** = run regardless of outcome
+* 🎯 Production-ready error handling
+
+```mermaid
+flowchart TD
+  Block[🧱 Block] --> Try[🎯 Try Tasks]
+  Try -->|✅ Success| Always[✅ Always]
+  Try -->|❌ Failure| Rescue[🔧 Rescue]
+  Rescue --> Always
+```
+
+---
+
+## 📍 Slide 12 – 🧱 Block Syntax
+
+```yaml
+- name: Deploy application with error handling
+  block:
+    - name: Pull latest image
+      docker_image:
+        name: "{{ app_image }}"
+        source: pull
+
+    - name: Start container
+      docker_container:
+        name: "{{ app_name }}"
+        image: "{{ app_image }}"
+        state: started
+
+  rescue:
+    - name: Log failure
+      debug:
+        msg: "Deployment failed! Rolling back..."
+
+    - name: Notify team
+      uri:
+        url: "{{ slack_webhook }}"
+        method: POST
+        body: '{"text": "Deployment failed!"}'
+
+  always:
+    - name: Cleanup temp files
+      file:
+        path: /tmp/deploy
+        state: absent
+```
+
+---
+
+## 📍 Slide 13 – 🛡️ Block Benefits
+
+```mermaid
+flowchart LR
+  subgraph Without Blocks
+    T1[Task 1] --> T2[Task 2]
+    T2 -->|❌ Fail| Stop[😱 Playbook Stops]
+  end
+  subgraph With Blocks
+    B1[🧱 Block] -->|❌ Fail| R1[🔧 Rescue]
+    R1 --> A1[✅ Always]
+  end
+```
+
+**🛡️ Advantages:**
+* 🔄 Graceful error handling
+* 📊 Cleanup runs even on failure
+* 🔔 Notification on failure
+* 🎯 Apply settings to multiple tasks
+
+```yaml
+- name: Docker installation
+  block:
+    - name: Task 1
+    - name: Task 2
+    - name: Task 3
+  become: true       # 🔐 Applied to all tasks
+  when: install_docker  # 🔀 Condition for all
+  tags:
+    - docker         # 🏷️ Tag for all
+```
+
+---
+
+## 📍 Slide 14 – 🏷️ Section 3: Tags Strategy
+
+* 🏷️ **Tags** = label tasks for selective execution
+* 🎯 Run only what you need
+* ⏱️ Speed up development and testing
+* 🔧 Isolate specific operations
+
+```bash
+# Run only docker tasks
+ansible-playbook site.yml --tags "docker"
+
+# Skip common tasks
+ansible-playbook site.yml --skip-tags "common"
+
+# List available tags
+ansible-playbook site.yml --list-tags
+```
+
+---
+
+## 📍 Slide 15 – 🏷️ Tag Design Patterns
+
+```yaml
+# roles/web_app/tasks/main.yml
+- name: Application deployment
+  block:
+    - name: Pull image
+      docker_image:
+        name: "{{ app_image }}"
+        source: pull
+
+    - name: Deploy container
+      docker_container:
+        name: "{{ app_name }}"
+        image: "{{ app_image }}"
+        state: started
+  tags:
+    - app_deploy
+    - deploy
+
+- name: Application wipe
+  block:
+    - name: Remove container
+      docker_container:
+        name: "{{ app_name }}"
+        state: absent
+  when: web_app_wipe | bool
+  tags:
+    - web_app_wipe
+```
+
+**🏷️ Tag Categories:**
+* 🚀 **deploy**: Deployment tasks
+* 🧹 **wipe**: Cleanup tasks
+* 📦 **packages**: Package installation
+* ⚙️ **config**: Configuration only
+
+---
+
+## 📍 Slide 16 – ⚠️ Wipe Logic Pattern
+
+```mermaid
+flowchart TD
+  Check{🔍 web_app_wipe = true?}
+  Check -->|No| Skip[⏭️ Skip wipe tasks]
+  Check -->|Yes| TagCheck{🏷️ Limited by other --tags?}
+  TagCheck -->|Yes| Skip2[⏭️ Skip: wipe tag not selected]
+  TagCheck -->|No| Wipe[🧹 Execute wipe]
+```
+
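+**🛡️ Safety Mechanism:**
+* 📊 **Variable gate**: `web_app_wipe: false` by default — wipe never runs unless explicitly enabled
+* 🏷️ **Tag selector**: `--tags web_app_wipe` limits the run to the wipe tasks only
+* ✅ Variable alone = wipe + deploy; variable + tag = wipe only; tag alone = nothing is wiped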
+
+```bash
+# Normal deploy (wipe doesn't run)
+ansible-playbook deploy.yml
+
+# Wipe only
+ansible-playbook deploy.yml -e "web_app_wipe=true" --tags web_app_wipe
+
+# Clean reinstall (wipe + deploy)
+ansible-playbook deploy.yml -e "web_app_wipe=true"
+```
+
+---
+
+## 📍 Slide 17 – 🐳 Docker Compose Deployment
+
+```mermaid
+flowchart LR
+  Template[📝 Template] -->|Jinja2| Compose[🐳 docker-compose.yml]
+  Compose --> Deploy[🚀 Deploy]
+  Deploy --> Running[✅ Running]
+```
+
+**🐳 Why Docker Compose with Ansible?**
+* 📝 Declarative container configuration
+* 🔄 Managed by templates (dynamic values)
+* 🔧 Easy updates and rollbacks
+* 📊 Multi-container applications
+
+---
+
+## 📍 Slide 18 – 📝 Jinja2 Templates
+
+```yaml
+# roles/web_app/templates/docker-compose.yml.j2
+version: '3.8'
+
+services:
+  {{ app_name }}:
+    image: {{ docker_image }}:{{ docker_tag }}
+    container_name: {{ app_name }}
+    ports:
+      - "{{ app_port }}:{{ app_internal_port }}"
+    environment:
+{% for key, value in app_env.items() %}
+      {{ key }}: "{{ value }}"
+{% endfor %}
+    restart: unless-stopped
+    healthcheck:
+      test: ["CMD", "curl", "-f", "http://localhost:{{ app_internal_port }}/health"]
+      interval: 30s
+      timeout: 10s
+      retries: 3
+```
+
+**📊 Variables Used:**
+* 📦 `app_name`: Container name
+* 🐳 `docker_image`: Image repository
+* 🏷️ `docker_tag`: Image version
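+* 🔌 `app_port`: Exposed (host) port
+* 🔌 `app_internal_port`: Port the app listens on inside the container
+* ⚙️ `app_env`: Dictionary of environment variables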
+
+---
+
+## 📍 Slide 19 – 🚀 Deploy with Docker Compose Module
+
+```yaml
+# roles/web_app/tasks/main.yml
+- name: Create application directory
+  file:
+    path: "{{ compose_project_dir }}"
+    state: directory
+    mode: '0755'
+
+- name: Template docker-compose file
+  template:
+    src: docker-compose.yml.j2
+    dest: "{{ compose_project_dir }}/docker-compose.yml"
+    mode: '0644'
+  notify: restart app
+
+- name: Deploy with Docker Compose
+  community.docker.docker_compose_v2:
+    project_src: "{{ compose_project_dir }}"
+    state: present
+    pull: always
+  register: deploy_result
+
+- name: Verify deployment
+  uri:
+    url: "http://localhost:{{ app_port }}/health"
+    status_code: 200
+  register: health_check
+  until: health_check.status == 200
+  retries: 5
+  delay: 10
+```
+
+---
+
+## 📍 Slide 20 – 🔗 Role Dependencies
+
+```yaml
+# roles/web_app/meta/main.yml
+---
+dependencies:
+  - role: docker
+    vars:
+      docker_users:
+        - "{{ ansible_user }}"
+```
+
+**🔗 Dependency Benefits:**
+* 🔄 Automatic execution order
+* 📦 Ensures prerequisites
+* 🎯 Self-contained roles
+
+```mermaid
+flowchart LR
+  WebApp[📦 web_app role] -->|depends on| Docker[🐳 docker role]
+  Docker --> Tasks[🔧 Docker tasks run first]
+  Tasks --> WebAppTasks[🚀 Web app tasks run second]
+```
+
+---
+
+## 📍 Slide 21 – 📊 Multi-Environment Deployment
+
+```yaml
+# vars/app_python.yml
+app_name: devops-python
+docker_image: username/devops-info-service
+docker_tag: latest
+app_port: 8000
+
+# vars/app_bonus.yml
+app_name: devops-go
+docker_image: username/devops-info-service-go
+docker_tag: latest
+app_port: 8001
+```
+
+```yaml
+# playbooks/deploy_python.yml
+---
+- name: Deploy Python Application
+  hosts: webservers
+  become: true
+  vars_files:
+    - ../vars/app_python.yml
+  roles:
+    - web_app
+```
+
+**🔄 Same role, different variables!**
+
+---
+
+## 📍 Slide 22 – 🤖 CI/CD Integration
+
+```mermaid
+flowchart LR
+  Push[📤 Git Push] --> CI[🔄 GitHub Actions]
+  CI --> Lint[📋 ansible-lint]
+  Lint --> Deploy[🚀 ansible-playbook]
+  Deploy --> Verify[✅ Verification]
+```
+
+**🤖 CI/CD Benefits:**
+* 🔄 Automatic deployments on push
+* 📋 Linting catches errors early
+* 🔐 Secure credential handling
+* 📊 Audit trail of deployments
+
+---
+
+## 📍 Slide 23 – 📝 GitHub Actions Workflow
+
+```yaml
+# .github/workflows/ansible-deploy.yml
+name: Ansible Deployment
+
+on:
+  push:
+    branches: [main]
+    paths:
+      - 'ansible/**'
+
+jobs:
+  lint:
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v4
+      - name: Install ansible-lint
+        run: pip install ansible ansible-lint
+      - name: Run ansible-lint
+        run: ansible-lint ansible/playbooks/*.yml
+
+  deploy:
+    needs: lint
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v4
+      - name: Setup SSH
+        run: |
+          mkdir -p ~/.ssh
+          echo "${{ secrets.SSH_KEY }}" > ~/.ssh/id_rsa
+          chmod 600 ~/.ssh/id_rsa
+      - name: Deploy
+        run: |
+          cd ansible
+          echo "${{ secrets.VAULT_PASS }}" > .vault_pass
+          ansible-playbook playbooks/deploy.yml \
+            --vault-password-file .vault_pass
+          rm .vault_pass
+```
+
+---
+
+## 📍 Slide 24 – 🔐 Secrets in CI/CD
+
+```mermaid
+flowchart TD
+  Secrets[🔐 GitHub Secrets] --> Workflow[🔄 Workflow]
+  Workflow --> TempFile[📄 Temp File]
+  TempFile --> Ansible[🔧 Ansible]
+  Ansible --> Delete[🗑️ Delete Temp File]
+```
+
+**🔐 Security Practices:**
+* 📦 Store credentials in GitHub Secrets
+* 📄 Write to temp file during run
+* 🗑️ Delete immediately after use
+* 🚫 Never echo secrets to logs
+
+```yaml
+# Using secrets safely
+- name: Deploy with Vault
+  env:
+    VAULT_PASS: ${{ secrets.ANSIBLE_VAULT_PASSWORD }}
+  run: |
+    echo "$VAULT_PASS" > /tmp/vault_pass
+    ansible-playbook playbook.yml --vault-password-file /tmp/vault_pass
+    rm /tmp/vault_pass  # 🗑️ Cleanup!
+```
+
+---
+
+## 📍 Slide 25 – 📝 QUIZ — DEVOPS_L6_MID
+
+---
+
+## 📍 Slide 26 – 📁 Section 4: Path Filters
+
+```yaml
+on:
+  push:
+    paths:
+      - 'ansible/**'           # 📁 Only ansible changes
+      - '!ansible/docs/**'     # 📝 Exclude docs
+      - '.github/workflows/ansible-deploy.yml'
+```
+
+**📁 Path Filter Benefits:**
+* ⚡ Faster CI (skip unnecessary runs)
+* 💰 Lower costs (fewer minutes used)
+* 🎯 Focused workflows
+
+```mermaid
+flowchart TD
+  Push[📤 Push] --> Check{📁 ansible/** changed?}
+  Check -->|Yes| Run[🚀 Run Workflow]
+  Check -->|No| Skip[⏭️ Skip Workflow]
+```
+
+---
+
+## 📍 Slide 27 – 📊 Deployment Metrics
+
+| 📊 Metric | 📏 Measures | 🏆 Target |
+|-----------|------------|---------|
+| ⏱️ **Deploy Time** | Push to production | < 15 minutes |
+| 📦 **Deploy Frequency** | How often | Daily+ |
+| ❌ **Failure Rate** | Failed deploys | < 15% |
+| 🔄 **Rollback Time** | Recovery time | < 5 minutes |
+
+> 📚 These mirror the four DORA metrics: lead time for changes, deployment frequency, change failure rate, and time to restore service.
+
+**🤔 Question:** How fast can you deploy and roll back?
+
+---
+
+## 📍 Slide 28 – 🔄 Rollback Strategy
+
+```yaml
+# Rollback by re-deploying previous version
+- name: Rollback application
+  block:
+    - name: Stop current container
+      docker_container:
+        name: "{{ app_name }}"
+        state: stopped
+
+    - name: Deploy previous version
+      community.docker.docker_compose_v2:
+        project_src: "{{ compose_project_dir }}"
+        state: present
+      vars:
+        docker_tag: "{{ rollback_tag }}"
+
+    - name: Verify rollback
+      uri:
+        url: "http://localhost:{{ app_port }}/health"
+        status_code: 200
+      retries: 3
+      delay: 5
+```
+
+**🔄 Rollback Options:**
+* 🏷️ Deploy previous tag
+* 📦 Docker Compose down/up
+* 🔙 Git revert + CI/CD
+
+---
+
+## 📍 Slide 29 – 🌊 From Manual to Automated Deployment
+
+```mermaid
+flowchart LR
+  subgraph 😱 Manual
+    SSH[🔌 SSH to servers]
+    Commands[💻 Run commands]
+    Hope[🙏 Hope it works]
+  end
+  subgraph 🤖 Automated
+    Push[📤 Git push]
+    CI[🔄 CI/CD]
+    Deploy[🚀 Ansible]
+  end
+  Manual -->|🚀 Automate| Automated
+```
+
+**🎯 Automation State:**
+* ⚡ Deploy in minutes, not hours
+* 🔄 Every change through CI/CD
+* 📈 Deploy with confidence
+
+---
+
+## 📍 Slide 30 – 🏢 Section 5: Real World CI/CD
+
+## 📅 A Day with Automated Deployment
+
+**☀️ Morning:**
+* 📊 Review deployment PR
+* 👀 Check CI lint results
+* ✅ Merge to main
+
+**🌤️ Afternoon:**
+* 🤖 CI automatically deploys
+* 📊 Monitoring shows healthy
+* ☕ Coffee break
+
+**🌙 Evening:**
+* 🚨 Bug found in production
+* 🔙 Revert commit, CI deploys previous
+* ⏱️ **5 minutes** to rollback
+
+---
+
+## 📍 Slide 31 – 👥 Team Deployment Workflow
+
+| 👤 Role | 🎯 CI/CD Responsibility |
+|---------|----------------------|
+| 👨‍💻 **Developer** | Create PR, fix lint issues |
+| 🔧 **DevOps** | Maintain workflows, roles |
+| 👀 **Reviewer** | Approve changes |
+| 🤖 **CI/CD** | Execute deployment |
+
+**🔗 GitOps Workflow:**
+```mermaid
+flowchart LR
+  PR[📝 Pull Request] --> Review[👀 Review]
+  Review --> Merge[✅ Merge]
+  Merge --> CI[🔄 CI/CD]
+  CI --> Deploy[🚀 Deploy]
+  Deploy --> Prod[🌐 Production]
+```
+
+---
+
+## 📍 Slide 32 – 🔀 Deployment Strategies
+
+```mermaid
+flowchart TD
+  subgraph Rolling
+    R1[🔄 Update 1 at a time]
+  end
+  subgraph Blue-Green
+    BG1[🔵 Blue: Current]
+    BG2[🟢 Green: New]
+  end
+  subgraph Canary
+    C1[🐤 Small % first]
+    C2[📊 Monitor]
+    C3[🚀 Full rollout]
+  end
+```
+
+| 🚀 Strategy | 🎯 Use Case |
+|------------|----------|
+| 🔄 **Rolling** | Gradual update, zero downtime |
+| 🔵 **Blue-Green** | Instant switch, easy rollback |
+| 🐤 **Canary** | Test with subset of users |
+
+---
+
+## 📍 Slide 33 – 🧪 Deployment Verification
+
+```yaml
+# Verify deployment success
+- name: Wait for application
+  uri:
+    url: "http://{{ ansible_host }}:{{ app_port }}/health"
+    status_code: 200
+    return_content: yes
+  register: health_check
+  until: health_check.status == 200
+  retries: 10
+  delay: 6
+
+- name: Run smoke tests
+  command: "curl -f http://{{ ansible_host }}:{{ app_port }}/"
+  register: smoke_test
+  failed_when: smoke_test.rc != 0
+
+- name: Log deployment success
+  debug:
+    msg: "✅ Deployment verified: {{ app_name }} is healthy"
+```
+
+---
+
+## 📍 Slide 34 – 📈 Career Path: CD Skills
+
+```mermaid
+flowchart LR
+  Junior[🌱 Junior: Manual deploys] --> Mid[💼 Mid: CI/CD pipelines]
+  Mid --> Senior[⭐ Senior: Zero-downtime strategies]
+  Senior --> Principal[🏆 Principal: Platform architecture]
+```
+
+**🛠️ Skills to Build:**
+* 🔄 CI/CD pipeline design
+* 🐳 Container orchestration
+* 📊 Monitoring and alerting
+* 🔙 Rollback strategies
+* 🔐 Security in pipelines
+
+---
+
+## 📍 Slide 35 – 🌍 Real Company Examples
+
+**🏢 Enterprise CD:**
+* 📦 **Amazon**: Deploy every 11.7 seconds
+* 🎬 **Netflix**: Canary deployments everywhere
+* 🔍 **Google**: Feature flags for gradual rollout
+
+**☁️ CD Practices:**
+* 🏦 **Stripe**: Shadow traffic for testing
+* 📦 **Etsy**: 50+ deploys per day
+* 🎮 **Spotify**: Squad-based ownership
+
+**📊 Stats:**
+* 🚀 Elite teams deploy **on demand**
+* ⏱️ Lead time: **less than 1 hour**
+* 🔄 Recovery: **less than 1 hour**
+
+---
+
+## 📍 Slide 36 – 🎯 Section 6: Reflection
+
+## 📝 Key Takeaways
+
+1. 🧱 **Blocks** enable graceful error handling
+2. 🏷️ **Tags** allow selective execution
+3. 🐳 **Docker Compose** templates for flexible deployments
+4. 🔗 **Role dependencies** ensure proper ordering
+5. 🤖 **CI/CD** automates the entire process
+
+> 💡 Small, frequent deployments are safer than big releases.
+
+---
+
+## 📍 Slide 37 – 🧠 The Mindset Shift
+
+| 😰 Old Mindset | 🚀 CD Mindset |
+|---------------|------------------|
+| 🙅 "Deploy on weekends" | 🚀 "Deploy anytime" |
+| 🚫 "Big releases quarterly" | 🔄 "Small releases daily" |
+| 👉 "Manual verification" | 🤖 "Automated checks" |
+| 😨 "Rollback is hard" | 💪 "Rollback in minutes" |
+| 💻 "It works locally" | 🌍 "CI validates it" |
+
+> ❓ Which mindset describes your team?
+
+---
+
+## 📍 Slide 38 – ✅ Your Progress
+
+## 🎓 What You Now Understand
+
+* ✅ Blocks with rescue and always
+* ✅ Tag strategies for selective execution
+* ✅ Docker Compose templates with Jinja2
+* ✅ Role dependencies and ordering
+* ✅ CI/CD integration with GitHub Actions
+
+> 🚀 **You're ready for Lab 6: Advanced Ansible & CI/CD**
+
+---
+
+## 📍 Slide 39 – 📝 QUIZ — DEVOPS_L6_POST
+
+---
+
+## 📍 Slide 40 – 🚀 What Comes Next
+
+## 📚 Next Lecture: Observability & Logging
+
+* 📋 Log aggregation with Loki
+* 📊 Visualization with Grafana
+* 🔍 LogQL query language
+* 💻 Hands-on: Building a logging stack
+
+**🎉 Your continuous deployment journey continues.**
+
+> 🚀 From manual deploys to automated CI/CD — one commit at a time.
+
+```mermaid
+flowchart LR
+  You[👤 You] --> CICD[🤖 CI/CD Skills]
+  CICD --> Automated[🚀 Automated Deploys]
+  Automated --> Career[🚀 Career Growth]
+```
+
+**👋 See you in the next lecture!**
+
+---
+
+## 📚 Resources & Further Reading
+
+**📕 Books:**
+* 📖 *Continuous Delivery* — Jez Humble & David Farley
+* 📖 *The DevOps Handbook* — Gene Kim et al.
+* 📖 *Accelerate* — Nicole Forsgren, Jez Humble & Gene Kim
+
+**🔗 Links:**
+* 🌐 [Ansible Blocks](https://docs.ansible.com/ansible/latest/playbook_guide/playbooks_blocks.html)
+* 🌐 [Ansible Tags](https://docs.ansible.com/ansible/latest/playbook_guide/playbooks_tags.html)
+* 🌐 [GitHub Actions](https://docs.github.com/en/actions)
+
+---
diff --git a/lectures/lec7.md b/lectures/lec7.md
new file mode 100644
index 0000000000..b00d0ad39f
--- /dev/null
+++ b/lectures/lec7.md
@@ -0,0 +1,849 @@
+# 📌 Lecture 7 — Observability & Logging: From Blind to Insight
+
+## 📍 Slide 1 – 🚀 Welcome to Observability
+
+* 🌍 **Applications are running** — but what's happening inside?
+* 😰 Without visibility, debugging is guesswork
+* 🔍 **Observability** = understanding system state from outputs
+* 🎯 This lecture: master logging with Loki, Promtail, and Grafana
+
+```mermaid
+flowchart LR
+  App[📦 Application] -->|📋 Logs| Collect[🔧 Promtail]
+  Collect --> Store[💾 Loki]
+  Store --> View[📊 Grafana]
+  View --> Insight[💡 Insight]
+```
+
+---
+
+## 📍 Slide 2 – 🎯 What You Will Learn
+
+* ✅ Understand the three pillars of observability
+* ✅ Deploy Loki stack for log aggregation
+* ✅ Query logs with LogQL
+* ✅ Build effective log dashboards
+
+**🎓 Learning Outcomes:**
+| # | Outcome |
+|---|---------|
+| 1 | 🧠 Differentiate logs, metrics, and traces |
+| 2 | 🔍 Configure Loki 3.0 with TSDB storage |
+| 3 | 🛠️ Write LogQL queries for filtering and aggregation |
+| 4 | 🗺️ Design actionable log dashboards |
+
+---
+
+## 📍 Slide 3 – 📋 How This Lecture Works
+
+* 📚 **Concepts + Configuration** — hands-on focus
+* 🎮 **Real-world scenarios** — debugging production issues
+* 📝 **3 quiz checkpoints**: PRE / MID / POST
+* 🛠️ **Tool stack**: Loki + Promtail + Grafana
+
+**⏱️ Lecture Structure:**
+```
+Section 0: Introduction (now)     → 📝 PRE Quiz
+Section 1: The Visibility Problem
+Section 2: Observability Fundamentals
+Section 3: Loki Stack Deep Dive   → 📝 MID Quiz
+Section 4: LogQL & Dashboards
+Section 5: Production Logging
+Section 6: Reflection             → 📝 POST Quiz
+```
+
+---
+
+## 📍 Slide 4 – ❓ The Big Question
+
+* 📊 **70%** of mean time to resolution is spent finding the problem
+* ⏱️ Average time to detect issues: **hours to days**
+* 💥 Without observability, debugging is **archaeology**
+
+> 💬 *"Users reported it's slow... but where?"* — Every on-call engineer, ever
+
+**🤔 Think about it:**
+* How do you know your app is healthy?
+* When users report issues, where do you look first?
+* Can you trace a request through your system?
+
+---
+
+## 📍 Slide 5 – 📝 QUIZ — DEVOPS_L7_PRE
+
+---
+
+## 📍 Slide 6 – 🔥 Section 1: The Visibility Problem
+
+* 🙈 **No logs** = flying blind
+* 📋 Logs scattered across servers
+* 🔍 grep through SSH sessions
+* 💥 Result: **hours spent finding problems**
+
+```mermaid
+flowchart LR
+  Issue[🚨 Issue Reported] --> SSH1[🔌 SSH to Server 1]
+  SSH1 --> Grep1[🔍 grep logs]
+  Grep1 --> SSH2[🔌 SSH to Server 2]
+  SSH2 --> Grep2[🔍 grep logs]
+  Grep2 --> Hours[⏱️ Hours Later...]
+```
+
+---
+
+## 📍 Slide 7 – 📋 Log Chaos
+
+* 📁 Logs in different formats
+* 🖥️ Different locations per server
+* 📅 Old logs deleted or rotated
+* 💀 No correlation between services
+
+```mermaid
+flowchart TD
+  App1[📦 App 1: JSON logs]
+  App2[📦 App 2: Plain text]
+  App3[📦 App 3: Custom format]
+  App1 --> Chaos[😱 No Unified View]
+  App2 --> Chaos
+  App3 --> Chaos
+```
+
+**📊 The Numbers:**
+* 🔍 **73%** of engineers can't find logs quickly
+* ⏱️ Average time to find relevant log: **15+ minutes**
+* 💰 Cost of slow debugging: **$26,000/hour** (enterprise)
+
+---
+
+## 📍 Slide 8 – 😱 "It's Working for Me"
+
+* 👥 Users report: *"App is slow"*
+* 🤷 Team responds: *"Works for me"*
+* 🔍 No data to prove either side
+* 💀 Frustration all around
+
+> ⚠️ **Without observability, you can't prove anything**
+
+**😰 Signs of Poor Observability:**
+* 🔇 "Check the server logs" (which server?)
+* 📝 "It was working yesterday" (what changed?)
+* 🐌 "Let's restart and see" (cargo cult debugging)
+* 🚪 Blame instead of data
+
+**💬 Discussion:** How do you currently debug production issues?
+
+---
+
+## 📍 Slide 9 – 🔥 The Alert Fatigue Problem
+
+* 🚨 Too many alerts = no alerts
+* 📧 Inbox full of "warnings"
+* 😴 Real issues get ignored
+* 💀 On-call burnout
+
+> ⚠️ **Noise drowns out signal**
+
+```mermaid
+flowchart LR
+  Alerts[🚨 1000 Alerts/day] --> Ignore[😴 Alert Fatigue]
+  Ignore --> Miss[🙈 Miss Real Issues]
+  Miss --> Outage[💥 Production Outage]
+```
+
+---
+
+## 📍 Slide 10 – 💸 The Cost of Blind Operations
+
+| 🔥 Problem | 💥 Impact |
+|------------|-----------|
+| 🐢 Slow debugging | Hours/days to resolve |
+| 📋 No correlation | Can't trace requests |
+| 👉 Finger pointing | No data, just blame |
+| 🙈 Hidden failures | Issues go unnoticed |
+
+**📈 Real Numbers:**
+* 🏢 **MTTR without observability**: 4+ hours
+* 🚀 **MTTR with observability**: < 30 minutes
+* 💰 **ROI of observability**: 10x+ reduction in incident cost
+
+**💰 Cost Example:**
+* 💵 1-hour outage: **$300,000**
+* 🔍 Good observability: **$30/month**
+* 🧮 Break-even: **less than 1 second of prevented downtime** ($300,000/hour ≈ $83/second)
+
+---
+
+## 📍 Slide 11 – 💡 Section 2: What Observability Is
+
+* 🔍 **Observability** = understanding system state from external outputs
+* 📊 **Three pillars**: Logs, Metrics, Traces
+* 🎯 Answer: "Why is this happening?"
+* 🚫 NOT just monitoring (which asks "Is it working?")
+
+```mermaid
+flowchart TD
+  Obs[🔍 Observability]
+  Obs --> Logs[📋 Logs: What happened]
+  Obs --> Metrics[📊 Metrics: How much]
+  Obs --> Traces[🔗 Traces: Where/how long]
+```
+
+**📖 Definition:**
+> *Observability is the ability to understand the internal state of a system by examining its external outputs — logs, metrics, and traces.*
+
+---
+
+## 📍 Slide 12 – 📋 The Three Pillars
+
+| 📊 Pillar | 🎯 Answers | 🛠️ Tools |
+|-----------|-----------|----------|
+| 📋 **Logs** | What happened? | Loki, ELK |
+| 📊 **Metrics** | How much/fast? | Prometheus |
+| 🔗 **Traces** | Where did time go? | Jaeger, Tempo |
+
+```mermaid
+flowchart LR
+  subgraph Logs
+    L1[📝 Error: Connection refused]
+  end
+  subgraph Metrics
+    M1[📈 99.9% availability]
+  end
+  subgraph Traces
+    T1[🔗 Request: 250ms total]
+  end
+```
+
+**🎯 Together they tell the full story**
+
+---
+
+## 📍 Slide 13 – 📋 Logs: What Happened
+
+* 📝 **Events** with timestamps
+* 🔍 Detailed context for debugging
+* 📊 Can be structured (JSON) or unstructured
+* ⚠️ High volume, high storage
+
+```json
+{
+  "timestamp": "2024-01-15T10:23:45Z",
+  "level": "ERROR",
+  "service": "user-api",
+  "message": "Database connection failed",
+  "error": "Connection refused",
+  "host": "server-1"
+}
+```
+
+**🎯 Use logs when:**
+* 🔍 Debugging specific errors
+* 📋 Understanding request flow
+* 🛡️ Security auditing
+
+---
+
+## 📍 Slide 14 – 📊 Why Structured Logging?
+
+```mermaid
+flowchart LR
+  subgraph ❌ Unstructured
+    U1[ERROR: Failed to connect to db at 10:23]
+  end
+  subgraph ✅ Structured
+    S1[JSON with fields]
+  end
+  U1 --> Hard[😰 Hard to parse]
+  S1 --> Easy[✅ Easy to query]
+```
+
+**❌ Unstructured:**
+```
+ERROR 2024-01-15 10:23:45 Connection to database failed on server-1
+```
+
+**✅ Structured (JSON):**
+```json
+{"timestamp":"2024-01-15T10:23:45Z","level":"ERROR","msg":"Connection failed","server":"server-1"}
+```
+
+**🎯 Benefits:**
+* 🔍 Easy to filter and search
+* 📊 Aggregate by any field
+* 🤖 Machine-parseable
+
+---
+
+## 📍 Slide 15 – ⚡ Loki vs ELK
+
+| 📋 Aspect | 📊 Loki | 🔍 ELK Stack |
+|-----------|---------|-------------|
+| 🏗️ Architecture | Lightweight | Heavy |
+| 💾 Storage | Index labels only | Full-text index |
+| 📊 Query | LogQL | Lucene |
+| 💰 Cost | Low (storage) | High (compute) |
+| 🎯 Best for | Cloud-native | Enterprise search |
+
+```mermaid
+flowchart LR
+  Loki[📊 Loki] -->|Labels| Index1[🏷️ Small Index]
+  ELK[🔍 ELK] -->|Full Text| Index2[📚 Large Index]
+  Index1 --> Cost1[💰 Low Cost]
+  Index2 --> Cost2[💸 High Cost]
+```
+
+> 🔥 **Loki**: "Like Prometheus, but for logs"
+
+---
+
+## 📍 Slide 16 – 🎮 Section 3: Loki Stack Deep Dive
+
+## 🏗️ Loki Architecture
+
+* 💾 **Loki**: Log storage (index + chunks)
+* 🔧 **Promtail**: Log collector (agent)
+* 📊 **Grafana**: Visualization
+
+```mermaid
+flowchart LR
+  App1[📦 App 1] --> Promtail[🔧 Promtail]
+  App2[📦 App 2] --> Promtail
+  Promtail -->|Push| Loki[💾 Loki]
+  Loki --> Grafana[📊 Grafana]
+```
+
+**🎮 Let's build a logging stack.**
+
+---
+
+## 📍 Slide 17 – 💾 Loki 3.0 Features
+
+* 🚀 **TSDB index**: 10x faster queries
+* 📊 **Structured metadata**: First-class support
+* 💾 **Better compression**: Lower storage costs
+* 🔍 **Schema v13**: Latest and recommended
+
+```yaml
+# loki/config.yml
+schema_config:
+  configs:
+    - from: 2024-01-01
+      store: tsdb        # 🚀 New fast store
+      object_store: filesystem
+      schema: v13        # 📊 Latest schema
+      index:
+        prefix: index_
+        period: 24h
+```
+
+**🎯 Always use TSDB for new deployments!**
+
+---
+
+## 📍 Slide 18 – ⚙️ Loki Configuration
+
+```yaml
+# loki/config.yml
+auth_enabled: false
+
+server:
+  http_listen_port: 3100
+
+common:
+  path_prefix: /loki
+  storage:
+    filesystem:
+      chunks_directory: /loki/chunks
+      rules_directory: /loki/rules
+  replication_factor: 1
+  ring:
+    instance_addr: 127.0.0.1
+    kvstore:
+      store: inmemory
+
+limits_config:
+  retention_period: 168h  # 🗓️ 7 days
+```
+
+**🔑 Key Settings:**
+* 🔐 `auth_enabled`: False for testing
+* 💾 `storage`: Where logs are stored
+* 🗓️ `retention_period`: How long to keep logs (only enforced when the compactor runs with `retention_enabled: true`)
+
+---
+
+## 📍 Slide 19 – 🔧 Promtail Configuration
+
+```yaml
+# promtail/config.yml
+server:
+  http_listen_port: 9080
+
+positions:
+  filename: /tmp/positions.yaml
+
+clients:
+  - url: http://loki:3100/loki/api/v1/push
+
+scrape_configs:
+  - job_name: docker
+    docker_sd_configs:
+      - host: unix:///var/run/docker.sock
+        refresh_interval: 5s
+    relabel_configs:
+      - source_labels: ['__meta_docker_container_name']
+        regex: '/(.*)'
+        target_label: 'container'
+```
+
+**🔑 Key Components:**
+* 📋 `positions`: Track what's been read
+* 🔗 `clients`: Where to send logs
+* 🐳 `docker_sd_configs`: Auto-discover containers
+
+---
+
+## 📍 Slide 20 – 🐳 Docker Compose Stack
+
+```yaml
+# docker-compose.yml
+version: '3.8'
+
+services:
+  loki:
+    image: grafana/loki:3.0.0
+    ports:
+      - "3100:3100"
+    volumes:
+      - ./loki/config.yml:/etc/loki/config.yml
+      - loki-data:/loki
+    command: -config.file=/etc/loki/config.yml
+
+  promtail:
+    image: grafana/promtail:3.0.0
+    volumes:
+      - ./promtail/config.yml:/etc/promtail/config.yml
+      - /var/lib/docker/containers:/var/lib/docker/containers:ro
+      - /var/run/docker.sock:/var/run/docker.sock:ro
+    command: -config.file=/etc/promtail/config.yml
+
+  grafana:
+    image: grafana/grafana:11.3.0
+    ports:
+      - "3000:3000"
+    volumes:
+      - grafana-data:/var/lib/grafana
+```
+
+---
+
+## 📍 Slide 21 – 🏷️ Labels: The Key Concept
+
+```mermaid
+flowchart TD
+  Log[📋 Log Entry] --> Labels[🏷️ Labels]
+  Labels --> App[app=web-api]
+  Labels --> Env[env=production]
+  Labels --> Level[level=error]
+  App --> Query[🔍 Query by Labels]
+  Env --> Query
+  Level --> Query
+```
+
+**🏷️ Labels = How Loki indexes logs**
+
+```logql
+# Query logs by labels
+{app="web-api", env="production"}
+
+# Filter errors
+{app="web-api"} |= "error"
+```
+
+**⚠️ Label Best Practices:**
+* 🔢 Keep cardinality low (< 10 values per label)
+* 🚫 Never use high-cardinality fields (user IDs, request IDs)
+* 🏷️ Use for: app name, environment, service
+
+---
+
+## 📍 Slide 22 – 🔍 LogQL Basics
+
+```mermaid
+flowchart LR
+  Selector[🏷️ Stream Selector] --> Filter[🔍 Line Filter]
+  Filter --> Parser[📊 Parser]
+  Parser --> Result[📋 Results]
+```
+
+**🔍 Query Structure:**
+```logql
+{label="value"} |= "filter" | json | field="value"
+```
+
+**📋 Examples:**
+```logql
+# All logs from container
+{container="web-api"}
+
+# Errors only
+{container="web-api"} |= "error"
+
+# Parse JSON, filter by level
+{container="web-api"} | json | level="ERROR"
+
+# Per-second error rate, averaged over the last minute
+rate({container="web-api"} |= "error" [1m])
+```
+
+---
+
+## 📍 Slide 23 – 📊 LogQL Operators
+
+| 🔧 Operator | 🎯 Purpose | 📝 Example |
+|-------------|----------|---------|
+| `\|=` | Contains | `\|= "error"` |
+| `!=` | Not contains | `!= "debug"` |
+| `\|~` | Regex match | `\|~ "error\|warn"` |
+| `\| json` | Parse JSON | `\| json` |
+| `\| logfmt` | Parse logfmt | `\| logfmt` |
+| `rate()` | Logs per second | `rate({app="x"}[5m])` |
+
+**📊 Aggregation:**
+```logql
+# Logs per second by container
+sum by (container) (rate({job="docker"}[1m]))
+
+# Count by level
+sum by (level) (count_over_time({app="web"} | json [5m]))
+```
+
+---
+
+## 📍 Slide 24 – 🐍 Structured Logging in Python
+
+```python
+import logging
+import json
+from datetime import datetime
+
+class JSONFormatter(logging.Formatter):
+    def format(self, record):
+        log_obj = {
+            "timestamp": datetime.utcnow().isoformat() + "Z",
+            "level": record.levelname,
+            "message": record.getMessage(),
+            "logger": record.name,
+        }
+        if record.exc_info:
+            log_obj["exception"] = self.formatException(record.exc_info)
+        return json.dumps(log_obj)
+
+# Setup
+handler = logging.StreamHandler()
+handler.setFormatter(JSONFormatter())
+logger = logging.getLogger()
+logger.addHandler(handler)
+logger.setLevel(logging.INFO)
+
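+# Usage (note: the formatter above does not emit `extra` fields such as user_id; add them to log_obj to include them)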
+logger.info("User logged in", extra={"user_id": 123})
+```
+
+---
+
+## 📍 Slide 25 – 📝 QUIZ — DEVOPS_L7_MID
+
+---
+
+## 📍 Slide 26 – 📊 Section 4: Building Dashboards
+
+## 🎨 Dashboard Design Principles
+
+* 🎯 **Purpose**: What question does it answer?
+* 📊 **Hierarchy**: Most important at top
+* 🎨 **Color**: Red = bad, Green = good
+* 🔄 **Refresh**: Auto-refresh for real-time
+
+```mermaid
+flowchart TD
+  Top[🚨 Alerts & Errors]
+  Top --> Middle[📊 Request Rates]
+  Middle --> Bottom[📋 Log Stream]
+```
+
+---
+
+## 📍 Slide 27 – 📊 Essential Log Panels
+
+**1️⃣ Log Stream (Logs visualization)**
+```logql
+{app=~"devops-.*"}
+```
+
+**2️⃣ Error Rate (Time series)**
+```logql
+sum by (app) (rate({app=~"devops-.*"} |= "ERROR" [1m]))
+```
+
+**3️⃣ Request Rate (Time series)**
+```logql
+sum by (app) (rate({app=~"devops-.*"} [1m]))
+```
+
+**4️⃣ Level Distribution (Pie chart)**
+```logql
+sum by (level) (count_over_time({app=~"devops-.*"} | json [5m]))
+```
+
+---
+
+## 📍 Slide 28 – 📊 Grafana Panel Types
+
+| 📊 Type | 🎯 Use For |
+|---------|----------|
+| 📋 **Logs** | Raw log entries |
+| 📈 **Time series** | Trends over time |
+| 📊 **Stat** | Single values |
+| 🥧 **Pie chart** | Distribution |
+| 📋 **Table** | Structured data |
+| 🌡️ **Gauge** | Current status |
+
+```mermaid
+flowchart LR
+  Logs[📋 Logs] --> Debug[🔍 Debugging]
+  TimeSeries[📈 Time Series] --> Trends[📊 Trends]
+  Stat[📊 Stat] --> KPIs[🎯 KPIs]
+```
+
+---
+
+## 📍 Slide 29 – 📊 Logging Metrics
+
+| 📊 Metric | 📏 Measures | 🏆 Target |
+|-----------|------------|---------|
+| 📋 **Log Volume** | Logs per second | Stable |
+| ❌ **Error Rate** | Error logs as % of all logs | < 1% |
+| ⏱️ **Query Time** | Time to find logs | < 30s |
+| 💾 **Retention** | How long kept | 7+ days |
+
+> 📚 These metrics indicate logging health.
+
+**🤔 Question:** How quickly can you find relevant logs?
+
+---
+
+## 📍 Slide 30 – 🌊 From Blind to Observable
+
+```mermaid
+flowchart LR
+  subgraph 😱 Blind
+    SSH[🔌 SSH grep]
+    Guess[🤷 Guesswork]
+    Slow[⏱️ Hours]
+  end
+  subgraph 🔍 Observable
+    Dashboard[📊 Dashboard]
+    Query[🔍 LogQL]
+    Fast[⚡ Minutes]
+  end
+  Blind -->|🚀 Loki| Observable
+```
+
+**🎯 Observability State:**
+* ⚡ Find issues in minutes, not hours
+* 🔄 Unified view across all services
+* 📈 Data-driven debugging
+
+---
+
+## 📍 Slide 31 – 🏢 Section 5: Production Logging
+
+## 📅 A Day with Observability
+
+**☀️ Morning:**
+* 📊 Check Grafana dashboard — all green ✅
+* 📋 Review overnight logs — no anomalies
+* ☕ Coffee with confidence
+
+**🌤️ Afternoon:**
+* 🚨 Alert: Error rate spike
+* 🔍 LogQL: `{app="api"} |= "ERROR" | json | level="ERROR"`
+* 🔧 Found: Database timeout
+* ⏱️ **10 minutes** to identify root cause
+
+**🌙 Evening:**
+* 📊 Review error trends
+* 📝 Create runbook for similar issues
+* 🏠 Go home knowing you can debug remotely
+
+---
+
+## 📍 Slide 32 – 👥 Team Logging Workflow
+
+| 👤 Role | 🎯 Observability Responsibility |
+|---------|----------------------|
+| 👨‍💻 **Developer** | Add structured logging |
+| 🔧 **DevOps** | Maintain logging stack |
+| 🛡️ **SRE** | Build dashboards, respond to alerts |
+| 📊 **On-call** | Use logs for incident response |
+
+**🔗 Incident Response Flow:**
+```mermaid
+flowchart LR
+  Alert[🚨 Alert] --> Dashboard[📊 Dashboard]
+  Dashboard --> LogQL[🔍 LogQL Query]
+  LogQL --> RootCause[🎯 Root Cause]
+  RootCause --> Fix[🔧 Fix]
+```
+
+---
+
+## 📍 Slide 33 – 🔐 Production Considerations
+
+```yaml
+# Production settings
+deploy:
+  resources:
+    limits:
+      memory: 1G
+      cpus: '1.0'
+    reservations:
+      memory: 512M
+
+healthcheck:
+  test: ["CMD", "wget", "--no-verbose", "--tries=1", "--spider", "http://localhost:3100/ready"]
+  interval: 10s
+  timeout: 5s
+  retries: 5
+```
+
+**🛡️ Production Checklist:**
+* 💾 Persistent volumes for data
+* 🔐 Secure Grafana (disable anonymous)
+* 📊 Resource limits on all services
+* 🏥 Health checks enabled
+* 🗓️ Retention policies configured
+
+---
+
+## 📍 Slide 34 – 📈 Career Path: Observability Skills
+
+```mermaid
+flowchart LR
+  Junior[🌱 Junior: Basic logging] --> Mid[💼 Mid: Structured logging & dashboards]
+  Mid --> Senior[⭐ Senior: Full observability stack]
+  Senior --> Principal[🏆 Principal: Observability strategy]
+```
+
+**🛠️ Skills to Build:**
+* 📋 Structured logging patterns
+* 🔍 LogQL/PromQL fluency
+* 📊 Dashboard design
+* 🚨 Alerting strategies
+* 🔗 Distributed tracing
+
+---
+
+## 📍 Slide 35 – 🌍 Real Company Examples
+
+**🏢 Observability Leaders:**
+* 🎬 **Netflix**: Custom observability platform
+* 🔍 **Google**: Invented Dapper (tracing)
+* 📦 **Uber**: Jaeger (open-source tracing)
+
+**☁️ Modern Practices:**
+* 🏦 **Stripe**: Structured logging everywhere
+* 📦 **Spotify**: Centralized logging for 1000+ microservices
+* 🎮 **Riot Games**: Real-time game telemetry
+
+**📊 Stats:**
+* 🔍 **80%** of debugging time is finding problems
+* ⏱️ Good observability reduces MTTR by **70%+**
+* 💰 ROI: **10-100x** in reduced incident costs
+
+---
+
+## 📍 Slide 36 – 🎯 Section 6: Reflection
+
+## 📝 Key Takeaways
+
+1. 🔍 **Observability = Logs + Metrics + Traces**
+2. 📋 **Structured logging** enables powerful queries
+3. 🏷️ **Labels** are how Loki indexes (keep cardinality low)
+4. 📊 **LogQL** is your query language
+5. 📈 **Dashboards** provide unified visibility
+
+> 💡 You can't fix what you can't see. Observability gives you eyes.
+
+---
+
+## 📍 Slide 37 – 🧠 The Mindset Shift
+
+| 😰 Old Mindset | 🔍 Observable Mindset |
+|---------------|------------------|
+| 🙅 "SSH and grep" | 📊 "Query Grafana" |
+| 🚫 "Check the logs somewhere" | 🔍 "All logs in one place" |
+| 👉 "It's probably X" | 📊 "Data shows it's Y" |
+| 😨 "Debugging takes hours" | ⚡ "Root cause in minutes" |
+| 💻 "Works on my machine" | 🌍 "Production shows different" |
+
+> ❓ Which mindset describes your team?
+
+---
+
+## 📍 Slide 38 – ✅ Your Progress
+
+## 🎓 What You Now Understand
+
+* ✅ The three pillars of observability
+* ✅ Loki architecture and configuration
+* ✅ LogQL query syntax
+* ✅ Building effective dashboards
+* ✅ Production logging best practices
+
+> 🚀 **You're ready for Lab 7: Loki Logging Stack**
+
+---
+
+## 📍 Slide 39 – 📝 QUIZ — DEVOPS_L7_POST
+
+---
+
+## 📍 Slide 40 – 🚀 What Comes Next
+
+## 📚 Next Lecture: Monitoring with Prometheus
+
+* 📊 Metrics collection and storage
+* 🔢 PromQL query language
+* 📈 Application instrumentation
+* 💻 Hands-on: Building metrics dashboards
+
+**🎉 Your observability journey continues.**
+
+> 🔍 From blind operations to insight — one query at a time.
+
+```mermaid
+flowchart LR
+  You[👤 You] --> Obs[🔍 Observability Skills]
+  Obs --> Insight[💡 System Insight]
+  Insight --> Career[🚀 Career Growth]
+```
+
+**👋 See you in the next lecture!**
+
+---
+
+## 📚 Resources & Further Reading
+
+**📕 Books:**
+* 📖 *Observability Engineering* — Charity Majors, Liz Fong-Jones & George Miranda
+* 📖 *Distributed Systems Observability* — Cindy Sridharan
+* 📖 *The Art of Monitoring* — James Turnbull
+
+**🔗 Links:**
+* 🌐 [Grafana Loki Documentation](https://grafana.com/docs/loki/latest/)
+* 🌐 [LogQL Reference](https://grafana.com/docs/loki/latest/query/)
+* 🌐 [Promtail Configuration](https://grafana.com/docs/loki/latest/send-data/promtail/)
+
+---
diff --git a/lectures/lec8.md b/lectures/lec8.md
new file mode 100644
index 0000000000..0b921df100
--- /dev/null
+++ b/lectures/lec8.md
@@ -0,0 +1,799 @@
+# 📌 Lecture 8 — Monitoring with Prometheus: From Guessing to Measuring
+
+## 📍 Slide 1 – 🚀 Welcome to Metrics Monitoring
+
+* 🌍 **Logs tell you what happened** — but how much and how fast?
+* 😰 Without metrics, capacity planning is guesswork
+* 📊 **Prometheus** = the industry standard for metrics
+* 🎯 This lecture: master metrics collection, PromQL, and dashboards
+
+```mermaid
+flowchart LR
+  App[📦 Application] -->|📊 Metrics| Prometheus[💾 Prometheus]
+  Prometheus --> Grafana[📊 Grafana]
+  Grafana --> Insight[💡 Insight]
+```
+
+---
+
+## 📍 Slide 2 – 🎯 What You Will Learn
+
+* ✅ Understand metrics types and instrumentation
+* ✅ Configure Prometheus for metrics collection
+* ✅ Query metrics with PromQL
+* ✅ Build effective monitoring dashboards
+
+**🎓 Learning Outcomes:**
+| # | Outcome |
+|---|---------|
+| 1 | 🧠 Differentiate Counter, Gauge, Histogram |
+| 2 | 🔍 Configure Prometheus scrape targets |
+| 3 | 🛠️ Write PromQL queries for analysis |
+| 4 | 🗺️ Design RED method dashboards |
+
+---
+
+## 📍 Slide 3 – 📋 How This Lecture Works
+
+* 📚 **Concepts + Instrumentation** — hands-on focus
+* 🎮 **Real-world scenarios** — performance monitoring
+* 📝 **3 quiz checkpoints**: PRE / MID / POST
+* 🛠️ **Methods**: RED, USE, Four Golden Signals
+
+**⏱️ Lecture Structure:**
+```
+Section 0: Introduction (now)     → 📝 PRE Quiz
+Section 1: The Monitoring Problem
+Section 2: Prometheus Fundamentals
+Section 3: Application Instrumentation → 📝 MID Quiz
+Section 4: PromQL & Dashboards
+Section 5: Production Monitoring
+Section 6: Reflection             → 📝 POST Quiz
+```
+
+---
+
+## 📍 Slide 4 – ❓ The Big Question
+
+* 📊 **83%** of organizations can't predict performance issues
+* ⏱️ Average time to detect capacity problems: **too late**
+* 💥 Without metrics, you're **reactive, not proactive**
+
+> 💬 *"Is the server slow or is it just me?"* — Everyone, always
+
+**🤔 Think about it:**
+* How do you know if your app can handle more load?
+* When did response times start degrading?
+* How much headroom do you have?
+
+---
+
+## 📍 Slide 5 – 📝 QUIZ — DEVOPS_L8_PRE
+
+---
+
+## 📍 Slide 6 – 🔥 Section 1: The Monitoring Problem
+
+* 🤷 **No metrics** = can't measure performance
+* 📊 Users complain before you know there's a problem
+* 🔍 Can't identify bottlenecks
+* 💥 Result: **reactive firefighting**
+
+```mermaid
+flowchart LR
+  Users[👥 Users Complain] --> Support[📞 Support Ticket]
+  Support --> Team[👨‍💻 Team Investigates]
+  Team --> Guess[🤷 Guesswork]
+  Guess --> Hours[⏱️ Hours Later...]
+```
+
+---
+
+## 📍 Slide 7 – 📊 Metrics vs Logs
+
+```mermaid
+flowchart TD
+  subgraph 📋 Logs
+    L1[What happened?]
+    L2[Detailed events]
+    L3[High cardinality]
+  end
+  subgraph 📊 Metrics
+    M1[How much/fast?]
+    M2[Aggregated numbers]
+    M3[Low cardinality]
+  end
+```
+
+| 📋 Aspect | 📊 Metrics | 📝 Logs |
+|-----------|----------|---------|
+| 🎯 Question | How much? | What happened? |
+| 📈 Volume | Low | High |
+| 💾 Storage | Small | Large |
+| 🔍 Analysis | Trends, alerts | Debugging |
+| ⏱️ Retention | Long (months) | Short (days) |
+
+> 🔥 **Use both**: Logs for debugging, metrics for monitoring
+
+---
+
+## 📍 Slide 8 – 😱 Alert Blindness
+
+* 🚨 No alerts = problems go unnoticed
+* 📧 Too many alerts = alert fatigue
+* 🔍 Wrong thresholds = false positives
+* 💀 On-call burnout
+
+> ⚠️ **Good metrics = actionable alerts**
+
+```mermaid
+flowchart LR
+  NoMetrics[🙈 No Metrics] --> NoAlerts[🔇 No Alerts]
+  NoAlerts --> UserReports[👥 Users Report]
+  UserReports --> Scramble[😱 Scramble]
+```
+
+---
+
+## 📍 Slide 9 – 😨 Capacity Planning Without Metrics
+
+* 📅 "We need more servers" — but how many?
+* 🔮 Crystal ball capacity planning
+* 💰 Over-provision (waste money) or under-provision (outages)
+* 💀 No data to justify decisions
+
+> ⚠️ **Without metrics, capacity planning is gambling**
+
+**💬 Discussion:** How does your team plan capacity?
+
+---
+
+## 📍 Slide 10 – 💸 The Cost of Blind Monitoring
+
+| 🔥 Problem | 💥 Impact |
+|------------|-----------|
+| 🐢 No baseline | Can't detect degradation |
+| 📊 No trends | Can't predict growth |
+| 👉 No attribution | Can't identify bottlenecks |
+| 🙈 No thresholds | Can't alert proactively |
+
+**📈 Real Numbers:**
+* 🏢 **Reactive incident detection**: Users report first (30+ min delay)
+* 🚀 **Proactive with metrics**: Alert in seconds
+* 💰 **Cost of 30-minute delay**: $150,000+ (enterprise)
+
+---
+
+## 📍 Slide 11 – 💡 Section 2: What Prometheus Is
+
+* 📊 **Time-series database** for metrics
+* 🔄 **Pull-based** model — scrapes targets
+* 📈 **PromQL** — powerful query language
+* 🎯 Industry standard for cloud-native monitoring
+
+```mermaid
+flowchart LR
+  App1[📦 App /metrics] --> Prometheus[💾 Prometheus]
+  App2[📦 Service /metrics] --> Prometheus
+  Prometheus -->|⏰ Every 15s| Scrape[🔄 Pull Metrics]
+```
+
+**📖 Definition:**
+> *Prometheus is an open-source monitoring system that collects metrics from targets by scraping HTTP endpoints, stores them in a time-series database, and provides a powerful query language (PromQL) for analysis.*
+
+---
+
+## 📍 Slide 12 – 🔄 Pull vs Push Model
+
+```mermaid
+flowchart TD
+  subgraph Pull["Pull (Prometheus)"]
+    P1[💾 Prometheus] -->|🔄 Scrape| T1[📦 Target]
+    P1 -->|🔄 Scrape| T2[📦 Target]
+  end
+  subgraph Push["Push (StatsD)"]
+    S1[📦 App] -->|📤 Push| D1[💾 Collector]
+    S2[📦 App] -->|📤 Push| D1
+  end
+```
+
+**🔄 Pull Benefits:**
+* 🔍 Prometheus controls the rate
+* ✅ Know immediately if target is down (scrape fails)
+* 🎯 Apps don't need to know about monitoring
+* 🔧 Easy service discovery
+
+---
+
+## 📍 Slide 13 – 🏗️ Prometheus Architecture
+
+```mermaid
+flowchart TD
+  Targets[📦 Targets /metrics] --> Prometheus[💾 Prometheus TSDB]
+  Prometheus --> AlertManager[🚨 AlertManager]
+  Prometheus --> Grafana[📊 Grafana]
+  Prometheus --> API[🔗 HTTP API]
+  AlertManager --> Slack[💬 Slack]
+  AlertManager --> PagerDuty[📟 PagerDuty]
+```
+
+| 🧱 Component | 🎯 Purpose |
+|-------------|----------|
+| 💾 **Prometheus** | Scrape, store, query |
+| 📦 **Targets** | Expose /metrics endpoint |
+| 🚨 **AlertManager** | Handle alerts |
+| 📊 **Grafana** | Visualization |
+
+---
+
+## 📍 Slide 14 – 📊 Metric Types
+
+```mermaid
+flowchart LR
+  Counter[🔢 Counter] --> Always[Only goes UP]
+  Gauge[📊 Gauge] --> UpDown[Goes up AND down]
+  Histogram[📈 Histogram] --> Distribution[Value distribution]
+```
+
+| 📊 Type | 🎯 Use For | 📝 Example |
+|---------|----------|---------|
+| 🔢 **Counter** | Cumulative events | Total requests |
+| 📊 **Gauge** | Current value | Temperature, memory |
+| 📈 **Histogram** | Distribution | Request latency |
+| 📊 **Summary** | Percentiles | Pre-calculated p95 |
+
+---
+
+## 📍 Slide 15 – 🔢 Counter Deep Dive
+
+```python
+from prometheus_client import Counter
+
+# 🔢 Counter: Only goes up
+http_requests_total = Counter(
+    'http_requests_total',
+    'Total HTTP requests',
+    ['method', 'endpoint', 'status']
+)
+
+# Usage
+http_requests_total.labels(method='GET', endpoint='/', status='200').inc()
+```
+
+**📊 Query Patterns:**
+```promql
+# Total requests
+http_requests_total
+
+# Requests per second (rate over 5m)
+rate(http_requests_total[5m])
+
+# Requests per second by endpoint
+sum by (endpoint) (rate(http_requests_total[5m]))
+```
+
+**⚠️ Counter Rule:** Use `rate()` to get per-second values
+
+---
+
+## 📍 Slide 16 – 🎮 Section 3: Application Instrumentation
+
+## 🐍 Python prometheus_client
+
+```python
+from prometheus_client import Counter, Gauge, Histogram, generate_latest
+from flask import Flask, Response
+
+app = Flask(__name__)
+
+# 📊 Define metrics
+requests = Counter('http_requests', 'Total requests', ['method', 'path'])
+latency = Histogram('http_latency_seconds', 'Request latency', ['path'])
+in_progress = Gauge('http_in_progress', 'Requests in progress')
+
+@app.route('/metrics')
+def metrics():
+    return Response(generate_latest(), content_type='text/plain')
+```
+
+**🎮 Let's instrument an application.**
+
+---
+
+## 📍 Slide 17 – 📊 Histogram Deep Dive
+
+```python
+from prometheus_client import Histogram
+
+# 📈 Histogram with buckets
+request_latency = Histogram(
+    'http_request_duration_seconds',
+    'Request latency in seconds',
+    ['method', 'endpoint'],
+    buckets=[0.01, 0.05, 0.1, 0.5, 1.0, 5.0]  # 🪣 Custom buckets
+)
+
+# Usage
+with request_latency.labels(method='GET', endpoint='/').time():
+    # ... handle request ...
+    pass
+```
+
+**📊 Query Patterns:**
+```promql
+# 95th percentile latency
+histogram_quantile(0.95, rate(http_request_duration_seconds_bucket[5m]))
+
+# Average latency
+rate(http_request_duration_seconds_sum[5m]) / rate(http_request_duration_seconds_count[5m])
+```
+
+---
+
+## 📍 Slide 18 – 📈 The RED Method
+
+```mermaid
+flowchart LR
+  R[🔴 Rate] --> Requests[Requests per second]
+  E[🟡 Errors] --> Failures[Error rate]
+  D[🔵 Duration] --> Latency[Response time]
+```
+
+**📊 RED Method for Request-Driven Services:**
+
+| 📊 Metric | 🎯 Question | 📝 PromQL |
+|-----------|----------|---------|
+| 🔴 **Rate** | How busy? | `rate(requests[5m])` |
+| 🟡 **Errors** | How often failing? | `rate(errors[5m])` |
+| 🔵 **Duration** | How slow? | `histogram_quantile(0.95, ...)` |
+
+**🎯 If you monitor only 3 things, monitor these!**
+
+---
+
+## 📍 Slide 19 – 📈 The USE Method
+
+```mermaid
+flowchart LR
+  U[📊 Utilization] --> HowMuch[% resource busy]
+  S[📊 Saturation] --> Queuing[Extra work waiting]
+  E[📊 Errors] --> Failures[Error count]
+```
+
+**📊 USE Method for Resources (CPU, Memory, Disk):**
+
+| 📊 Metric | 🎯 Example |
+|-----------|----------|
+| 📊 **Utilization** | CPU at 80% |
+| 📊 **Saturation** | 10 requests queued |
+| 📊 **Errors** | Disk I/O errors |
+
+**🎯 USE for resources, RED for services**
+
+---
+
+## 📍 Slide 20 – ⚙️ Prometheus Configuration
+
+```yaml
+# prometheus/prometheus.yml
+global:
+  scrape_interval: 15s
+  evaluation_interval: 15s
+
+scrape_configs:
+  - job_name: 'prometheus'
+    static_configs:
+      - targets: ['localhost:9090']
+
+  - job_name: 'app'
+    static_configs:
+      - targets: ['app-python:8000']
+    metrics_path: '/metrics'
+
+  - job_name: 'loki'
+    static_configs:
+      - targets: ['loki:3100']
+```
+
+**🔑 Key Settings:**
+* ⏱️ `scrape_interval`: How often to collect (15s here; Prometheus defaults to 1m)
+* 🎯 `targets`: What to scrape
+* 📍 `metrics_path`: Where metrics are exposed
+
+---
+
+## 📍 Slide 21 – 🎯 Scrape Targets
+
+```mermaid
+flowchart TD
+  Prometheus[💾 Prometheus] -->|🔄 Scrape| App[📦 app:8000/metrics]
+  Prometheus -->|🔄 Scrape| Loki[📦 loki:3100/metrics]
+  Prometheus -->|🔄 Scrape| Grafana[📦 grafana:3000/metrics]
+  Prometheus -->|🔄 Scrape| Self[📦 prometheus:9090/metrics]
+```
+
+**📊 Verify Targets:**
+```bash
+# Check targets status
+curl http://localhost:9090/api/v1/targets
+
+# Web UI (open in a browser):
+#   http://localhost:9090/targets
+```
+
+**✅ All targets should show `UP`**
+
+---
+
+## 📍 Slide 22 – 📊 /metrics Endpoint Format
+
+```
+# HELP http_requests_total Total HTTP requests
+# TYPE http_requests_total counter
+http_requests_total{method="GET",endpoint="/",status="200"} 1234
+http_requests_total{method="GET",endpoint="/health",status="200"} 567
+http_requests_total{method="POST",endpoint="/api",status="201"} 89
+
+# HELP http_request_duration_seconds Request latency
+# TYPE http_request_duration_seconds histogram
+http_request_duration_seconds_bucket{le="0.01"} 100
+http_request_duration_seconds_bucket{le="0.05"} 200
+http_request_duration_seconds_bucket{le="0.1"} 250
+http_request_duration_seconds_bucket{le="+Inf"} 300
+http_request_duration_seconds_sum 45.67
+http_request_duration_seconds_count 300
+```
+
+**📊 Format:** `metric_name{labels} value`
+
+---
+
+## 📍 Slide 23 – 🏷️ Labels Best Practices
+
+```python
+# ✅ Good: Low cardinality labels
+http_requests.labels(method='GET', status='200', endpoint='/api')
+
+# ❌ Bad: High cardinality (user IDs, request IDs)
+http_requests.labels(user_id='12345')  # 💥 Millions of time series!
+```
+
+**🏷️ Label Rules:**
+* ✅ Use for: method, endpoint, status, service
+* ❌ Avoid: user_id, request_id, session_id
+* 📊 Target: < 1000 unique label combinations
+
+**⚠️ High cardinality = memory explosion**
+
+---
+
+## 📍 Slide 24 – 🔍 PromQL Basics
+
+```promql
+# Instant vector (current value)
+http_requests_total
+
+# Range vector (over time)
+http_requests_total[5m]
+
+# Rate (per-second)
+rate(http_requests_total[5m])
+
+# Sum by label
+sum by (endpoint) (rate(http_requests_total[5m]))
+
+# Filter by label
+http_requests_total{status="500"}
+```
+
+**🔑 Key Operators:**
+* `rate()` — Per-second rate for counters
+* `sum()` — Aggregate across series
+* `by ()` — Group results
+* `{}` — Filter by labels
+
+---
+
+## 📍 Slide 25 – 📝 QUIZ — DEVOPS_L8_MID
+
+---
+
+## 📍 Slide 26 – 📊 Section 4: Building Dashboards
+
+## 🎨 Dashboard Design with RED
+
+```mermaid
+flowchart TD
+  Row1[🔝 Row 1: Overview Stats]
+  Row2[📊 Row 2: Rate & Errors]
+  Row3[⏱️ Row 3: Latency]
+  Row4[📋 Row 4: Details]
+  Row1 --> Row2 --> Row3 --> Row4
+```
+
+**📊 Essential Panels:**
+1. 📊 **Request Rate** — Requests per second
+2. ❌ **Error Rate** — 5xx responses
+3. ⏱️ **Latency p95** — 95th percentile
+4. 📈 **Latency Heatmap** — Distribution
+
+---
+
+## 📍 Slide 27 – 📊 PromQL Dashboard Queries
+
+**1️⃣ Request Rate (Time series)**
+```promql
+sum(rate(http_requests_total[5m])) by (endpoint)
+```
+
+**2️⃣ Error Rate % (Time series)**
+```promql
+sum(rate(http_requests_total{status=~"5.."}[5m]))
+  / sum(rate(http_requests_total[5m])) * 100
+```
+
+**3️⃣ P95 Latency (Time series)**
+```promql
+histogram_quantile(0.95,
+  sum(rate(http_request_duration_seconds_bucket[5m])) by (le))
+```
+
+**4️⃣ Uptime (Stat)**
+```promql
+up{job="app"}
+```
+
+---
+
+## 📍 Slide 28 – 📈 Heatmap for Latency
+
+```promql
+# Latency distribution over time
+sum(rate(http_request_duration_seconds_bucket[1m])) by (le)
+```
+
+**🎨 Heatmap Benefits:**
+* 📊 See latency distribution
+* 🔍 Spot outliers
+* 📈 Track changes over time
+
+```mermaid
+flowchart LR
+  Green[🟢 Fast: < 100ms] --> Yellow[🟡 OK: 100-500ms]
+  Yellow --> Red[🔴 Slow: > 500ms]
+```
+
+---
+
+## 📍 Slide 29 – 📊 Monitoring Metrics
+
+| 📊 Metric | 📏 Measures | 🏆 Target |
+|-----------|------------|---------|
+| ⏱️ **Scrape Success** | Targets reachable | 100% |
+| 📊 **Series Count** | Time series | Stable |
+| 💾 **Storage Size** | Disk usage | Predictable |
+| 🔍 **Query Latency** | PromQL speed | < 1s |
+
+> 📚 Monitor your monitoring!
+
+**🤔 Question:** What happens if Prometheus goes down?
+
+---
+
+## 📍 Slide 30 – 🌊 From Guessing to Measuring
+
+```mermaid
+flowchart LR
+  subgraph Guessing["😱 Guessing"]
+    NoData[🤷 No Data]
+    Reactive[🔥 Reactive]
+    Slow[⏱️ Slow Detection]
+  end
+  subgraph Measuring["📊 Measuring"]
+    Metrics[📈 Real Metrics]
+    Proactive[⚡ Proactive]
+    Fast[🚀 Instant Detection]
+  end
+  Guessing -->|🚀 Prometheus| Measuring
+```
+
+**🎯 Monitoring State:**
+* ⚡ Detect issues before users
+* 📊 Data-driven capacity planning
+* 📈 Trend analysis and predictions
+
+---
+
+## 📍 Slide 31 – 🏢 Section 5: Production Monitoring
+
+## 📅 A Day with Prometheus
+
+**☀️ Morning:**
+* 📊 Check Grafana — all green ✅
+* 📈 Review overnight trends
+* 🔍 No anomalies detected
+
+**🌤️ Afternoon:**
+* 🚨 Alert: Latency p95 > 500ms
+* 📊 Dashboard shows spike at 2pm
+* 🔍 PromQL: `histogram_quantile(0.95, ...)`
+* 🔧 Found: Database slow query
+* ⏱️ **5 minutes** to identify
+
+**🌙 Evening:**
+* 📊 Review daily trends
+* 📈 Plan tomorrow's capacity
+* 🏠 Go home with confidence
+
+---
+
+## 📍 Slide 32 – 👥 Team Monitoring Workflow
+
+| 👤 Role | 🎯 Monitoring Responsibility |
+|---------|----------------------|
+| 👨‍💻 **Developer** | Add metrics to code |
+| 🔧 **DevOps** | Maintain Prometheus |
+| 🛡️ **SRE** | Design dashboards & alerts |
+| 📊 **On-call** | Respond to alerts |
+
+**🔗 Alert Flow:**
+```mermaid
+flowchart LR
+  Prometheus[💾 Prometheus] -->|🚨 Alert| AlertManager[📬 AlertManager]
+  AlertManager --> Slack[💬 Slack]
+  AlertManager --> PagerDuty[📟 PagerDuty]
+  PagerDuty --> OnCall[👤 On-call]
+```
+
+---
+
+## 📍 Slide 33 – 🔐 Production Considerations
+
+```yaml
+# Prometheus with retention
+command:
+  - '--config.file=/etc/prometheus/prometheus.yml'
+  - '--storage.tsdb.retention.time=15d'
+  - '--storage.tsdb.retention.size=10GB'
+
+deploy:
+  resources:
+    limits:
+      memory: 1G
+      cpus: '1.0'
+
+healthcheck:
+  test: ["CMD", "wget", "-q", "--spider", "http://localhost:9090/-/healthy"]
+  interval: 10s
+  timeout: 5s
+  retries: 5
+```
+
+**🛡️ Production Checklist:**
+* 💾 Persistent storage configured
+* 🗓️ Retention policy set
+* 📊 Resource limits defined
+* 🏥 Health checks enabled
+
+---
+
+## 📍 Slide 34 – 📈 Career Path: Monitoring Skills
+
+```mermaid
+flowchart LR
+  Junior[🌱 Junior: Basic metrics] --> Mid[💼 Mid: PromQL & dashboards]
+  Mid --> Senior[⭐ Senior: Full observability]
+  Senior --> Principal[🏆 Principal: SRE practices]
+```
+
+**🛠️ Skills to Build:**
+* 📊 Application instrumentation
+* 🔍 PromQL fluency
+* 📈 Dashboard design
+* 🚨 Alert engineering
+* 📊 SLO/SLI definition
+
+---
+
+## 📍 Slide 35 – 🌍 Real Company Examples
+
+**🏢 Prometheus at Scale:**
+* ☁️ **SoundCloud**: Created Prometheus (2012)
+* 🔍 **Google**: Inspired Prometheus (Borgmon)
+* 🎬 **Netflix**: Millions of time series
+
+**☁️ Modern Practices:**
+* 📦 **Spotify**: Custom Prometheus federation
+* 🏦 **Stripe**: Fine-grained latency tracking
+* 🎮 **Riot Games**: Real-time game metrics
+
+**📊 Stats:**
+* 🌍 **#1** cloud-native monitoring tool
+* 📦 **CNCF graduated** project
+* 🏢 Adopted by **70%+** of K8s users
+
+---
+
+## 📍 Slide 36 – 🎯 Section 6: Reflection
+
+## 📝 Key Takeaways
+
+1. 📊 **Metrics complement logs** — different purposes
+2. 🔢 **Counter, Gauge, Histogram** — choose wisely
+3. 🔴 **RED method** for services (Rate, Errors, Duration)
+4. 🏷️ **Labels** — keep cardinality low
+5. 📈 **PromQL** is powerful — learn it well
+
+> 💡 If you can't measure it, you can't improve it.
+
+---
+
+## 📍 Slide 37 – 🧠 The Mindset Shift
+
+| 😰 Old Mindset | 📊 Metrics Mindset |
+|---------------|------------------|
+| 🙅 "Seems fine" | 📊 "Data shows it's fine" |
+| 🚫 "Users will tell us" | 🚨 "Alerts tell us first" |
+| 👉 "We need more servers" | 📈 "Data shows we need 3 more" |
+| 😨 "Deploy and hope" | 📊 "Deploy and measure" |
+| 💻 "Performance is subjective" | 🔢 "p95 is 250ms" |
+
+> ❓ Which mindset describes your team?
+
+---
+
+## 📍 Slide 38 – ✅ Your Progress
+
+## 🎓 What You Now Understand
+
+* ✅ Metrics types and when to use each
+* ✅ Prometheus architecture and configuration
+* ✅ Application instrumentation patterns
+* ✅ PromQL query syntax
+* ✅ Dashboard design with RED method
+
+> 🚀 **You're ready for Lab 8: Prometheus Monitoring**
+
+---
+
+## 📍 Slide 39 – 📝 QUIZ — DEVOPS_L8_POST
+
+---
+
+## 📍 Slide 40 – 🚀 What Comes Next
+
+## 📚 Next Lecture: Kubernetes Fundamentals
+
+* ☸️ Container orchestration
+* 📦 Deployments and Services
+* 🔄 Scaling and self-healing
+* 💻 Hands-on: Deploying to Kubernetes
+
+**🎉 Your monitoring journey continues.**
+
+> 📊 From guessing to measuring — one metric at a time.
+
+```mermaid
+flowchart LR
+  You[👤 You] --> Metrics[📊 Metrics Skills]
+  Metrics --> DataDriven[📈 Data-Driven Ops]
+  DataDriven --> Career[🚀 Career Growth]
+```
+
+**👋 See you in the next lecture!**
+
+---
+
+## 📚 Resources & Further Reading
+
+**📕 Books:**
+* 📖 *Prometheus: Up & Running* — Brian Brazil
+* 📖 *Site Reliability Engineering* — Google
+* 📖 *The Art of Monitoring* — James Turnbull
+
+**🔗 Links:**
+* 🌐 [Prometheus Documentation](https://prometheus.io/docs/)
+* 🌐 [PromQL Basics](https://prometheus.io/docs/prometheus/latest/querying/basics/)
+* 🌐 [RED Method](https://grafana.com/blog/2018/08/02/the-red-method-how-to-instrument-your-services/)
+
+---
diff --git a/lectures/lec9.md b/lectures/lec9.md
new file mode 100644
index 0000000000..e5a265fd11
--- /dev/null
+++ b/lectures/lec9.md
@@ -0,0 +1,853 @@
+# 📌 Lecture 9 — Kubernetes Fundamentals: Container Orchestration
+
+## 📍 Slide 1 – 🚀 Welcome to Kubernetes
+
+* 🌍 **Containers are great** — but who manages them at scale?
+* 😰 Manual container management doesn't scale
+* ☸️ **Kubernetes** = the operating system for containers
+* 🎯 This lecture: master deployments, services, and orchestration
+
+```mermaid
+flowchart LR
+  Containers[🐳 Containers] -->|☸️ Kubernetes| Orchestration[🎭 Orchestration]
+  Orchestration --> Scaling[📈 Auto-scaling]
+  Orchestration --> Healing[🏥 Self-healing]
+  Orchestration --> Updates[🔄 Rolling updates]
+```
+
+---
+
+## 📍 Slide 2 – 🎯 What You Will Learn
+
+* ✅ Understand Kubernetes architecture and concepts
+* ✅ Write production-ready Deployment manifests
+* ✅ Expose applications with Services and Ingress
+* ✅ Implement health checks and resource management
+
+**🎓 Learning Outcomes:**
+| # | Outcome |
+|---|---------|
+| 1 | 🧠 Explain Kubernetes declarative model |
+| 2 | 🔍 Create Deployments with probes and limits |
+| 3 | 🛠️ Configure Services for networking |
+| 4 | 🗺️ Perform scaling and rolling updates |
+
+---
+
+## 📍 Slide 3 – 📋 How This Lecture Works
+
+* 📚 **Concepts + YAML manifests** — hands-on focus
+* 🎮 **Real-world scenarios** — production deployment challenges
+* 📝 **3 quiz checkpoints**: PRE / MID / POST
+* 🛠️ **Tools**: kubectl, minikube, manifests
+
+**⏱️ Lecture Structure:**
+```
+Section 0: Introduction (now)     → 📝 PRE Quiz
+Section 1: The Orchestration Problem
+Section 2: Kubernetes Architecture
+Section 3: Core Resources          → 📝 MID Quiz
+Section 4: Manifest Best Practices
+Section 5: Production Kubernetes
+Section 6: Reflection             → 📝 POST Quiz
+```
+
+---
+
+## 📍 Slide 4 – ❓ The Big Question
+
+* 📊 **92%** of organizations use containers in production
+* ⏱️ Average container lifecycle: **minutes to hours** (not days)
+* 💥 Managing 100+ containers manually is **impossible**
+
+> 💬 *"Why did container 47 crash? Where's the replacement?"* — Nobody wants to ask this manually
+
+**🤔 Think about it:**
+* How do you ensure 10 copies of your app are always running?
+* What happens when a container crashes at 3am?
+* How do you update without downtime?
+
+---
+
+## 📍 Slide 5 – 📝 QUIZ — DEVOPS_L9_PRE
+
+---
+
+## 📍 Slide 6 – 🔥 Section 1: The Orchestration Problem
+
+* 🐳 **One container is easy** — just `docker run`
+* 📦 100 containers? 1000 containers?
+* 🔧 Manual restart on crash?
+* 💥 Result: **operations nightmare**
+
+```mermaid
+flowchart LR
+  Single[🐳 1 Container] -->|Easy| Manual[👤 Manual]
+  Hundred[🐳 100 Containers] -->|Hard| Manual
+  Thousand[🐳 1000 Containers] -->|💥 Impossible| Manual
+```
+
+---
+
+## 📍 Slide 7 – 😱 Container Management Chaos
+
+* 📋 Tracking which containers run where
+* 🔄 Restarting crashed containers
+* 📊 Load balancing between replicas
+* 🔒 Managing secrets and configs
+* 💀 Scaling up/down based on load
+
+```mermaid
+flowchart TD
+  Crash[💥 Container Crash] --> Detect["🔍 Detect (how?)"]
+  Detect --> Restart["🔄 Restart (where?)"]
+  Restart --> LoadBalance["⚖️ Update LB (manually?)"]
+  LoadBalance --> Hope[🙏 Hope it works]
+```
+
+**📊 The Numbers:**
+* 🔍 **Netflix**: 100,000+ container instances
+* 📦 **Spotify**: 10,000+ services
+* ⏱️ Manual management: **impossible**
+
+---
+
+## 📍 Slide 8 – 🔧 Docker Compose Limitations
+
+* ✅ Great for development and simple deployments
+* ❌ Single host only
+* ❌ No automatic restart across nodes
+* ❌ No rolling updates
+* ❌ No auto-scaling
+
+> ⚠️ **Docker Compose ≠ production orchestration**
+
+```mermaid
+flowchart TD
+  Compose[🐳 Docker Compose] --> SingleHost[🖥️ Single Host]
+  K8s[☸️ Kubernetes] --> MultiHost[🖥️🖥️🖥️ Multi-Host Cluster]
+  SingleHost --> DevTest[✅ Dev/Test]
+  MultiHost --> Production[✅ Production]
+```
+
+---
+
+## 📍 Slide 9 – 😨 Zero Downtime Deployments
+
+* 📅 Traditional: Schedule maintenance window
+* 🔧 Stop old version, start new version
+* ⏱️ Downtime = lost revenue
+* 💀 Risky deployments = fear of deploying
+
+> ⚠️ **Every minute of downtime costs money**
+
+**💬 Discussion:** How do you update without any downtime?
+
+---
+
+## 📍 Slide 10 – 💸 The Cost of Manual Orchestration
+
+| 🔥 Problem | 💥 Impact |
+|------------|-----------|
+| 🐢 Slow scaling | Can't handle traffic spikes |
+| 📋 Manual recovery | Long outages |
+| 👉 No load balancing | Uneven distribution |
+| 🙈 Version confusion | "Which version is running?" |
+
+**📈 Real Numbers:**
+* 🏢 **Manual ops**: 10+ hours/week
+* 🚀 **With Kubernetes**: Minutes/week
+* 💰 **Downtime cost**: $5,600/minute (average)
+
+---
+
+## 📍 Slide 11 – 💡 Section 2: What Kubernetes Is
+
+* ☸️ **Container orchestration platform**
+* 🎭 **Manages** container lifecycle automatically
+* 🔄 **Declarative** — you define desired state
+* 🌐 **Portable** — runs anywhere (cloud, on-prem, laptop)
+
+```mermaid
+flowchart LR
+  You[👤 You] -->|📝 Declare| K8s[☸️ Kubernetes]
+  K8s -->|🔄 Reconcile| Cluster[🖥️ Cluster]
+  K8s -->|🔁 Continuously| Monitor[👀 Monitor & Fix]
+```
+
+**📖 Definition:**
+> *Kubernetes is an open-source container orchestration platform that automates deployment, scaling, and management of containerized applications.*
+
+---
+
+## 📍 Slide 12 – 🎭 Declarative vs Imperative
+
+```mermaid
+flowchart TD
+  subgraph Declarative
+    D1[📝 Define: 3 replicas]
+    D2[☸️ K8s makes it happen]
+    D1 --> D2
+  end
+  subgraph Imperative
+    I1[💻 Run: create pod 1]
+    I2[💻 Run: create pod 2]
+    I3[💻 Run: create pod 3]
+    I1 --> I2 --> I3
+  end
+```
+
+| 📋 Approach | 📝 You Say | ☸️ K8s Does |
+|-------------|----------|------------|
+| 🎭 **Declarative** | "I want 3 replicas" | Creates/maintains 3 |
+| 💻 **Imperative** | "Create this pod" | Creates 1 pod |
+
+**🎯 Always prefer declarative manifests!**
+
+---
+
+## 📍 Slide 13 – 🏗️ Kubernetes Architecture
+
+```mermaid
+flowchart TD
+  subgraph Control Plane
+    API[📡 API Server]
+    Scheduler[📊 Scheduler]
+    Controller[🔄 Controller Manager]
+    ETCD[💾 etcd]
+  end
+  subgraph Worker Nodes
+    Kubelet[🤖 kubelet]
+    Proxy[🌐 kube-proxy]
+    Runtime[🐳 Container Runtime]
+  end
+  API --> Scheduler
+  API --> Controller
+  API --> ETCD
+  API --> Kubelet
+  Kubelet --> Runtime
+```
+
+| 🧱 Component | 🎯 Purpose |
+|-------------|----------|
+| 📡 **API Server** | Gateway to cluster |
+| 📊 **Scheduler** | Places pods on nodes |
+| 🔄 **Controller** | Ensures desired state |
+| 💾 **etcd** | Cluster state database |
+| 🤖 **kubelet** | Node agent |
+
+---
+
+## 📍 Slide 14 – 📦 Core Resources
+
+```mermaid
+flowchart TD
+  Pod[📦 Pod] --> Containers[🐳 Containers]
+  Deployment[🚀 Deployment] --> ReplicaSet[📊 ReplicaSet]
+  ReplicaSet --> Pod
+  Service[🌐 Service] --> Pod
+  Ingress[🚪 Ingress] --> Service
+```
+
+| 📦 Resource | 🎯 Purpose |
+|-------------|----------|
+| 📦 **Pod** | Smallest unit, contains containers |
+| 🚀 **Deployment** | Manages replicas and updates |
+| 🌐 **Service** | Stable network endpoint |
+| 🚪 **Ingress** | HTTP routing and TLS |
+
+---
+
+## 📍 Slide 15 – ⚡ Before vs After Kubernetes
+
+| 😰 Before | 🚀 After |
+|----------|---------|
+| 📅 Manual restart on crash | 🔄 Auto-restart |
+| 📋 Manual scaling | 📈 Auto-scaling |
+| 👉 Downtime for updates | 🔄 Rolling updates |
+| 😨 Fear of deploying | 💪 Deploy anytime |
+| 🐌 Hours to scale | ⚡ Seconds to scale |
+| 📝 Track servers manually | 🎭 Declarative state |
+
+> 🤔 Ready to orchestrate?
+
+---
+
+## 📍 Slide 16 – 🎮 Section 3: Core Resources
+
+## 📦 The Pod
+
+* 🐳 **One or more containers** sharing network/storage
+* 📦 **Smallest deployable unit**
+* ⏱️ **Ephemeral** — created and destroyed
+* 🏷️ **Labeled** for selection
+
+```yaml
+apiVersion: v1
+kind: Pod
+metadata:
+  name: my-app
+  labels:
+    app: web
+spec:
+  containers:
+  - name: web
+    image: nginx:latest
+    ports:
+    - containerPort: 80
+```
+
+**⚠️ Never create pods directly — use Deployments!**
+
+---
+
+## 📍 Slide 17 – 🚀 Deployments
+
+```mermaid
+flowchart TD
+  Deployment[🚀 Deployment] --> RS1[📊 ReplicaSet v1]
+  RS1 --> Pod1[📦 Pod]
+  RS1 --> Pod2[📦 Pod]
+  RS1 --> Pod3[📦 Pod]
+```
+
+**🚀 Deployment manages:**
+* 📊 Desired replica count
+* 🔄 Rolling updates
+* 🔙 Rollback capability
+* 🏷️ Pod template
+
+```yaml
+apiVersion: apps/v1
+kind: Deployment
+metadata:
+  name: web-app
+spec:
+  replicas: 3
+  selector:
+    matchLabels:
+      app: web
+  template:
+    metadata:
+      labels:
+        app: web
+    spec:
+      containers:
+      - name: web
+        image: myapp:1.0
+```
+
+---
+
+## 📍 Slide 18 – 🏷️ Labels and Selectors
+
+```mermaid
+flowchart LR
+  Deployment[🚀 Deployment] -->|selector: app=web| Pods[📦 Pods with label app=web]
+  Service[🌐 Service] -->|selector: app=web| Pods
+```
+
+**🏷️ Labels = Key-value pairs for organization**
+
+```yaml
+metadata:
+  labels:
+    app: web-frontend
+    environment: production
+    version: v1.2.3
+
+selector:
+  matchLabels:
+    app: web-frontend
+```
+
+**🎯 Labels enable:**
+* 🔍 Service discovery
+* 📊 Resource selection
+* 🏗️ Organization
+
+---
+
+## 📍 Slide 19 – 🌐 Services
+
+```mermaid
+flowchart LR
+  Client[👥 Client] --> Service[🌐 Service: ClusterIP]
+  Service --> Pod1[📦 Pod 1]
+  Service --> Pod2[📦 Pod 2]
+  Service --> Pod3[📦 Pod 3]
+```
+
+**🌐 Service types:**
+| 🔧 Type | 🎯 Use Case |
+|---------|----------|
+| 🔒 **ClusterIP** | Internal cluster access |
+| 🔓 **NodePort** | External via node IP |
+| ☁️ **LoadBalancer** | Cloud load balancer |
+| 🔗 **ExternalName** | DNS alias |
+
+```yaml
+apiVersion: v1
+kind: Service
+metadata:
+  name: web-service
+spec:
+  type: NodePort
+  selector:
+    app: web
+  ports:
+  - port: 80
+    targetPort: 8000
+    nodePort: 30080
+```
+
+---
+
+## 📍 Slide 20 – 🔄 Rolling Updates
+
+```mermaid
+flowchart LR
+  V1[📦 v1] --> V1_V2[📦 v1 + v2]
+  V1_V2 --> V2[📦 v2]
+```
+
+**🔄 How it works:**
+1. 📦 Create new pods with new version
+2. ⏳ Wait for them to be ready
+3. 🗑️ Terminate old pods gradually
+4. ✅ Zero downtime!
+
+```yaml
+spec:
+  strategy:
+    type: RollingUpdate
+    rollingUpdate:
+      maxSurge: 1        # Extra pods during update
+      maxUnavailable: 0  # Always maintain capacity
+```
+
+---
+
+## 📍 Slide 21 – 📊 kubectl Commands
+
+```bash
+# 📋 Get resources
+kubectl get pods
+kubectl get deployments
+kubectl get services
+
+# 🔍 Describe (detailed info)
+kubectl describe pod <name>
+
+# 📝 Apply manifest
+kubectl apply -f deployment.yaml
+
+# 📊 Watch changes
+kubectl get pods -w
+
+# 🔙 Rollback
+kubectl rollout undo deployment/<name>
+
+# 📈 Scale
+kubectl scale deployment/<name> --replicas=5
+```
+
+---
+
+## 📍 Slide 22 – 🚪 Ingress
+
+```mermaid
+flowchart LR
+  Internet[🌐 Internet] --> Ingress[🚪 Ingress Controller]
+  Ingress -->|/app1| Svc1[🌐 Service 1]
+  Ingress -->|/app2| Svc2[🌐 Service 2]
+  Svc1 --> Pods1[📦 Pods]
+  Svc2 --> Pods2[📦 Pods]
+```
+
+**🚪 Ingress provides:**
+* 🔗 URL routing
+* 🔐 TLS termination
+* 🏷️ Name-based virtual hosting
+
+```yaml
+apiVersion: networking.k8s.io/v1
+kind: Ingress
+metadata:
+  name: app-ingress
+spec:
+  rules:
+  - host: app.example.com
+    http:
+      paths:
+      - path: /
+        pathType: Prefix
+        backend:
+          service:
+            name: web-service
+            port:
+              number: 80
+```
+
+---
+
+## 📍 Slide 23 – 🏥 Health Checks
+
+```yaml
+spec:
+  containers:
+  - name: app
+    image: myapp:1.0
+    livenessProbe:
+      httpGet:
+        path: /health
+        port: 8000
+      initialDelaySeconds: 10
+      periodSeconds: 5
+    readinessProbe:
+      httpGet:
+        path: /ready
+        port: 8000
+      initialDelaySeconds: 5
+      periodSeconds: 3
+```
+
+| 🏥 Probe | 🎯 Purpose | ❌ Failure Action |
+|----------|----------|------------------|
+| 🔴 **Liveness** | Is it alive? | Restart container |
+| 🟢 **Readiness** | Is it ready? | Remove from service |
+| 🟡 **Startup** | Did it start? | Restart container (other probes wait until it passes) |
+
+---
+
+## 📍 Slide 24 – 📊 Resource Management
+
+```yaml
+spec:
+  containers:
+  - name: app
+    image: myapp:1.0
+    resources:
+      requests:
+        memory: "128Mi"
+        cpu: "100m"       # 0.1 CPU core
+      limits:
+        memory: "256Mi"
+        cpu: "200m"       # 0.2 CPU core
+```
+
+**📊 Requests vs Limits:**
+| 📊 Setting | 🎯 Purpose |
+|-----------|----------|
+| 📋 **Requests** | Guaranteed resources, scheduling |
+| 🔒 **Limits** | Maximum allowed; CPU is throttled, memory overuse is OOM-killed |
+
+**⚠️ Always set both!**
+
+---
+
+## 📍 Slide 25 – 📝 QUIZ — DEVOPS_L9_MID
+
+---
+
+## 📍 Slide 26 – 📁 Section 4: Manifest Best Practices
+
+## 📄 Complete Deployment Example
+
+```yaml
+apiVersion: apps/v1
+kind: Deployment
+metadata:
+  name: web-app
+  labels:
+    app: web-app
+spec:
+  replicas: 3
+  selector:
+    matchLabels:
+      app: web-app
+  strategy:
+    type: RollingUpdate
+    rollingUpdate:
+      maxSurge: 1
+      maxUnavailable: 0
+  template:
+    metadata:
+      labels:
+        app: web-app
+    spec:
+      containers:
+      - name: web-app
+        image: username/web-app:1.0.0
+        ports:
+        - containerPort: 8000
+        resources:
+          requests:
+            memory: "128Mi"
+            cpu: "100m"
+          limits:
+            memory: "256Mi"
+            cpu: "200m"
+        livenessProbe:
+          httpGet:
+            path: /health
+            port: 8000
+          initialDelaySeconds: 10
+        readinessProbe:
+          httpGet:
+            path: /health
+            port: 8000
+          initialDelaySeconds: 5
+```
+
+---
+
+## 📍 Slide 27 – 🔐 Security Best Practices
+
+```yaml
+spec:
+  containers:
+  - name: app
+    image: myapp:1.0
+    securityContext:
+      runAsNonRoot: true
+      runAsUser: 1000
+      readOnlyRootFilesystem: true
+      allowPrivilegeEscalation: false
+```
+
+**🔐 Security Checklist:**
+* ✅ Run as non-root user
+* ✅ Read-only filesystem
+* ✅ No privilege escalation
+* ✅ Specific image tags (not `:latest`)
+* ✅ Resource limits defined
+
+---
+
+## 📍 Slide 28 – 📊 Kubernetes Metrics
+
+| 📊 Metric | 📏 Measures | 🏆 Target |
+|-----------|------------|---------|
+| 📦 **Pod Restarts** | Stability | 0 |
+| ⏱️ **Pod Startup Time** | Speed | < 30s |
+| 📊 **Resource Usage** | Efficiency | 50-80% |
+| ✅ **Probe Success** | Health | 100% |
+
+> 📚 Monitor your cluster health!
+
+**🤔 Question:** How many pod restarts is "normal"?
+
+---
+
+## 📍 Slide 29 – 🌊 From Manual to Orchestrated
+
+```mermaid
+flowchart LR
+  subgraph Manual["😱 Manual"]
+    SSH[🔌 SSH to servers]
+    Docker[🐳 docker run]
+    Restart[🔄 Manual restart]
+  end
+  subgraph Orchestrated["☸️ Orchestrated"]
+    Manifest[📝 YAML Manifest]
+    Apply[kubectl apply]
+    AutoHeal[🏥 Auto-healing]
+  end
+  Manual -->|🚀 Kubernetes| Orchestrated
+```
+
+**🎯 Orchestration State:**
+* ⚡ Deploy in seconds
+* 🔄 Auto-healing always
+* 📈 Scale on demand
+
+---
+
+## 📍 Slide 30 – 🏢 Section 5: Production Kubernetes
+
+## 📅 A Day with Kubernetes
+
+**☀️ Morning:**
+* 📊 Check cluster health — all green ✅
+* 📈 Review resource usage
+* 🔄 Approve deployment PR
+
+**🌤️ Afternoon:**
+* 🚀 `kubectl apply -f deployment.yaml`
+* 📊 Watch rolling update: `kubectl rollout status`
+* ✅ Zero downtime update complete
+
+**🌙 Evening:**
+* 📈 Auto-scaling handles traffic spike
+* 🏥 Crashed pod auto-restarted
+* 🏠 Sleep peacefully
+
+---
+
+## 📍 Slide 31 – 👥 Team Kubernetes Workflow
+
+| 👤 Role | 🎯 Kubernetes Responsibility |
+|---------|----------------------|
+| 👨‍💻 **Developer** | Write manifests, define resources |
+| 🔧 **DevOps** | Manage cluster, set policies |
+| 🛡️ **SRE** | Monitor, scale, incident response |
+| 📊 **Platform** | Build internal tooling |
+
+**🔗 GitOps Flow:**
+```mermaid
+flowchart LR
+  PR[📝 Manifest PR] --> Review[👀 Review]
+  Review --> Merge[✅ Merge]
+  Merge --> ArgoCD[🔄 ArgoCD]
+  ArgoCD --> Cluster[☸️ Cluster]
+```
+
+---
+
+## 📍 Slide 32 – 🔧 Local Development
+
+```bash
+# 🎯 minikube: Full-featured local cluster
+minikube start
+minikube status
+minikube service web-service --url
+
+# 🐳 kind: Lightweight, Docker-based
+kind create cluster
+kind load docker-image myapp:1.0
+
+# 📊 Useful addons
+minikube addons enable ingress
+minikube addons enable metrics-server
+```
+
+**🛠️ Local Options:**
+
+| 🔧 Tool | 🎯 Best For |
+|---------|----------|
+| 🚀 **minikube** | Learning, full features |
+| 🐳 **kind** | CI/CD, fast startup |
+| 🖥️ **Docker Desktop** | Mac/Windows convenience |
+
+---
+
+## 📍 Slide 33 – 📈 Career Path: Kubernetes Skills
+
+```mermaid
+flowchart LR
+  Junior[🌱 Junior: kubectl basics] --> Mid[💼 Mid: Manifests & debugging]
+  Mid --> Senior[⭐ Senior: Architecture & scaling]
+  Senior --> Principal[🏆 Principal: Platform design]
+```
+
+**🛠️ Skills to Build:**
+* 📝 YAML manifest fluency
+* 🔍 kubectl debugging
+* 🏗️ Architecture patterns
+* 📊 Resource optimization
+* 🔐 Security hardening
+
+---
+
+## 📍 Slide 34 – 🌍 Real Company Examples
+
+**🏢 Kubernetes at Scale:**
+* 📦 **Spotify**: 10,000+ services on K8s
+* 🔍 **Google**: Created Kubernetes from its Borg experience; offers it as GKE
+* 🎬 **Netflix**: Titus (K8s-inspired)
+
+**☁️ Modern Practices:**
+* 📦 **Airbnb**: 1000+ microservices
+* 🏦 **Capital One**: K8s for banking workloads
+* 🎮 **Pokemon Go**: Global scale with K8s
+
+**📊 Stats:**
+* 🌍 **5.6M+** Kubernetes developers
+* 📦 **92%** container adoption uses K8s
+* 🏢 **#1** CNCF project
+
+---
+
+## 📍 Slide 35 – 🎯 Section 6: Reflection
+
+## 📝 Key Takeaways
+
+1. ☸️ **Kubernetes orchestrates containers** at scale
+2. 🎭 **Declarative** — define desired state, K8s maintains it
+3. 🚀 **Deployments** manage replicas and updates
+4. 🌐 **Services** provide stable networking
+5. 🏥 **Probes** ensure health, **limits** ensure stability
+
+> 💡 Kubernetes is the operating system for cloud-native applications.
+
+---
+
+## 📍 Slide 36 – 🧠 The Mindset Shift
+
+| 😰 Old Mindset | ☸️ K8s Mindset |
+|---------------|------------------|
+| 🙅 "Restart manually" | 🔄 "K8s restarts automatically" |
+| 🚫 "SSH to fix" | 📝 "Fix manifest, apply" |
+| 👉 "Which server?" | 📦 "Which pod?" |
+| 😨 "Scale takes hours" | ⚡ "Scale in seconds" |
+| 💻 "Deploy on weekends" | 🚀 "Deploy anytime" |
+
+> ❓ Which mindset describes your team?
+
+---
+
+## 📍 Slide 37 – ✅ Your Progress
+
+## 🎓 What You Now Understand
+
+* ✅ Kubernetes architecture and concepts
+* ✅ Deployments, Services, and Ingress
+* ✅ Health checks and resource management
+* ✅ Rolling updates and scaling
+* ✅ kubectl commands for daily use
+
+> 🚀 **You're ready for Lab 9: Kubernetes Fundamentals**
+
+---
+
+## 📍 Slide 38 – 📝 QUIZ — DEVOPS_L9_POST
+
+---
+
+## 📍 Slide 39 – 🚀 What Comes Next
+
+## 📚 Next Lecture: Helm Package Management
+
+* ⛵ Helm charts for packaging
+* 📝 Templating with Go templates
+* 🔧 Values management
+* 💻 Hands-on: Creating Helm charts
+
+**🎉 Your Kubernetes journey continues.**
+
+> ☸️ From manual containers to orchestration — one manifest at a time.
+
+```mermaid
+flowchart LR
+  You[👤 You] --> K8s[☸️ Kubernetes Skills]
+  K8s --> CloudNative[☁️ Cloud-Native]
+  CloudNative --> Career[🚀 Career Growth]
+```
+
+**👋 See you in the next lecture!**
+
+---
+
+## 📍 Slide 40 – 📚 Resources & Further Reading
+
+**📕 Books:**
+* 📖 *Kubernetes: Up & Running* — Brendan Burns, Joe Beda, Kelsey Hightower
+* 📖 *The Kubernetes Book* — Nigel Poulton
+* 📖 *Cloud Native DevOps with Kubernetes* — John Arundel, Justin Domingus
+
+**🔗 Links:**
+* 🌐 [Kubernetes Documentation](https://kubernetes.io/docs/)
+* 🌐 [kubectl Cheat Sheet](https://kubernetes.io/docs/reference/kubectl/cheatsheet/)
+* 🌐 [Kubernetes the Hard Way](https://github.com/kelseyhightower/kubernetes-the-hard-way)
+
+---