From eaf4a8405a8a043e5c4bca4a4d40bb2801880f4f Mon Sep 17 00:00:00 2001 From: Edward Oliveira Date: Mon, 13 Apr 2026 22:24:16 -0300 Subject: [PATCH] Phase 0 hardening: nginx GeoIP2, rate limits, Gunicorn tuning, N+1 fix - nginx: sendfile on, tcp_nopush, reduced keepalive/proxy timeouts - nginx: GeoIP2 ASN-based bot blocking (cloud providers + known scrapers) - nginx: UA blocklist (GPTBot, ClaudeBot, Chrome/98.0.4758 impersonator, etc.) - nginx: rate-limit zones (30r/m general, 10r/m heavy/relatorios), 429/500 error pages - nginx: proper ETags + Cache-Control on /media/ to stop 30GB logo re-transfers - Dockerfile: install libnginx-mod-http-geoip2; download GeoLite2-ASN.mmdb via BuildKit secret (key never baked into image layers); ARG GEOIP_CACHE_BUST for forced re-download without --no-cache - Gunicorn: workers 3->2, threads 8->4, timeout 300->120, max_memory 300->400MB - Django: FILE_UPLOAD_MAX_MEMORY_SIZE=2MB, FILE_UPLOAD_TEMP_DIR for large uploads - relatorios/views.py: fix N+1 in get_etiqueta_protocolos with bulk-fetch MateriaLegislativa + DocumentoAdministrativo using select_related + dict lookups - Add robots.txt, 429.html, 500.html static pages - docker-compose.yaml: use sapl:local for local dev - docker/README.md: build instructions with MAXMIND_LICENSE_KEY - rate-limiter-v2.md: canonical planning document (Architecture through Phase 5) Co-Authored-By: Claude Sonnet 4.6 --- docker/Dockerfile | 39 +- docker/README.md | 107 ++ docker/config/nginx/nginx.conf | 82 +- docker/config/nginx/sapl.conf | 146 ++- docker/docker-compose.yaml | 2 +- docker/startup_scripts/gunicorn.conf.py | 10 +- rate-limiter-v2.md | 1231 +++++++++++++++++++++++ sapl/relatorios/views.py | 43 +- sapl/settings.py | 4 + sapl/static/429.html | 42 + sapl/static/500.html | 42 + sapl/static/robots.txt | 19 + 12 files changed, 1714 insertions(+), 53 deletions(-) create mode 100644 docker/README.md create mode 100644 rate-limiter-v2.md create mode 100644 sapl/static/429.html create mode 100644 
sapl/static/500.html create mode 100644 sapl/static/robots.txt diff --git a/docker/Dockerfile b/docker/Dockerfile index 831627ec8..be71b413c 100644 --- a/docker/Dockerfile +++ b/docker/Dockerfile @@ -57,7 +57,7 @@ RUN set -eux; \ if [ "$WITH_GRAPHVIZ" = "1" ]; then apt-get install -y --no-install-recommends graphviz; fi; \ if [ "$WITH_POPPLER" = "1" ]; then apt-get install -y --no-install-recommends poppler-utils; fi; \ if [ "$WITH_PSQL_CLIENT" = "1" ]; then apt-get install -y --no-install-recommends postgresql-client; fi; \ - if [ "$WITH_NGINX" = "1" ]; then apt-get install -y --no-install-recommends nginx; fi; \ + if [ "$WITH_NGINX" = "1" ]; then apt-get install -y --no-install-recommends nginx libnginx-mod-http-geoip2 libmaxminddb0; fi; \ rm -rf /var/lib/apt/lists/* # Usuários/grupos (idempotente) @@ -67,7 +67,13 @@ RUN useradd --system --no-create-home --shell /usr/sbin/nologin sapl || true \ && usermod -aG nginx sapl || true # Estrutura de diretórios -RUN mkdir -p /var/interlegis/sapl /var/interlegis/sapl/data /var/interlegis/sapl/media /var/interlegis/sapl/run \ +RUN mkdir -p \ + /var/interlegis/sapl \ + /var/interlegis/sapl/data \ + /var/interlegis/sapl/media \ + /var/interlegis/sapl/run \ + /var/interlegis/sapl/tmp \ + /etc/nginx/geoip \ && chown -R root:nginx /var/interlegis/sapl /var/interlegis/sapl/run \ && chmod -R g+rwX /var/interlegis/sapl \ && chmod 2775 /var/interlegis/sapl /var/interlegis/sapl/run \ @@ -88,6 +94,35 @@ RUN if [ "$WITH_NGINX" = "1" ]; then \ cp docker/config/nginx/nginx.conf /etc/nginx/nginx.conf; \ fi +# GeoLite2-ASN database for nginx ASN-based bot blocking. +# The key is injected via BuildKit secret — it is NEVER stored in any image layer. +# +# Build command: +# DOCKER_BUILDKIT=1 docker build \ +# --secret id=maxmind_key,src=.env \ +# -f docker/Dockerfile . +# +# .env must contain: MAXMIND_LICENSE_KEY=your_key +# The weekly host cron (/etc/cron.weekly/update-geoip) refreshes the db in production. 
+# +# Pass --build-arg GEOIP_CACHE_BUST=$(date +%s) to force re-download. +ARG GEOIP_CACHE_BUST=0 +RUN --mount=type=secret,id=maxmind_key \ + if [ "$WITH_NGINX" = "1" ]; then \ + MAXMIND_LICENSE_KEY=$(grep -E '^MAXMIND_LICENSE_KEY=' /run/secrets/maxmind_key 2>/dev/null | cut -d= -f2- | tr -d '[:space:]' || true); \ + if [ -n "$MAXMIND_LICENSE_KEY" ]; then \ + tmpdir=$(mktemp -d) \ + && curl -fsSL \ + "https://download.maxmind.com/app/geoip_download?edition_id=GeoLite2-ASN&license_key=${MAXMIND_LICENSE_KEY}&suffix=tar.gz" \ + | tar -xz --strip-components=1 -C "$tmpdir" \ + && mv "$tmpdir"/*.mmdb /etc/nginx/geoip/GeoLite2-ASN.mmdb \ + && rm -rf "$tmpdir" \ + && echo "GeoLite2-ASN.mmdb downloaded successfully."; \ + else \ + echo "MAXMIND_LICENSE_KEY not set in secret — GeoLite2-ASN.mmdb skipped. Add it to .env and rebuild."; \ + fi; \ + fi + # Scripts + gunicorn.conf no diretório da app RUN install -m 755 docker/startup_scripts/start.sh /var/interlegis/sapl/start.sh \ && install -m 755 docker/startup_scripts/wait-for-pg.sh /var/interlegis/sapl/wait-for-pg.sh \ diff --git a/docker/README.md b/docker/README.md new file mode 100644 index 000000000..9f4776ad7 --- /dev/null +++ b/docker/README.md @@ -0,0 +1,107 @@ +# SAPL Docker Build + +## Building locally + +### 1. Prerequisites + +- Docker 23+ with BuildKit enabled (default since Docker 23) +- A free [MaxMind account](https://www.maxmind.com/en/geolite2/signup) with a license key + +### 2. Set your MaxMind license key + +Add the key to the project root `.env` file (already gitignored): + +``` +MAXMIND_LICENSE_KEY=your_key_here +``` + +The key is used **only at build time** to download the `GeoLite2-ASN.mmdb` database for +nginx ASN-based bot blocking. It is injected via a BuildKit secret and is **never stored +in any image layer** — it will not appear in `docker history` or any registry push. + +### 3. 
Build the image + +```bash +docker build \ + --secret id=maxmind_key,src=.env \ + -f docker/Dockerfile \ + -t sapl:local \ + . +``` + +Run from the **project root** (not from inside `docker/`), so the build context includes +the full source tree. + +#### Optional build args + +| Arg | Default | Description | +|---|---|---| +| `WITH_NGINX` | `1` | Include nginx in the image | +| `WITH_GRAPHVIZ` | `1` | Include Graphviz | +| `WITH_POPPLER` | `1` | Include Poppler (PDF utilities) | +| `WITH_PSQL_CLIENT` | `1` | Include `psql` client | + +Example — build without Graphviz: + +```bash +docker build \ + --secret id=maxmind_key,src=.env \ + --build-arg WITH_GRAPHVIZ=0 \ + -f docker/Dockerfile \ + -t sapl:local \ + . +``` + +### 4. If the MaxMind key is not provided + +The build will succeed but nginx will log an error on startup because +`/etc/nginx/geoip/GeoLite2-ASN.mmdb` will be missing. ASN-based bot blocking will +be inactive. All other Phase 0 mitigations (UA blocklist, rate limits, ETags) still apply. + +You can mount the database file at runtime as a workaround: + +```bash +docker run \ + -v /path/to/GeoLite2-ASN.mmdb:/etc/nginx/geoip/GeoLite2-ASN.mmdb:ro \ + sapl:local +``` + +--- + +## Production — Harbor + +Official images are built and pushed through **Harbor**. Before the next release, configure +the MaxMind license key as a build secret in the Harbor / CI pipeline: + +1. Add `MAXMIND_LICENSE_KEY` as a **masked CI/CD secret** in the Harbor build project + (do not put it in any Helm values file or ConfigMap). +2. Pass it to the build step: + ```bash + docker build \ + --secret id=maxmind_key,env=MAXMIND_LICENSE_KEY \ + -f docker/Dockerfile \ + -t harbor.your-registry/sapl/sapl:$VERSION \ + . + ``` + Note: `env=` variant reads the secret from an environment variable instead of a file — + useful in CI where `.env` files are not present. +3. Push as normal — the key will not be present in the pushed image. 
+ +### Keeping GeoLite2-ASN up to date + +MaxMind updates the database every Tuesday. On production hosts, install the weekly refresh +cron (run as root): + +```bash +cat > /etc/cron.weekly/update-geoip << 'EOF' +#!/bin/bash +MAXMIND_KEY="$(kubectl get secret sapl-build-secrets -n interlegis-infra \ + -o jsonpath='{.data.MAXMIND_LICENSE_KEY}' | base64 -d)" +curl -fsSL \ + "https://download.maxmind.com/app/geoip_download?edition_id=GeoLite2-ASN&license_key=${MAXMIND_KEY}&suffix=tar.gz" \ + | tar -xz -C /tmp --wildcards '*.mmdb' +mv /tmp/GeoLite2-ASN_*/GeoLite2-ASN.mmdb /etc/nginx/geoip/GeoLite2-ASN.mmdb +nginx -s reload +EOF +chmod +x /etc/cron.weekly/update-geoip +``` diff --git a/docker/config/nginx/nginx.conf b/docker/config/nginx/nginx.conf index e002a6905..ab18f7540 100644 --- a/docker/config/nginx/nginx.conf +++ b/docker/config/nginx/nginx.conf @@ -1,3 +1,5 @@ +load_module modules/ngx_http_geoip2_module.so; + user www-data nginx; worker_processes 1; @@ -14,20 +16,88 @@ http { include /etc/nginx/mime.types; default_type application/octet-stream; + # ---------------------------------------------------------------- + # Real client IP extracted from X-Forwarded-For set by K8s Ingress. 
+ # ---------------------------------------------------------------- + real_ip_header X-Forwarded-For; + real_ip_recursive on; + set_real_ip_from 10.0.0.0/8; + set_real_ip_from 172.16.0.0/12; + set_real_ip_from 192.168.0.0/16; + set_real_ip_from 127.0.0.1; + log_format main '$remote_addr - $remote_user [$time_local] "$request" ' '$status $body_bytes_sent "$http_referer" ' - '"$http_user_agent" "$http_x_forwarded_for"'; + '"$http_user_agent" "$http_x_forwarded_for" ' + 'rt=$request_time'; access_log /var/log/nginx/access.log main; - sendfile off; - #tcp_nopush on; + # ---------------------------------------------------------------- + # FIX: kernel bypass — was off (disables zero-copy file serving) + # ---------------------------------------------------------------- + sendfile on; + tcp_nopush on; + tcp_nodelay on; + + # ---------------------------------------------------------------- + # Timeouts — reduced from 300s to prevent bots holding threads. + # Per-location overrides in sapl.conf handle legitimate slow ops. + # ---------------------------------------------------------------- + keepalive_timeout 75; # was 300 + proxy_connect_timeout 10s; + proxy_read_timeout 120s; # was 300s — overridden per-location + proxy_send_timeout 120s; + + # ---------------------------------------------------------------- + # Rate limiting zones (effective once real_ip is resolved). + # sapl_general : 30 req/min for most traffic + # sapl_heavy : 10 req/min for PDF/report endpoints + # ---------------------------------------------------------------- + limit_req_zone $binary_remote_addr zone=sapl_general:20m rate=30r/m; + limit_req_zone $binary_remote_addr zone=sapl_heavy:20m rate=10r/m; - keepalive_timeout 300; + # ---------------------------------------------------------------- + # ASN-Based Blocking (datacenter / scraper ASNs). + # Requires libnginx-mod-http-geoip2 and GeoLite2-ASN.mmdb. + # See rate-limiter-v2.md Phase 0 §3.4 for install instructions. 
+ # ---------------------------------------------------------------- + geoip2 /etc/nginx/geoip/GeoLite2-ASN.mmdb { + $geoip2_asn_number autonomous_system_number; + $geoip2_asn_org autonomous_system_organization; + } - proxy_connect_timeout 75s; - proxy_read_timeout 300s; + map $geoip2_asn_number $bot_asn { + default 0; + 16509 1; # Amazon AWS + 14618 1; # Amazon AWS us-east + 8075 1; # Microsoft Azure + 396982 1; # Google Cloud + 20473 1; # Vultr + 24940 1; # Hetzner + 16276 1; # OVH + 36352 1; # ColoCrossing + 63949 1; # Linode / Akamai + } + # ---------------------------------------------------------------- + # Bot blocking by User-Agent. + # Chrome/98.0.4758 is a confirmed scraper (no real user runs a + # 2022 browser version in 2026). Googlebot excluded for SEO. + # ---------------------------------------------------------------- + map $http_user_agent $bot_ua_blocked { + default 0; + "~*GPTBot" 1; + "~*ClaudeBot" 1; + "~*PerplexityBot" 1; + "~*Bytespider" 1; + "~*AhrefsBot" 1; + "~*SemrushBot" 1; + "~*DotBot" 1; + "~*meta-externalagent" 1; + "~*OAI-SearchBot" 1; + "~*Chrome/98\.0\.4758" 1; + } gzip on; gzip_disable "MSIE [1-6]\\.(?!.*SV1)"; diff --git a/docker/config/nginx/sapl.conf b/docker/config/nginx/sapl.conf index 015538c96..16d26e7c7 100644 --- a/docker/config/nginx/sapl.conf +++ b/docker/config/nginx/sapl.conf @@ -1,10 +1,8 @@ upstream sapl_server { - - server unix:/var/interlegis/sapl/run/gunicorn.sock fail_timeout=0; - + server unix:/var/interlegis/sapl/run/gunicorn.sock fail_timeout=0; } -# Se o cliente já manda X-Request-ID, reaproveita; senão, usa $request_id (nginx) +# Reuse X-Request-ID from ingress if present; otherwise generate one. map $http_x_request_id $req_id { default $http_x_request_id; "" $request_id; @@ -18,52 +16,144 @@ server { client_max_body_size 4G; + # ---------------------------------------------------------------- + # Block known scraper ASNs (datacenter traffic) — zero Python cost. 
+ # ---------------------------------------------------------------- + if ($bot_asn = 1) { + return 429 "Too Many Requests"; + } + + # ---------------------------------------------------------------- + # Block known bots by User-Agent — zero Python cost. + # ---------------------------------------------------------------- + if ($bot_ua_blocked = 1) { + return 429 "Too Many Requests"; + } + + # ---------------------------------------------------------------- + # robots.txt served directly by nginx. + # ---------------------------------------------------------------- + location = /robots.txt { + alias /var/interlegis/sapl/collected_static/robots.txt; + } + + # ---------------------------------------------------------------- + # Static files — no rate limiting, no proxy. + # ---------------------------------------------------------------- + location /static/ { + alias /var/interlegis/sapl/collected_static/; + } + + # ---------------------------------------------------------------- + # Media files — FIX: add ETags and Cache-Control headers. + # sendfile on + etag on converts repeat bot requests to 304s. + # ---------------------------------------------------------------- + location /media/ { + alias /var/interlegis/sapl/media/; + sendfile on; + etag on; + add_header Cache-Control "public, max-age=86400, stale-while-revalidate=3600"; + add_header X-Robots-Tag "noindex" always; + } + + # Private documents — X-Accel-Redirect after auth check in Django. + location /media/documentos_privados/ { + internal; + alias /var/interlegis/sapl/media/documentos_privados/; + } + + # ---------------------------------------------------------------- + # /relatorios/ — heaviest endpoint (PDF generation). + # Tighter rate limit; extended timeout for uncached generation. 
+ # ---------------------------------------------------------------- + location /relatorios/ { + limit_req zone=sapl_heavy burst=5 nodelay; + limit_req_status 429; + + proxy_read_timeout 180s; + proxy_send_timeout 180s; + + proxy_set_header X-Request-ID $req_id; + proxy_set_header X-Forwarded-For $proxy_add_x_forwarded_for; + proxy_set_header X-Forwarded-Proto $scheme; + proxy_set_header Host $http_host; + proxy_redirect off; + proxy_pass http://sapl_server; + } + + # ---------------------------------------------------------------- + # Upload endpoints — nginx buffers the full upload before forwarding. + # Protects workers from slow municipal-link clients uploading 150 MB. + # ---------------------------------------------------------------- + location ~* ^/(protocoloadm/criar-protocolo|materia/.*upload|norma/.*upload) { + proxy_request_buffering on; + proxy_read_timeout 180s; + proxy_send_timeout 180s; + + proxy_set_header X-Request-ID $req_id; + proxy_set_header X-Forwarded-For $proxy_add_x_forwarded_for; + proxy_set_header X-Forwarded-Proto $scheme; + proxy_set_header Host $http_host; + proxy_redirect off; + proxy_pass http://sapl_server; + } + + # ---------------------------------------------------------------- + # /api/ — rate limited, CORS maintained from original config. 
+ # ---------------------------------------------------------------- location /api/ { + limit_req zone=sapl_general burst=30 nodelay; + limit_req_status 429; + add_header 'Access-Control-Allow-Origin' '*'; add_header 'Access-Control-Allow-Credentials' 'true'; add_header 'Access-Control-Allow-Methods' 'GET, POST, PUT, DELETE, HEAD, OPTIONS'; add_header 'Access-Control-Allow-Headers' 'Access-Control-Allow-Origin,XMLHttpRequest,Accept,Authorization,Cache-Control,Content-Type,DNT,If-Modified-Since,Keep-Alive,Origin,User-Agent,X-Mx-ReqToken,X-Requested-With'; add_header 'Access-Control-Expose-Headers' 'Access-Control-Allow-Origin,XMLHttpRequest,Accept,Authorization,Cache-Control,Content-Type,DNT,If-Modified-Since,Keep-Alive,Origin,User-Agent,X-Mx-ReqToken,X-Requested-With'; -# handle the browser's preflight steps - if ($request_method = 'OPTIONS') { - add_header 'Access-Control-Allow-Origin' '*'; - add_header 'Access-Control-Allow-Methods' 'GET, POST, PUT, DELETE, HEAD, OPTIONS'; - add_header 'Access-Control-Allow-Headers' 'Authorization,Accept,DNT,X-CustomHeader,Keep-Alive,User-Agent,X-Requested-With,If-Modified-Since,Cache-Control,Content-Type,Content-Range,Range'; - add_header 'Access-Control-Expose-Headers' 'DNT,X-CustomHeader,Keep-Alive,User-Agent,X-Requested-With,If-Modified-Since,Cache-Control,Content-Type,Content-Range,Range'; - add_header 'Access-Control-Max-Age' 1728000; - add_header 'Content-Type' 'text/plain; charset=utf-8'; - add_header 'Content-Length' 0; - return 204; + if ($request_method = 'OPTIONS') { + add_header 'Access-Control-Allow-Origin' '*'; + add_header 'Access-Control-Allow-Methods' 'GET, POST, PUT, DELETE, HEAD, OPTIONS'; + add_header 'Access-Control-Allow-Headers' 'Authorization,Accept,DNT,X-CustomHeader,Keep-Alive,User-Agent,X-Requested-With,If-Modified-Since,Cache-Control,Content-Type,Content-Range,Range'; + add_header 'Access-Control-Expose-Headers' 
'DNT,X-CustomHeader,Keep-Alive,User-Agent,X-Requested-With,If-Modified-Since,Cache-Control,Content-Type,Content-Range,Range'; + add_header 'Access-Control-Max-Age' 1728000; + add_header 'Content-Type' 'text/plain; charset=utf-8'; + add_header 'Content-Length' 0; + return 204; } - proxy_set_header X-Request-ID $req_id; - proxy_set_header X-Forwarded-For $proxy_add_x_forwarded_for; + proxy_set_header X-Request-ID $req_id; + proxy_set_header X-Forwarded-For $proxy_add_x_forwarded_for; proxy_set_header X-Forwarded-Proto $scheme; - proxy_set_header Host $http_host; + proxy_set_header Host $http_host; proxy_redirect off; proxy_pass http://sapl_server; } - location /static/ { - alias /var/interlegis/sapl/collected_static/; - } - - location /media/ { - alias /var/interlegis/sapl/media/; - } - + # ---------------------------------------------------------------- + # General traffic — moderate rate limit. + # ---------------------------------------------------------------- location / { - proxy_set_header X-Request-ID $req_id; - proxy_set_header X-Forwarded-For $proxy_add_x_forwarded_for; + limit_req zone=sapl_general burst=20 nodelay; + limit_req_status 429; + + proxy_set_header X-Request-ID $req_id; + proxy_set_header X-Forwarded-For $proxy_add_x_forwarded_for; proxy_set_header X-Forwarded-Proto $scheme; - proxy_set_header Host $http_host; + proxy_set_header Host $http_host; proxy_redirect off; proxy_pass http://sapl_server; } + error_page 429 /429.html; + location = /429.html { + root /var/interlegis/sapl/sapl/static/; + internal; + } + error_page 500 502 503 504 /500.html; location = /500.html { root /var/interlegis/sapl/sapl/static/; + internal; } } diff --git a/docker/docker-compose.yaml b/docker/docker-compose.yaml index dc8559812..69e3559da 100644 --- a/docker/docker-compose.yaml +++ b/docker/docker-compose.yaml @@ -33,7 +33,7 @@ services: networks: - sapl-net sapl: - image: interlegis/sapl:3.1.165-RC2 + image: sapl:local # build: # context: ../ # dockerfile: 
./docker/Dockerfile diff --git a/docker/startup_scripts/gunicorn.conf.py b/docker/startup_scripts/gunicorn.conf.py index 6bdcacb02..795a1d817 100644 --- a/docker/startup_scripts/gunicorn.conf.py +++ b/docker/startup_scripts/gunicorn.conf.py @@ -10,9 +10,9 @@ DJANGODIR = "/var/interlegis/sapl" SOCKFILE = f"unix:{DJANGODIR}/run/gunicorn.sock" USER = "sapl" GROUP = "nginx" -NUM_WORKERS = int(os.getenv("WEB_CONCURRENCY", "3")) -THREADS = int(os.getenv("GUNICORN_THREADS", "8")) -TIMEOUT = int(os.getenv("GUNICORN_TIMEOUT", "300")) +NUM_WORKERS = int(os.getenv("WEB_CONCURRENCY", "2")) # was 3 +THREADS = int(os.getenv("GUNICORN_THREADS", "4")) # was 8 +TIMEOUT = int(os.getenv("GUNICORN_TIMEOUT", "120")) # was 300 MAX_REQUESTS = 1000 WORKER_CLASS = "gthread" DJANGO_SETTINGS = "sapl.settings" @@ -36,7 +36,7 @@ chdir = DJANGODIR wsgi_app = WSGI_APP # Logs -loglevel = "debug" +loglevel = "info" # was debug — reduces log I/O accesslog = "/var/log/sapl/access.log" errorlog = "/var/log/sapl/error.log" # errorlog = "-" # send to stderr (so you see it in docker logs or terminal) @@ -53,7 +53,7 @@ keepalive = 10 backlog = 2048 max_requests = MAX_REQUESTS max_requests_jitter = 200 -worker_max_memory_per_child = 300 * 1024 * 1024 # 300 MB cap +worker_max_memory_per_child = 400 * 1024 * 1024 # 400 MB — was 300 MB # Environment (same as exporting before running) raw_env = [ diff --git a/rate-limiter-v2.md b/rate-limiter-v2.md new file mode 100644 index 000000000..33c05124a --- /dev/null +++ b/rate-limiter-v2.md @@ -0,0 +1,1231 @@ +# SAPL — OOM Investigation & Remediation Plan (v2) + +> **Scope**: Django 2.2 / Gunicorn / nginx / Kubernetes fleet of 1,200+ pods. +> Each pod has a dedicated PostgreSQL instance. A K8s Ingress sits in front of all tenants. +> **This document is canonical** — all earlier session notes are consolidated here. + +--- + +## Table of Contents + +1. [Architecture Overview](#0-architecture-overview) +2. 
[Context & Problem Statement](#1-context--problem-statement) +3. [Decision Log](#2-decision-log) +4. [Phase 0 — Immediate Hardening (No New Infra)](#3-phase-0--immediate-hardening-no-new-infra) +5. [Phase 1 — Shared Redis (Single Pod)](#4-phase-1--shared-redis-single-pod) +6. [Phase 2 — Rate Limiting & Bot Mitigation](#5-phase-2--rate-limiting--bot-mitigation) +7. [Phase 3 — File Serving Corrections](#6-phase-3--file-serving-corrections) +8. [Phase 4 — Dynamic Page Caching](#7-phase-4--dynamic-page-caching) +9. [Phase 5 — Async PDF & WebSocket (Follow-up)](#8-phase-5--async-pdf--websocket-follow-up) +10. [Open Questions](#9-open-questions) + +--- + +## 0. Architecture Overview + +### 0.1 Component Diagram + +```mermaid +graph TD + Client([Bot / Human Client]) + nginx[nginx\nDebian pkg] + gunicorn[Gunicorn\n2 workers / 4 threads] + mw[Django Middleware\nRateLimitMiddleware] + view[View Layer\nCBV + decorators] + redis[(Redis\nDB0: cache\nDB1: rate limiter)] + pg[(PostgreSQL\nper-pod)] + fs[Filesystem\nPDFs / media] + + Client -->|HTTP| nginx + nginx -->|proxy_pass| gunicorn + gunicorn --> mw + mw -->|pass| view + mw -->|429| nginx + view --> pg + view --> fs + view --> redis + mw --> redis + nginx -->|SISMEMBER / GET| redis +``` + +> DB2 is reserved for Django Channels (WebSocket — future Phase 5). + +### 0.2 Redis Memory Budget and Key Layout + +| Key type | Key schema | TTL | DB | Est. 
size | +|---|---|---|---|---| +| Static cache (images/logos) | `static:{ns}:{sha256}` | 3–24 h | 0 | ~2.4 GB | +| PDF cache (≤ 360 KB) | `file:{ns}:{sha256}` | 1 h | 0 | ~0.9 GB | +| IP request counter | `rl:ip:{ip}:reqs` | 60 s | 1 | ~0.6 MB | +| IP blocked marker | `rl:ip:{ip}:blocked` | 300 s | 1 | ~0.06 MB | +| User request counter | `rl:{ns}:user:{id}:reqs` | 60 s | 1 | negligible | +| User blocked marker | `rl:{ns}:user:{id}:blocked` | 300 s | 1 | negligible | +| Path counter | `rl:{ns}:path:{sha256}:reqs` | 60 s | 1 | ~0.3 MB | +| UA deny list | `rl:bot:ua:blocked` | permanent SET | 1 | ~0.03 MB | +| NS/IP/window counter | `rl:ns:{ns}:ip:{ip}:w:{bucket}` | 60 s × 2 | 1 | ~0.6 MB | +| **Redis overhead (× 1.5)** | | | | ~1.6 GB | +| **Total ceiling** | | | | **~5 GB** | + +**Key conventions:** +- `{ns}` = Kubernetes namespace (tenant identifier). All path and user keys include it. +- `{user}` / `{id}` = normalized user PK: `str(user.pk).lower().strip()`. +- Django `CACHES` uses `KEY_PREFIX: "sapl"` to namespace DB0 cache keys. + DB1 (rate limiter) uses raw keys — no prefix — for compatibility with the Lua / middleware INCR scripts. +- DB2 is reserved for Django Channels; allocate separately when WebSocket work resumes. + +--- + +## 1. Context & Problem Statement + +### Fleet + +| Item | Detail | +|---|---| +| System | SAPL — Django 2.2, legislative management for Brazilian municipal chambers | +| Fleet | ~1,200 Kubernetes pods, each with a dedicated PostgreSQL pod | +| Pod limits | 1 core CPU (limit) / 35m (request) · 1600Mi RAM (limit) / 800Mi (request) | +| Users | Legislative house staff, often behind NAT (many users, one public IP) | +| Workloads | PDF generation (synchronous, ReportLab), file uploads up to 150 MB, WebSocket voting panel | + +### OOM Kill Pattern + +Workers grow from ~35 MB at birth to 800–900 MB within 2–3 minutes, then are killed and replaced in a continuous cycle. 
+ +Root causes: +- Bot scraping triggers synchronous PDF generation — entire document built in RAM (ReportLab) +- `worker_max_memory_per_child` only checks **between requests**; workers blocked on long requests are never recycled +- `TIMEOUT=300` lets bots hold threads for up to 5 minutes while memory accumulates +- 3 workers × 300 MB each = ~900 MB — breaching the 800Mi request threshold + +### Bot Traffic Profile (Barueri pod, 16 days, 662k requests) + +| Actor | Requests | % of total | +|---|---|---| +| Googlebot | ~154,000 | 23.2% | +| Chrome/98.0.4758 (spoofed scraper) | 90,774 | 13.7% | +| kube-probe (healthcheck) | 69,065 | 10.4% | +| meta-externalagent | 28,325 | 4.3% | +| GPTBot | 11,489 | 1.7% | +| bingbot | 7,639 | 1.1% | +| OAI-SearchBot + Applebot | 6,681 | 1.0% | +| **Total identified bots** | **~377,000** | **~56.9%** | + +**Botnet fingerprint:** +- Rotates User-Agents (Chrome/121, Chrome/122, Firefox/123, Safari/17…) across requests +- Crawls all sub-endpoints of the same matéria within 1 second from different IPs +- Distributes crawling across tenants — each pod stays under the per-pod rate limit, never triggering it +- Primary targets: `/relatorios/{id}/etiqueta-materia-legislativa` (~40 KB PDF) and all `/materia/{id}/*` sub-endpoints + +### Static File Traffic (from CSV analysis) + +| Category | Requests | Transfers | +|---|---|---| +| Logos / images | 62,776 | ~24 GB | +| PDFs | 8,869 | 5.1 GB | +| Parliamentarian photos | 11,856 | ~0.5 GB | +| **Total** | **83,501** | **~30 GB** | + +Top offender: `Brasão - Foz do Iguaçu.png` — 14,512 requests, 5.6 GB from a single 392 KB file. 
+
+### Confirmed Bugs
+
+```nginx
+# nginx.conf — WRONG (disables zero-copy sendfile(2): every file byte is
+# copied up through userspace instead of being sent directly by the kernel)
+sendfile off;
+
+# sapl.conf — missing on /media/ location
+location /media/ {
+    alias /var/interlegis/sapl/media/;
+    # no ETag, no Cache-Control, no X-Robots-Tag
+}
+```
+
+```python
+# settings.py — per-pod cache, not shared
+CACHES = {
+    'default': {
+        'BACKEND': 'django.core.cache.backends.filebased.FileBasedCache',
+        'LOCATION': '/var/tmp/django_cache',
+        'OPTIONS': {"MAX_ENTRIES": 10000},
+    }
+}
+```
+
+Django rate limiter (`django-ratelimit` at 35/m) uses `FileBasedCache` — counters are isolated per pod, making rate limiting completely ineffective at fleet scale.
+
+### Hard Constraints
+
+| Constraint | Impact |
+|---|---|
+| Per-pod PostgreSQL | Rate-limit counters not shared across pods |
+| No Redis initially | No shared state for rate limiting or caching |
+| NAT environments | IP-based rate limiting causes false positives |
+| `TIMEOUT=300` / uploads to 150 MB | Must not be broken — intentional for slow workflows |
+
+---
+
+## 2. 
Decision Log + +| Decision | Chosen | Rationale | Session | +|---|---|---|---| +| Redis topology | **Single pod** (no Sentinel, no Cluster) | 65 MB of active data fits comfortably on one node; cluster complexity not justified at this data volume | v2 | +| PDF caching in Redis | **No** — ETags + sendfile are sufficient | Once rate limiting + ETags are active, repeat requests become 304s with zero bytes transferred | Session 4 | +| nginx rate-limit end state | **Django middleware** with shared Redis | No nginx image changes required; solves cross-pod consistency immediately | Session 5 | +| `worker_max_memory_per_child` | **400 MB** | Pod limit 1600Mi, 2 workers × 400 MB = 800 MB — leaves 800 Mi headroom; previous 300 MB was OOMKilled before recycling could act | v2 | +| `sendfile off` | **Bug** — flip to `on` | No valid production reason found in uploaded config; disabling userspace copy is always correct | Session 5 | +| nginx serves `/media/` directly | Confirmed via `alias` in `sapl.conf` | `X-Accel-Redirect` only needed for LGPD-restricted documents | Session 5 | +| Cache backend switch timing | **At pod startup** via `start.sh` + waffle switch | Pod restart is acceptable; avoids per-request runtime overhead | Session 5 | +| Secret injection | Per-namespace Secret with `optional: true` | Enables gradual rollout; pod starts on file cache if Secret is absent | Session 5 | +| Redis k8s files location | `$PROJECT_ROOT/docker/k8s/` | Consistent with existing Docker artifacts in the repo | v2 | + +--- + +## 3. Phase 0 — Immediate Hardening (No New Infra) + +**Goal**: Stop the OOM kill cycle and reduce bot load with zero infrastructure additions. +**Risk**: Low — all changes are config-only. + +### 3.1 Gunicorn Tuning + +The core tension: reducing workers protects memory but reduces concurrency. The fix is to reduce the **number** of workers (from 3 to 2) and raise the per-worker **ceiling** so the recycling mechanism has time to act. 
+```python
+# docker/startup_scripts/gunicorn.conf.py
+import os
+import pathlib
+
+NAME = "SAPL"
+DJANGODIR = "/var/interlegis/sapl"
+SOCKFILE = f"unix:{DJANGODIR}/run/gunicorn.sock"
+USER = "sapl"
+GROUP = "nginx"
+
+NUM_WORKERS = int(os.getenv("WEB_CONCURRENCY", "2"))   # was 3
+THREADS = int(os.getenv("GUNICORN_THREADS", "4"))      # was 8
+TIMEOUT = int(os.getenv("GUNICORN_TIMEOUT", "120"))    # was 300
+WORKER_CLASS = "gthread"
+DJANGO_SETTINGS = "sapl.settings"
+WSGI_APP = "sapl.wsgi:application"
+
+proc_name = NAME
+bind = SOCKFILE
+umask = 0o007
+user = USER
+group = GROUP
+chdir = DJANGODIR
+wsgi_app = WSGI_APP
+
+loglevel = "info"  # was debug — reduces log I/O
+accesslog = "/var/log/sapl/access.log"
+errorlog = "/var/log/sapl/error.log"
+capture_output = True
+
+workers = NUM_WORKERS
+worker_class = WORKER_CLASS
+threads = THREADS
+timeout = TIMEOUT
+graceful_timeout = 30
+keepalive = 10
+backlog = 2048
+
+max_requests = 1000
+max_requests_jitter = 200
+worker_max_memory_per_child = 400 * 1024 * 1024  # 400 MB — was 300 MB
+
+raw_env = [f"DJANGO_SETTINGS_MODULE={DJANGO_SETTINGS}"]
+preload_app = False
+
+def on_starting(server):
+    # SOCKFILE carries gunicorn's "unix:" scheme prefix; strip it before
+    # touching the filesystem — pathlib.Path("unix:/...") is a *relative*
+    # path, so Path(SOCKFILE).parent.mkdir() would create a junk "unix:"
+    # directory instead of ensuring the real run/ directory exists.
+    sock_path = pathlib.Path(SOCKFILE.split("unix:", 1)[-1])
+    sock_path.parent.mkdir(parents=True, exist_ok=True)
+
+def post_fork(server, worker):
+    try:
+        from django import db
+        db.connections.close_all()
+    except Exception:
+        pass
+```
+
+**Per-location timeout strategy** — replace the one-size-fits-all 300s:
+
+| Operation | Previous | Recommended | Rationale |
+|---|---|---|---|
+| Normal page rendering | 300 s | 60 s | No legitimate page should take > 60 s |
+| API endpoints | 300 s | 30 s | Stateless, fast by design |
+| PDF download (cached / nginx) | 300 s | 30 s | nginx serves from disk, worker not involved |
+| PDF generation (uncached) | 300 s | 180 s | Kept high — addressed in Phase 5 |
+| Large file upload | 300 s | 180 s | nginx buffers upload, worker processes after |
+
+---
+
+### 3.2 nginx Fixes
+
+Three confirmed bugs in the uploaded config — all fixed here. 
+ +```nginx +# /etc/nginx/nginx.conf — http {} block + +# FIX 1: kernel bypass (was off — CRITICAL) +sendfile on; +tcp_nopush on; +tcp_nodelay on; + +# FIX 2: reduced timeouts (was 300s everywhere) +keepalive_timeout 75; +proxy_read_timeout 120s; # overridden per-location for slow ops +proxy_connect_timeout 10s; +proxy_send_timeout 120s; + +# Real client IP from X-Forwarded-For set by K8s Ingress +real_ip_header X-Forwarded-For; +real_ip_recursive on; +set_real_ip_from 10.0.0.0/8; +set_real_ip_from 172.16.0.0/12; +set_real_ip_from 192.168.0.0/16; +``` + +```nginx +# sapl.conf — FIX 3: add caching headers to /media/ +location /media/ { + alias /var/interlegis/sapl/media/; + sendfile on; + etag on; + add_header Cache-Control "public, max-age=86400, stale-while-revalidate=3600"; + add_header X-Robots-Tag "noindex" always; +} +``` + +**Upload endpoints** — keep `proxy_request_buffering on` so nginx absorbs slow uploads before handing off to Gunicorn: + +```nginx +location ~* ^/(protocoloadm/criar-protocolo|materia/.*upload|norma/.*upload) { + proxy_request_buffering on; + proxy_read_timeout 180s; + proxy_send_timeout 180s; + proxy_set_header X-Forwarded-For $proxy_add_x_forwarded_for; + proxy_set_header X-Forwarded-Proto $scheme; + proxy_set_header Host $http_host; + proxy_redirect off; + proxy_pass http://sapl_server; +} +``` + +--- + +### 3.3 Bot UA Blocklist in nginx + +Blocks known bots at nginx — before any Gunicorn worker is allocated. 
+
+```nginx
+# nginx.conf — http {} block
+map $http_user_agent $bot_ua_blocked {
+    default 0;
+    "~*GPTBot" 1;
+    "~*ClaudeBot" 1;
+    "~*PerplexityBot" 1;
+    "~*Bytespider" 1;
+    "~*AhrefsBot" 1;
+    "~*SemrushBot" 1;
+    "~*DotBot" 1;
+    "~*meta-externalagent" 1;
+    "~*OAI-SearchBot" 1;
+    "~*Chrome/98\.0\.4758" 1; # confirmed scraper — no real user runs a 2022 browser in 2026
+}
+
+# sapl.conf — server {} block (before any location)
+if ($bot_ua_blocked = 1) {
+    return 429 "Too Many Requests";
+}
+```
+
+**Limitation**: Bots with rotating or spoofed UAs are not caught here. They are handled by Django middleware in Phase 2 (checks 3–5). This is intentional — nginx handles the cheap deterministic case; Django handles the expensive probabilistic case.
+
+---
+
+### 3.4 ASN-Based Blocking (Mandatory)
+
+Blocks bot traffic by datacenter ASN — before UA parsing, before any Python process is touched.
+
+**Step 1 — install the GeoIP2 module and database:**
+
+```bash
+# Debian / Ubuntu
+apt install libnginx-mod-http-geoip2 libmaxminddb0 mmdb-bin
+
+# Download GeoLite2-ASN (free MaxMind account required)
+# NB: -C must precede the member pattern — GNU tar applies -C positionally,
+# so placing it after '*.mmdb' would extract into the current directory.
+mkdir -p /etc/nginx/geoip
+curl -sL "https://download.maxmind.com/app/geoip_download?edition_id=GeoLite2-ASN&license_key=YOUR_KEY&suffix=tar.gz" \
+  | tar -xz -C /etc/nginx/geoip/ --strip-components=1 --wildcards '*.mmdb'
+```
+
+**Step 2 — configure nginx:**
+
+```nginx
+# nginx.conf — top-level (outside http {})
+load_module modules/ngx_http_geoip2_module.so;
+
+# nginx.conf — http {} block
+geoip2 /etc/nginx/geoip/GeoLite2-ASN.mmdb {
+    $geoip2_asn_number autonomous_system_number;
+    $geoip2_asn_org autonomous_system_organization;
+}
+
+map $geoip2_asn_number $bot_asn {
+    default 0;
+    16509 1; # Amazon AWS
+    14618 1; # Amazon AWS us-east
+    8075 1; # Microsoft Azure
+    396982 1; # Google Cloud
+    20473 1; # Vultr
+    24940 1; # Hetzner
+    16276 1; # OVH
+    36352 1; # ColoCrossing
+    63949 1; # Linode / Akamai
+}
+
+# sapl.conf — server {} block (before bot_ua_blocked check)
+if ($bot_asn
= 1) {
+    return 429 "Too Many Requests";
+}
+```
+
+**Step 3 — keep the database fresh** (host cron — no k8s CronJob):
+
+```bash
+#!/bin/bash
+# /etc/cron.weekly/update-geoip
+curl -sL "https://download.maxmind.com/app/geoip_download?edition_id=GeoLite2-ASN&license_key=${MAXMIND_KEY}&suffix=tar.gz" \
+  | tar -xz -C /tmp --wildcards '*.mmdb'
+mv /tmp/GeoLite2-ASN_*/GeoLite2-ASN.mmdb /etc/nginx/geoip/GeoLite2-ASN.mmdb
+nginx -s reload
+```
+
+**Tradeoff**: Blocks datacenter ASNs where bots originate. May over-block VPN users and developers on cloud instances — mitigate with a per-namespace IP whitelist once available (see Open Question 2).
+
+---
+
+### 3.5 robots.txt
+
+Passive mitigation — effective over days/weeks for compliant bots. The spoofed Chrome/98 botnet ignores it; handled by nginx UA blocking above.
+
+```
+# Place at /var/interlegis/sapl/collected_static/robots.txt
+User-agent: GPTBot
+Disallow: /
+Crawl-delay: 10
+
+User-agent: ClaudeBot
+Disallow: /
+Crawl-delay: 10
+
+User-agent: meta-externalagent
+Disallow: /
+Crawl-delay: 10
+
+User-agent: OAI-SearchBot
+Disallow: /
+Crawl-delay: 10
+
+User-agent: *
+Disallow: /relatorios/
+Crawl-delay: 10
+```
+
+Serve directly from nginx (no Django involvement):
+
+```nginx
+# sapl.conf
+location = /robots.txt {
+    alias /var/interlegis/sapl/collected_static/robots.txt;
+}
+```
+
+---
+
+### 3.6 N+1 Fix in `get_etiqueta_protocolos`
+
+Confirmed in `sapl/relatorios/views.py` (`get_etiqueta_protocolos`) — `MateriaLegislativa.objects.filter()` called inside a loop over protocols.
Two queries total regardless of volume: + +```python +# BEFORE — one query per protocol (N+1) +def get_etiqueta_protocolos(prots): + protocolos = [] + for p in prots: + dic = {} + for materia in MateriaLegislativa.objects.filter( + numero_protocolo=p.numero, ano=p.ano): + dic['num_materia'] = ( + materia.tipo.sigla + ' ' + + str(materia.numero) + '/' + str(materia.ano) + ) + protocolos.append(dic) + return protocolos + + +# AFTER — two queries total regardless of volume +def get_etiqueta_protocolos(prots): + from django.db.models import Q + import functools, operator + + prot_list = list(prots) + if not prot_list: + return [] + + query = functools.reduce( + operator.or_, + [Q(numero_protocolo=p.numero, ano=p.ano) for p in prot_list] + ) + materias_map = { + (m.numero_protocolo, m.ano): m + for m in MateriaLegislativa.objects.filter(query).select_related('tipo') + } + + protocolos = [] + for p in prot_list: + dic = {} + materia = materias_map.get((p.numero, p.ano)) + dic['num_materia'] = ( + f"{materia.tipo.sigla} {materia.numero}/{materia.ano}" + if materia else '' + ) + # ... rest of existing loop body unchanged + protocolos.append(dic) + return protocolos +``` + +--- + +### 3.7 ETags / 304 Responses + +Adding `etag on` and `Cache-Control` to the `/media/` location (§3.2) converts repeat bot requests from full downloads to 304 responses with empty bodies. + +For `Brasão - Foz do Iguaçu.png` (392 KB × 14,512 requests = **5.6 GB**), even a 50% conditional hit rate saves ~2.8 GB immediately — without any Redis. + +**Why this is sufficient for PDFs**: See Phase 3 §6.2. + +--- + +### 3.8 Django Upload Settings + +```python +# sapl/settings.py +# Files above 2 MB are streamed to a temp file on disk rather than +# held in worker RAM. Critical for 150 MB upload support. 
+FILE_UPLOAD_MAX_MEMORY_SIZE = 2 * 1024 * 1024 # 2 MB +DATA_UPLOAD_MAX_MEMORY_SIZE = 10 * 1024 * 1024 # 10 MB +MAX_DOC_UPLOAD_SIZE = 150 * 1024 * 1024 # 150 MB +FILE_UPLOAD_TEMP_DIR = '/var/interlegis/sapl/tmp' +``` + +--- + +## 4. Phase 1 — Shared Redis (Single Pod) + +**Goal**: Deploy Redis so all subsequent phases have shared state. +**Risk**: Medium — new stateful infrastructure. Non-fatal fallback to file cache if Redis is unreachable. + +### 4.1 Redis Kubernetes Manifests + +Files live under `$PROJECT_ROOT/docker/k8s/`. + +```yaml +# docker/k8s/redis-configmap.yaml +apiVersion: v1 +kind: ConfigMap +metadata: + name: redis-config + namespace: redis +data: + redis.conf: | + save "" + appendonly no + + maxmemory 5gb + maxmemory-policy allkeys-lru + maxmemory-samples 10 + + maxclients 20000 + tcp-backlog 511 + timeout 300 + tcp-keepalive 60 + + hz 20 + lazyfree-lazy-eviction yes + lazyfree-lazy-expire yes + lazyfree-lazy-server-del yes + + slowlog-log-slower-than 10000 + slowlog-max-len 256 + latency-monitor-threshold 10 + + bind 0.0.0.0 + protected-mode no + databases 4 # DB0: cache, DB1: rate limiter, DB2: channels (future) + + activedefrag yes + active-defrag-ignore-bytes 100mb + active-defrag-threshold-lower 10 +``` + +```yaml +# docker/k8s/redis-pod.yaml +apiVersion: apps/v1 +kind: Deployment +metadata: + name: sapl-redis + namespace: redis +spec: + replicas: 1 + selector: + matchLabels: + app: sapl-redis + template: + metadata: + labels: + app: sapl-redis + spec: + containers: + - name: redis + image: redis:7-alpine + command: ["redis-server", "/etc/redis/redis.conf"] + resources: + requests: + memory: "1Gi" + cpu: "250m" + limits: + memory: "6Gi" + cpu: "1000m" + ports: + - containerPort: 6379 + volumeMounts: + - name: redis-config + mountPath: /etc/redis + volumes: + - name: redis-config + configMap: + name: redis-config +``` + +```yaml +# docker/k8s/redis-service.yaml +apiVersion: v1 +kind: Service +metadata: + name: sapl-redis + namespace: redis +spec: 
+ selector: + app: sapl-redis + ports: + - port: 6379 + targetPort: 6379 +``` + +**Pod budget rationale:** + +| Data type | Estimated memory | +|---|---| +| Rate limit counters (all pods, all IPs) | ~50–110 MB | +| View / template cache | ~300–600 MB | +| Small file cache (logos, etiquetas) | ~500 MB–1 GB | +| Redis overhead (× 1.5) | ~1.6 GB | +| **Total ceiling** | **~5 GB** | + +--- + +### 4.2 Use-Case / Key-Prefix Mapping + +| Use case | Key prefix | DB | TTL | Notes | +|---|---|---|---|---| +| Page / view cache | `sapl:cache:*` | 0 | 60–3600 s | `KEY_PREFIX=sapl` in Django CACHES | +| Static file cache (logos) | `static:{ns}:{sha256}` | 0 | 3–24 h | ns = namespace/tenant | +| PDF cache (≤ 360 KB) | `file:{ns}:{sha256}` | 0 | 1 h | ns required | +| Rate limiter counters | `rl:*` | 1 | 60–300 s | Raw keys, no prefix | +| UA deny list | `rl:bot:ua:blocked` | 1 | permanent SET | Seed once after deploy | +| WebSocket / Channels | `channels:*` | 2 | session TTL | **Future — Phase 5** | + +--- + +### 4.3 Django Settings — Startup-Time Backend Selection + +```python +# sapl/settings.py +REDIS_URL = config('REDIS_URL', default='') +CACHE_BACKEND = config('CACHE_BACKEND', default='file') + +_redis_ready = CACHE_BACKEND == 'redis' and bool(REDIS_URL) + +CACHES = { + 'default': { + 'BACKEND': ( + 'django_redis.cache.RedisCache' if _redis_ready + else 'django.core.cache.backends.filebased.FileBasedCache' + ), + 'LOCATION': REDIS_URL + '/0' if _redis_ready else '/var/tmp/django_cache', + 'KEY_PREFIX': 'sapl', + **( + { + 'OPTIONS': { + 'CLIENT_CLASS': 'django_redis.client.DefaultClient', + 'CONNECTION_POOL_KWARGS': { + # 1,200 pods × 2 workers × 6 = 14,400 peak connections + # maxclients=20,000 gives 40% headroom + 'max_connections': 6, + 'socket_timeout': 0.5, + 'socket_connect_timeout': 0.5, + }, + 'IGNORE_EXCEPTIONS': True, # cache miss on Redis failure — app degrades gracefully + }, + 'TIMEOUT': 300, + } if _redis_ready else { + 'OPTIONS': {'MAX_ENTRIES': 10000}, + } + 
), + }, + 'ratelimit': { + 'BACKEND': 'django_redis.cache.RedisCache', + 'LOCATION': REDIS_URL + '/1' if _redis_ready else '', + 'OPTIONS': { + 'CLIENT_CLASS': 'django_redis.client.DefaultClient', + 'CONNECTION_POOL_KWARGS': { + 'max_connections': 6, + 'socket_timeout': 0.5, + 'socket_connect_timeout': 0.5, + }, + 'IGNORE_EXCEPTIONS': True, + }, + } if _redis_ready else { + 'BACKEND': 'django.core.cache.backends.filebased.FileBasedCache', + 'LOCATION': '/var/tmp/django_ratelimit_cache', + 'OPTIONS': {'MAX_ENTRIES': 5000}, + }, +} + +RATELIMIT_USE_CACHE = 'ratelimit' +``` + +`start.sh` additions — resolve URL and read waffle switch before Gunicorn starts: + +```bash +resolve_redis_url() { + # 1. Already set by local Secret via envFrom — highest precedence + [[ -n "${REDIS_URL:-}" ]] && { log "REDIS_URL from local secret."; return 0; } + + # 2. Try global cluster Secret via k8s API + local api="https://kubernetes.default.svc" + local token ca + token="$(<'/var/run/secrets/kubernetes.io/serviceaccount/token')" + ca="/var/run/secrets/kubernetes.io/serviceaccount/ca.crt" + + local url + url=$(curl -sf --cacert "$ca" \ + -H "Authorization: Bearer $token" \ + "${api}/api/v1/namespaces/interlegis-infra/secrets/sapl-global-redis" \ + | python3 -c " +import sys, json, base64 +d = json.load(sys.stdin).get('data', {}) +v = d.get('REDIS_URL', '') +print(base64.b64decode(v).decode() if v else '') +" 2>/dev/null || echo "") + + if [[ -n "$url" ]]; then + export REDIS_URL="$url" + log "REDIS_URL from global cluster secret." + return 0 + fi + log "No REDIS_URL found — file-based cache will be used." +} + +resolve_cache_backend() { + [[ -z "${REDIS_URL:-}" ]] && return 0 + log "REDIS_URL set — checking REDIS_CACHE waffle switch..." 
+ local active + active=$(psql "$DATABASE_URL" -At -v ON_ERROR_STOP=0 -c \ + "SELECT active FROM waffle_switch WHERE name='REDIS_CACHE' LIMIT 1;" \ + 2>/dev/null || echo "") + if [[ "$active" == "t" ]]; then + log "REDIS_CACHE switch ON — activating Redis cache backend." + export CACHE_BACKEND="redis" + else + log "REDIS_CACHE switch OFF — using file-based cache." + export CACHE_BACKEND="file" + fi +} + +wait_for_redis() { + [[ -z "${REDIS_URL:-}" ]] && return 0 + log "Checking Redis connectivity..." + local host port + host=$(python3 -c "from urllib.parse import urlparse; u=urlparse('${REDIS_URL}'); print(u.hostname or 'localhost')") + port=$(python3 -c "from urllib.parse import urlparse; u=urlparse('${REDIS_URL}'); print(u.port or 6379)") + local retries=10 + until python3 -c "import socket; s=socket.create_connection(('${host}',${port}),2); s.close()" 2>/dev/null; do + retries=$((retries-1)) + [[ $retries -eq 0 ]] && { log "WARNING: Redis unreachable — continuing on file cache."; return 0; } + log "Waiting for Redis... ($retries retries left)" + sleep 2 + done + log "Redis reachable at ${host}:${port}." 
+} + +configure_redis_cache() { + [[ -z "${REDIS_URL:-}" ]] && return 0 + log "Creating REDIS_CACHE waffle switch (default: off)" + python3 manage.py waffle_switch REDIS_CACHE off --create +} +``` + +--- + +### 4.4 Rollout Sequence + +```bash +# Enable Redis for one namespace +kubectl create secret generic sapl-redis \ + --namespace=fortaleza-ce \ + --from-literal=REDIS_URL="redis://sapl-redis.redis.svc.cluster.local:6379" \ + --dry-run=client -o yaml | kubectl apply -f - + +kubectl exec -n fortaleza-ce deploy/sapl -- \ + python manage.py waffle_switch REDIS_CACHE on --create + +kubectl rollout restart deployment/sapl -n fortaleza-ce + +# Disable without removing secret +kubectl exec -n fortaleza-ce deploy/sapl -- \ + python manage.py waffle_switch REDIS_CACHE off +kubectl rollout restart deployment/sapl -n fortaleza-ce + +# Fleet-wide rollout (parallel) +kubectl get namespaces -l app=sapl -o name | sed 's|namespace/||' | \ + xargs -P 10 -I{} kubectl exec -n {} deploy/sapl -- \ + python manage.py waffle_switch REDIS_CACHE on --create + +kubectl get namespaces -l app=sapl -o name | sed 's|namespace/||' | \ + xargs -P 5 -I{} kubectl rollout restart deployment/sapl -n {} +``` + +**Seed the UA deny list once after Redis is deployed:** + +```bash +kubectl exec -n redis deploy/sapl-redis -- redis-cli -n 1 \ + SADD rl:bot:ua:blocked \ + "$(echo -n 'GPTBot' | sha256sum | cut -d' ' -f1)" \ + "$(echo -n 'ClaudeBot' | sha256sum | cut -d' ' -f1)" \ + "$(echo -n 'PerplexityBot' | sha256sum | cut -d' ' -f1)" \ + "$(echo -n 'Bytespider' | sha256sum | cut -d' ' -f1)" \ + "$(echo -n 'AhrefsBot' | sha256sum | cut -d' ' -f1)" \ + "$(echo -n 'meta-externalagent' | sha256sum | cut -d' ' -f1)" + +# Add new offenders at runtime without restart +kubectl exec -n redis deploy/sapl-redis -- redis-cli -n 1 \ + SADD rl:bot:ua:blocked "$(echo -n 'NewBot/1.0' | sha256sum | cut -d' ' -f1)" +``` + +**Production monitoring commands:** + +```bash +# Memory usage +kubectl exec -n redis 
deploy/sapl-redis -- redis-cli info memory \ + | grep -E 'used_memory_human|maxmemory_human|mem_fragmentation_ratio' + +# Connection pressure +kubectl exec -n redis deploy/sapl-redis -- redis-cli info stats \ + | grep -E 'rejected_connections|instantaneous_ops_per_sec' + +# Key distribution per DB +kubectl exec -n redis deploy/sapl-redis -- redis-cli info keyspace + +# Slow log +kubectl exec -n redis deploy/sapl-redis -- redis-cli slowlog get 25 +``` + +--- + +## 5. Phase 2 — Rate Limiting & Bot Mitigation + +**Goal**: Effective cross-pod throttling using shared Redis. +**Prerequisite**: Phase 1 (Redis deployed and `CACHE_BACKEND=redis`). + +### 5.1 Middleware Architecture + +```mermaid +flowchart TD + A([Request arrives at nginx]) --> B{SISMEMBER\nrl:bot:ua:blocked} + B -->|hit| Z1[429 — zero Django cost] + B -->|miss| C{GET\nrl:ip:blocked} + C -->|exists| Z2[429 — zero Django cost] + C -->|nil| D[proxy_pass to Gunicorn] + D --> E{authenticated?} + E -->|yes| F{INCR\nrl:{ns}:user:{id}:reqs\n>= 120/min?} + E -->|no| G{suspicious\nheaders?} + F -->|yes| Z3[SET user:blocked\n429] + F -->|no| H[call view] + G -->|yes| Z4[429] + G -->|no| I{INCR\nrl:ip:reqs\n>= 30/min?} + I -->|yes| Z5[SET ip:blocked\n429] + I -->|no| J{INCR\nrl:ns:ip:window\n>= 30/min?} + J -->|yes| Z6[SET ip:blocked\n429] + J -->|no| H + H --> K[Filesystem / ORM / Response] +``` + +### 5.2 RateLimitMiddleware Implementation + +```python +# sapl/middleware/ratelimit.py +import hashlib +import logging +import time + +from django.conf import settings +from django.core.cache import caches +from django.http import HttpResponse + +logger = logging.getLogger('sapl.ratelimit') + +BOT_UA_FRAGMENTS = [ + 'GPTBot', 'ClaudeBot', 'PerplexityBot', + 'Bytespider', 'AhrefsBot', 'meta-externalagent', + 'Chrome/98.0.4758', +] + + +def _sha256(s: str) -> str: + return hashlib.sha256(s.encode()).hexdigest() + + +def _is_suspicious_headers(request) -> bool: + # Real browsers send all three; bots frequently omit them + 
missing = sum([ + not request.META.get('HTTP_ACCEPT_LANGUAGE'), + not request.META.get('HTTP_ACCEPT'), + not request.META.get('HTTP_REFERER'), + ]) + return missing >= 2 + + +def _get_ip(request) -> str: + return ( + request.META.get('HTTP_X_FORWARDED_FOR', '').split(',')[0].strip() + or request.META.get('REMOTE_ADDR', '') + ) + + +class RateLimitMiddleware: + ANON_IP_THRESHOLD = 30 # req/min — tune from dry-run data + AUTH_USER_THRESHOLD = 120 # req/min + BLOCK_TTL = 300 # seconds + + def __init__(self, get_response): + self.get_response = get_response + self.dry_run = getattr(settings, 'RATELIMIT_DRY_RUN', True) + self._rl_cache = caches['ratelimit'] + + def __call__(self, request): + decision = self._evaluate(request) + if decision['action'] == 'block': + logger.warning('ratelimit_block', extra={ + 'ip': decision['ip'], + 'reason': decision['reason'], + 'ua': request.META.get('HTTP_USER_AGENT', ''), + 'path': request.path, + 'dry_run': self.dry_run, + 'namespace': getattr(request, 'tenant', 'unknown'), + }) + if not self.dry_run: + return HttpResponse(status=429) + return self.get_response(request) + + def _evaluate(self, request): + ip = _get_ip(request) + + # Check 1: known UA (all requests) + ua = request.META.get('HTTP_USER_AGENT', '') + for fragment in BOT_UA_FRAGMENTS: + if fragment.lower() in ua.lower(): + return {'action': 'block', 'reason': 'known_ua', 'ip': ip} + + # Check 2: IP blocked marker + if self._rl_cache.get(f'rl:ip:{ip}:blocked'): + if not getattr(request, 'user', None) or not request.user.is_authenticated: + return {'action': 'block', 'reason': 'ip_blocked', 'ip': ip} + + if getattr(request, 'user', None) and request.user.is_authenticated: + return self._evaluate_authenticated(request, ip) + return self._evaluate_anonymous(request, ip) + + def _evaluate_authenticated(self, request, ip): + user_id = str(request.user.pk).lower().strip() + ns = getattr(request, 'tenant', 'global') + + if self._rl_cache.get(f'rl:{ns}:user:{user_id}:blocked'): + 
return {'action': 'block', 'reason': 'user_blocked', 'ip': ip} + + if _is_suspicious_headers(request): + return {'action': 'block', 'reason': 'suspicious_headers_auth', 'ip': ip} + + count = self._incr_with_ttl(f'rl:{ns}:user:{user_id}:reqs', ttl=60) + if count >= self.AUTH_USER_THRESHOLD: + self._rl_cache.set(f'rl:{ns}:user:{user_id}:blocked', 1, + timeout=self.BLOCK_TTL) + return {'action': 'block', 'reason': 'auth_user_rate', 'ip': ip} + + return {'action': 'pass', 'ip': ip} + + def _evaluate_anonymous(self, request, ip): + # Check 3: suspicious headers + if _is_suspicious_headers(request): + return {'action': 'block', 'reason': 'suspicious_headers', 'ip': ip} + + # Check 4: IP request rate + count = self._incr_with_ttl(f'rl:ip:{ip}:reqs', ttl=60) + if count >= self.ANON_IP_THRESHOLD: + self._rl_cache.set(f'rl:ip:{ip}:blocked', 1, timeout=self.BLOCK_TTL) + return {'action': 'block', 'reason': 'ip_rate', 'ip': ip} + + # Check 5: per-ns/ip/window (catches UA rotators) + ns = getattr(request, 'tenant', 'global') + bucket = int(time.time() // 60) + count = self._incr_with_ttl(f'rl:ns:{ns}:ip:{ip}:w:{bucket}', ttl=120) + if count >= self.ANON_IP_THRESHOLD: + self._rl_cache.set(f'rl:ip:{ip}:blocked', 1, timeout=self.BLOCK_TTL) + return {'action': 'block', 'reason': 'ua_rotation', 'ip': ip} + + return {'action': 'pass', 'ip': ip} + + def _incr_with_ttl(self, key: str, ttl: int) -> int: + """Atomic INCR + EXPIRE — TTL only set on key creation.""" + lua = """ + local n = redis.call('INCR', KEYS[1]) + if n == 1 then redis.call('EXPIRE', KEYS[1], ARGV[1]) end + return n + """ + client = self._rl_cache._cache.get_client() + return client.eval(lua, 1, key, ttl) +``` + +--- + +### 5.3 Settings Reference + +```python +# sapl/settings.py +MIDDLEWARE = [ + 'sapl.middleware.ratelimit.RateLimitMiddleware', # before session/auth + 'django.contrib.sessions.middleware.SessionMiddleware', + # ... 
rest unchanged +] + +# Start in dry-run — flip to False check-by-check after validation +RATELIMIT_DRY_RUN = config('RATELIMIT_DRY_RUN', default=True, cast=bool) + +RATE_LIMITER_RATE = config('RATE_LIMITER_RATE', default='35/m') +RATE_LIMITER_RATE_AUTHENTICATED = config('RATE_LIMITER_RATE_AUTHENTICATED', default='120/m') +RATE_LIMITER_RATE_BOT = config('RATE_LIMITER_RATE_BOT', default='5/m') + +# Optional / future — see Open Question 2 +RATE_LIMIT_WHITELIST_IPS = config( + 'RATE_LIMIT_WHITELIST_IPS', + default='', + cast=lambda v: [x.strip() for x in v.split(',') if x.strip()] +) +``` + +--- + +### 5.4 Enforcement Graduation Order + +Enable `RATELIMIT_DRY_RUN=False` one check at a time, in order of false-positive risk: + +| Order | Check | Risk | Condition to enable | +|---|---|---|---| +| 1st | `known_ua` | Zero | UA strings are deterministic | +| 2nd | `ip_blocked` | Zero | Key only set by prior proven-bad requests | +| 3rd | `ip_rate` | Low | Threshold calibrated from dry-run data | +| 4th | `suspicious_headers` | Medium | Confirmed no legitimate clients omit all 3 headers | +| 5th | `ua_rotation` (ns/window) | Medium | NAT IP whitelist in place (see Open Question 2) | + +--- + +### 5.5 Decorator Migration + +For views where `django-ratelimit` decorators already exist: + +| Endpoint type | Action | Reason | +|---|---|---| +| List views (GET) | Remove after Phase 2 stable | Middleware covers equivalent threshold | +| Detail views (GET) | Remove after Phase 2 stable | Middleware covers equivalent threshold | +| Search / filter views | Remove last | Expensive queries — keep stricter per-view limit | +| PDF / file generation | **Keep permanently** | Most expensive; per-view limit tighter than global | +| Write endpoints (POST/PUT/DELETE) | **Keep permanently** | Different abuse surface | +| Auth endpoints (login, reset) | **Keep permanently** | Credential stuffing; must be independent | + +--- + +## 6. 
Phase 3 — File Serving Corrections + +**Goal**: Ensure nginx serves files correctly with kernel bypass and caching headers. +**Risk**: Low — config changes only. + +### 6.1 Confirmed Architecture + +nginx already serves `/media/` directly via `alias` — **Django is not involved in file serving for public media**. `X-Accel-Redirect` is only needed for LGPD-restricted documents that must pass through Django for access control. + +The corrected `nginx.conf` and `sapl.conf` are shown in Phase 0 §3.2. No additional changes needed here. + +### 6.2 Why Redis is NOT Needed for PDFs + +With the full mitigation stack active: +- **ASN blocking** (Phase 0) drops datacenter bot traffic at nginx +- **UA blocking** (Phase 0) drops known-UA bots at nginx +- **Shared Redis rate counters** (Phase 2) enforce limits across all pods +- **ETags** (Phase 0 §3.2) convert repeat requests to 304 with zero bytes transferred +- **`sendfile on`** (Phase 0 §3.2) means disk reads bypass userspace entirely + +Redis PDF caching would solve "high request volume reaching the file layer" — but that problem no longer exists once the above stack is active. Redis memory is better reserved for rate counters, page cache, and sessions. + +### 6.3 File Serving Decision Matrix + +| File type | Size | Strategy | +|---|---|---| +| Logos / images | Any | nginx `alias` + `sendfile` + ETag + `Cache-Control` | +| Small PDFs | ≤ 360 KB | nginx direct + ETag | +| Medium PDFs | 360 KB – 2 MB | nginx direct + ETag + rate limit | +| Large PDFs | > 2 MB | nginx + strict rate limit; never Redis | +| LGPD-restricted | Any | Django view → `X-Accel-Redirect` → nginx (access control enforced) | + +--- + +## 7. Phase 4 — Dynamic Page Caching + +**Goal**: Eliminate ORM queries for anonymous bot requests on list views. +**Prerequisite**: Phase 1 (shared Redis, `CACHE_BACKEND=redis`). + +### 7.1 The Key Insight + +Many SAPL list views (`pesquisar-materia`, `norma`, etc.) are not truly dynamic for anonymous users between edits. 
A bot hammering `?page=1` through `?page=100` triggers 100 ORM queries per pod. With Redis page cache, each unique URL is queried once per TTL across the entire fleet.
+
+```python
+# views.py — apply to anonymous list views only
+from django.views.decorators.cache import cache_page
+from django.utils.decorators import method_decorator
+
+@method_decorator(cache_page(60 * 5), name='dispatch') # 5-minute TTL
+class PesquisarMateriaView(FilterView):
+    ...
+```
+
+> **Critical safety check**: `cache_page` does **not** mark authenticated responses `Cache-Control: private` by itself — per-user isolation relies on Django adding `Vary: Cookie` whenever the session/user is accessed. Verify `Vary: Cookie` is present on these responses before deploying — accidentally caching a session-aware response without it is a data leak.
+
+### 7.2 Cache TTL Guidelines
+
+| View type | TTL | Reasoning |
+|---|---|---|
+| Matéria list (anonymous) | 300 s | Changes infrequently between sessions |
+| Norma list (anonymous) | 300 s | Same |
+| Parlamentar list | 3600 s | Changes rarely |
+| Search results | 60 s | Query-dependent, shorter TTL safer |
+| Authenticated views | Never | Do not decorate — `Vary: Cookie` only partitions the cache, it does not skip it |
+| PDF generation | Never | Too large — serve from disk via nginx |
+
+---
+
+## 8. Phase 5 — Async PDF & WebSocket (Follow-up)
+
+**Goal**: Eliminate synchronous PDF generation as a memory pressure source; add WebSocket support.
+**Prerequisite**: Phase 1 (Redis deployed). WebSocket work resumes **after** Redis is on k8s, bot siege is resolved, and OOM pressure is reduced.
+ +### 8.1 Async PDF via Celery + +Current synchronous flow — holds worker memory for entire PDF build: + +```mermaid +sequenceDiagram + participant B as Browser + participant G as Gunicorn worker + participant ORM as PostgreSQL + participant RL as ReportLab + + B->>G: GET /pdf/materia/12345 + G->>ORM: N+1 queries (get_etiqueta_protocolos) + ORM-->>G: data + G->>RL: build entire PDF in RAM + RL-->>G: PDF bytes (held in worker memory) + G-->>B: stream response + note over G: worker blocked for full duration +``` + +Target async flow — worker freed immediately: + +```mermaid +sequenceDiagram + participant B as Browser + participant G as Gunicorn worker + participant Q as Redis (Celery queue) + participant W as Celery worker + participant D as Disk + + B->>G: POST /pdf/materia/12345 + G->>Q: enqueue task + G-->>B: 202 Accepted + task_id + W->>W: build PDF (out of band) + W->>D: write PDF to disk + B->>G: GET /pdf/status/task_id + G-->>B: 302 → nginx /media/pdf/task_id.pdf +``` + +### 8.2 Celery Configuration + +> **Critical**: Celery broker **must** be a **separate** Redis instance (Redis B) with `noeviction` policy. The cache Redis (Redis A) uses `allkeys-lru` — tasks would silently disappear if evicted under memory pressure. 
+
+```yaml
+# docker/k8s/redis-celery-configmap.yaml
+data:
+  redis.conf: |
+    maxmemory-policy noeviction # never evict tasks
+    appendonly yes # AOF persistence ON
+    save 900 1 # RDB snapshot — must be unquoted; Redis parses "900 1" as one invalid argument (only the disable form save "" takes quotes)
+```
+
+```python
+# sapl/settings.py
+CELERY_BROKER_URL = config('CELERY_BROKER_URL', default='')
+CELERY_RESULT_BACKEND = config('CELERY_RESULT_BACKEND', default='')
+```
+
+### 8.3 Django Channels (WebSocket Voting Panel)
+
+Uses Redis DB2 on the same Redis A instance (cache + rate limiter pod):
+
+```python
+# sapl/settings.py
+CHANNEL_LAYERS = {
+    "default": {
+        "BACKEND": "channels_redis.core.RedisChannelLayer",
+        "CONFIG": {
+            # DB selection goes in the host URL — channels_redis has no
+            # top-level "db" option. DB2 reserved for channels.
+            "hosts": ["redis://sapl-redis.redis.svc.cluster.local:6379/2"],
+            "capacity": 1500,
+            "expiry": 10,
+        },
+    }
+}
+```
+
+---
+
+## 9. Open Questions
+
+| # | Question | Status | Blocks |
+|---|---|---|---|
+| 1 | Does Chrome/98.0.4758 impersonator appear consistently in nginx access logs? | Needs investigation | Phase 0 UA block safety |
+| 2 | Which legislative house IPs can be pre-whitelisted in `RATE_LIMIT_WHITELIST_IPS`? | We don't have this list yet — plan to obtain in the future. Setting is **optional / future**. | Phase 2 enforcement safety |
+| 3 | Dockerfile scope | Single image for all tenants (confirmed). All path-based Redis keys include `{ns}`. | — |
+| 4 | WebSocket voting panel priority | Separate project. Resumes after Redis is on k8s, bot siege addressed, and OOM pressure reduced. | Phase 5 sequencing |
+| 5 | `CONN_MAX_AGE` tuning | Currently **300 s** (`sapl/settings.py:272`). Evaluate whether to reduce given worker recycling at 400 MB. | Phase 0 tuning |
+| 6 | k8s Redis manifests | Development artifacts go under `$PROJECT_ROOT/docker/k8s/` (redis-pod.yaml, redis-service.yaml, redis-configmap.yaml).
| Phase 1 delivery | + +--- + +*Document consolidated from multi-session architecture review — Edward / Interlegis SAPL infrastructure.* diff --git a/sapl/relatorios/views.py b/sapl/relatorios/views.py index bc28b3ffc..beec4f3af 100755 --- a/sapl/relatorios/views.py +++ b/sapl/relatorios/views.py @@ -1141,8 +1141,29 @@ def relatorio_etiqueta_protocolo(request, nro, ano): def get_etiqueta_protocolos(prots): + prot_list = list(prots) + if not prot_list: + return [] + + # Pre-fetch MateriaLegislativa for all protocols in one query. + materia_query = Q() + for p in prot_list: + materia_query |= Q(numero_protocolo=p.numero, ano=p.ano) + materias_map = { + (m.numero_protocolo, m.ano): m + for m in MateriaLegislativa.objects.filter( + materia_query).select_related('tipo') + } + + # Pre-fetch DocumentoAdministrativo for all protocols in one query. + documentos_map = { + doc.protocolo_id: doc + for doc in DocumentoAdministrativo.objects.filter( + protocolo__in=prot_list).select_related('tipo') + } + protocolos = [] - for p in prots: + for p in prot_list: dic = {} dic['titulo'] = str(p.numero) + '/' + str(p.ano) @@ -1159,11 +1180,11 @@ def get_etiqueta_protocolos(prots): dic['nom_autor'] = str(p.autor or ' ') - dic['num_materia'] = '' - for materia in MateriaLegislativa.objects.filter( - numero_protocolo=p.numero, ano=p.ano): - dic['num_materia'] = materia.tipo.sigla + ' ' + \ - str(materia.numero) + '/' + str(materia.ano) + materia = materias_map.get((p.numero, p.ano)) + dic['num_materia'] = ( + materia.tipo.sigla + ' ' + str(materia.numero) + '/' + str(materia.ano) + if materia else '' + ) dic['natureza'] = '' if p.tipo_processo == 0: @@ -1171,11 +1192,11 @@ def get_etiqueta_protocolos(prots): if p.tipo_processo == 1: dic['natureza'] = 'Legislativo' - dic['num_documento'] = '' - for documento in DocumentoAdministrativo.objects.filter( - protocolo=p): - dic['num_documento'] = documento.tipo.sigla + ' ' + \ - str(documento.numero) + '/' + str(documento.ano) + documento = 
documentos_map.get(p.pk) + dic['num_documento'] = ( + documento.tipo.sigla + ' ' + str(documento.numero) + '/' + str(documento.ano) + if documento else '' + ) dic['ident_processo'] = dic['num_materia'] or dic['num_documento'] diff --git a/sapl/settings.py b/sapl/settings.py index 4be58ab0c..ee7669263 100644 --- a/sapl/settings.py +++ b/sapl/settings.py @@ -315,6 +315,10 @@ WAFFLE_ENABLE_ADMIN_PAGES = True MAX_DOC_UPLOAD_SIZE = 150 * 1024 * 1024 # 150MB MAX_IMAGE_UPLOAD_SIZE = 2 * 1024 * 1024 # 2MB DATA_UPLOAD_MAX_MEMORY_SIZE = 10 * 1024 * 1024 # 10MB +# Files above 2 MB are streamed to a temp file on disk rather than held in +# worker RAM. Critical for large upload support without memory blowup. +FILE_UPLOAD_MAX_MEMORY_SIZE = 2 * 1024 * 1024 # 2MB +FILE_UPLOAD_TEMP_DIR = '/var/interlegis/sapl/tmp' RATE_LIMITER_RATE = config('RATE_LIMITER_RATE', default='35/m') diff --git a/sapl/static/429.html b/sapl/static/429.html new file mode 100644 index 000000000..2f1bc8ead --- /dev/null +++ b/sapl/static/429.html @@ -0,0 +1,42 @@ + + + + + + 429 – Muitas Requisições + + + +
+
429
+

Muitas Requisições

+

Você realizou muitas requisições em um curto período. Aguarde um momento e tente novamente.

+

Se o problema persistir, entre em contato com o suporte da sua Câmara Municipal.

+
+ + diff --git a/sapl/static/500.html b/sapl/static/500.html new file mode 100644 index 000000000..6dd771897 --- /dev/null +++ b/sapl/static/500.html @@ -0,0 +1,42 @@ + + + + + + 500 – Erro Interno do Servidor + + + +
+
500
+

Erro Interno do Servidor

+

Ocorreu um erro inesperado. Nossa equipe foi notificada e trabalhará para resolver o problema.

+

Tente novamente em alguns instantes. Se o problema persistir, entre em contato com o suporte da sua Câmara Municipal.

+
+ + diff --git a/sapl/static/robots.txt b/sapl/static/robots.txt new file mode 100644 index 000000000..50c5a7328 --- /dev/null +++ b/sapl/static/robots.txt @@ -0,0 +1,19 @@ +User-agent: GPTBot +Disallow: / +Crawl-delay: 10 + +User-agent: ClaudeBot +Disallow: / +Crawl-delay: 10 + +User-agent: meta-externalagent +Disallow: / +Crawl-delay: 10 + +User-agent: OAI-SearchBot +Disallow: / +Crawl-delay: 10 + +User-agent: * +Disallow: /relatorios/ +Crawl-delay: 10