diff --git a/.gitignore b/.gitignore
index 84c9a25..09b30fb 100644
--- a/.gitignore
+++ b/.gitignore
@@ -61,6 +61,7 @@ credentials.json
 # AWS
 .aws/
 aws-credentials
+ip-ranges.json
 
 # Registry and data files
 block_registry.json
diff --git a/README.md b/README.md
index 4f6e763..ec63782 100644
--- a/README.md
+++ b/README.md
@@ -3,118 +3,112 @@
 [![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](https://opensource.org/licenses/MIT)
 [![Python 3.8+](https://img.shields.io/badge/python-3.8+-blue.svg)](https://www.python.org/downloads/)
 [![Code style: black](https://img.shields.io/badge/code%20style-black-000000.svg)](https://github.com/psf/black)
+[![Tests](https://img.shields.io/badge/tests-197%20passing-brightgreen.svg)]()
 
-Automated AWS Network ACL (NACL) management tool that analyzes Application Load Balancer (ALB) access logs, detects malicious traffic patterns, and implements tiered time-based IP blocking with persistent storage.
-
-## 🚀 Features
-
-- **Tiered Blocking System**: Automatically categorizes attackers into 5 tiers (Critical, High, Medium, Low, Minimal) based on attack volume
-- **Time-Based Persistence**: Blocks persist for hours to days depending on severity, with expiration tracking via JSON registry
-- **Priority-Based Slot Management**: Critical attackers won't be displaced by lower-priority threats when NACL slots are full
-- **Attack Pattern Detection**: Comprehensive regex patterns detect LFI, XSS, SQL injection, command injection, and more
-- **Smart API Caching**: Built-in IPInfo API caching reduces rate limit concerns
-- **Slack Integration**: Real-time notifications with detailed attack context and tier information
-- **AWS IP Exclusion**: Automatically excludes AWS service IPs from blocking
-- **Dry-Run Mode**: Test blocking logic without making actual changes
-- **Self-Healing**: Handles corrupted registry files, missing configurations, and API failures gracefully
-
-## 📋 Table of Contents
-
-- [Features](#-features)
-- [Prerequisites](#-prerequisites)
-- [Installation](#-installation)
-- [Quick Start](#-quick-start)
-- [Configuration](#-configuration)
-- [Usage](#-usage)
-- [Tier System](#-tier-system)
-- [Architecture](#-architecture)
-- [Monitoring](#-monitoring)
-- [Troubleshooting](#-troubleshooting)
-- [Contributing](#-contributing)
-- [License](#-license)
-- [Security](#-security)
-
-## 📦 Prerequisites
+Automated AWS security tool that analyzes Application Load Balancer (ALB) access logs, detects malicious traffic patterns using multi-signal analysis, and implements tiered time-based IP blocking via Network ACLs (NACLs) and AWS WAF IP Sets.
+
+## What's New in v2.0
+
+- **Cloud-Native Storage**: DynamoDB and S3 backends for distributed deployments
+- **IPv6 Support**: Full dual-stack blocking with separate rule ranges
+- **AWS WAF Integration**: Parallel blocking via WAF IP Sets for edge protection
+- **Multi-Signal Detection**: Reduces false positives by correlating multiple threat indicators
+- **O(log N) AWS IP Lookup**: Fast binary search for AWS IP exclusion with auto-download of ip-ranges.json
+- **Athena Integration**: SQL-based analysis for large-scale log processing
+- **Enhanced Slack Notifications**: Color-coded severity, threading, Block Kit formatting
+- **CloudWatch Metrics**: Built-in observability with custom namespace support
+- **Structured JSON Logging**: CloudWatch Logs compatible output
+
+## Features
+
+### Core Capabilities
+
+- **Tiered Blocking System**: 5-tier classification (Critical→Minimal) with proportional block durations
+- **Multi-Signal Threat Detection**: Correlates attack patterns, scanner signatures, error rates, and path diversity
+- **IPv4 + IPv6 Support**: Dual-stack blocking with independent rule management
+- **Priority-Based Slot Management**: Critical attackers won't be displaced by lower-priority threats
+
+### Attack Detection
+
+- **30+ Attack Patterns**: LFI, XSS, SQL injection, command injection, path traversal, etc.
+- **Scanner Detection**: Known scanner user-agent identification (Nikto, sqlmap, etc.)
+- **Behavioral Analysis**: Error rate and path diversity scoring
+
+### Integration Options
+
+- **AWS WAF IP Sets**: Parallel blocking at edge (CloudFront, ALB, API Gateway)
+- **Slack Notifications**: Real-time alerts with severity-based color coding
+- **CloudWatch Metrics**: Operational metrics for dashboards and alarms
+- **Athena Queries**: SQL-based analysis for historical data
+
+### Operational Features
+
+- **Cloud-Native Storage**: DynamoDB, S3, or local file persistence
+- **Incremental Processing**: Skip already-analyzed log files
+- **Circuit Breakers**: Graceful degradation on external service failures
+- **Dry-Run Mode**: Test blocking logic without making changes
+
+## Table of Contents
+
+- [Prerequisites](#prerequisites)
+- [Installation](#installation)
+- [Quick Start](#quick-start)
+- [Configuration](#configuration)
+- [Tier System](#tier-system)
+- [Storage Backends](#storage-backends)
+- [AWS WAF Integration](#aws-waf-integration)
+- [Multi-Signal Detection](#multi-signal-detection)
+- [Athena Integration](#athena-integration)
+- [Observability](#observability)
+- [Architecture](#architecture)
+- [Troubleshooting](#troubleshooting)
+- [Contributing](#contributing)
+- [License](#license)
+
+## Prerequisites
 
 ### Required
 
 - **Python**: 3.8 or higher
-- **AWS Account**: With ALB access logs enabled
-- **IAM Permissions**: See [IAM Policy](#iam-permissions) below
-- **ALB Logging**: Must be enabled and configured to S3
+- **AWS Account**: With ALB access logs enabled to S3
+- **IAM Permissions**: See [IAM Policy](#iam-permissions)
 
 ### Optional
 
-- **Slack Bot Token**: For notifications (recommended)
-- **IPInfo API Token**: For IP geolocation (optional)
-
-## 🔧 Installation
+- **Slack Bot Token**: For notifications
+- **IPInfo API Token**: For IP geolocation
+- **DynamoDB/S3**: For cloud-native state storage
+- **Athena**: For large-scale log analysis
 
-### Option 1: Using uv (Recommended)
+## Installation
 
-[uv](https://github.com/astral-sh/uv) is a fast Python package installer and resolver.
+### Using uv (Recommended)
 
 ```bash
-# Install uv (if not already installed)
 curl -LsSf https://astral.sh/uv/install.sh | sh
-
-# Clone the repository
 git clone https://github.com/davidlu1001/aws-auto-block-attackers.git
 cd aws-auto-block-attackers
-
-# Install dependencies with uv
 uv sync
-
-# Copy example configuration files
-cp examples/whitelist.example.txt whitelist.txt
-cp examples/.env.example .env
-
-# Edit configuration files with your settings
-vim .env
-vim whitelist.txt
 ```
 
-### Option 2: Using pip
+### Using pip
 
 ```bash
-# Clone the repository
 git clone https://github.com/davidlu1001/aws-auto-block-attackers.git
 cd aws-auto-block-attackers
-
-# Create virtual environment
 python3 -m venv venv
-source venv/bin/activate  # On Windows: venv\Scripts\activate
-
-# Install dependencies
+source venv/bin/activate
 pip install -e .
-
-# Copy example configuration
-cp examples/whitelist.example.txt whitelist.txt
-cp examples/.env.example .env
 ```
 
-### Option 3: Using Docker
+### Using Docker
 
 ```bash
 docker pull davidlu1001/aws-auto-block-attackers:latest
-docker run -v $(pwd)/config.yaml:/app/config.yaml aws-auto-block-attackers
+docker run -v $(pwd)/config:/app/config aws-auto-block-attackers --live-run
 ```
 
-### Option 4: Manual Installation
-
-```bash
-# Install dependencies
-pip install boto3 ipinfo slack-sdk requests
-
-# Download the scripts
-wget https://raw.githubusercontent.com/davidlu1001/aws-auto-block-attackers/main/auto_block_attackers.py
-wget https://raw.githubusercontent.com/davidlu1001/aws-auto-block-attackers/main/slack_client.py
-
-# Make them executable
-chmod +x auto_block_attackers.py
-```
-
-## 🚀 Quick Start
+## Quick Start
 
 ### 1. Configure AWS Credentials
 
@@ -123,374 +117,347 @@ chmod +x auto_block_attackers.py
 aws configure
 
 # Option B: Environment variables
-export AWS_ACCESS_KEY_ID="your-access-key"
-export AWS_SECRET_ACCESS_KEY="your-secret-key"
-export AWS_DEFAULT_REGION="ap-southeast-2"
-
-# Option C: IAM Role (recommended for EC2)
-# Attach IAM role to EC2 instance
-```
-
-### 2. Enable ALB Access Logs
+export AWS_ACCESS_KEY_ID="your-key"
+export AWS_SECRET_ACCESS_KEY="your-secret"
+export AWS_DEFAULT_REGION="us-east-1"
 
-```bash
-# Via AWS CLI
-aws elbv2 modify-load-balancer-attributes \
-  --load-balancer-arn arn:aws:elasticloadbalancing:region:account-id:loadbalancer/app/my-alb/... \
-  --attributes Key=access_logs.s3.enabled,Value=true Key=access_logs.s3.bucket,Value=my-bucket
+# Option C: IAM Role (recommended for EC2/ECS)
 ```
 
-### 3. Run Your First Scan (Dry-Run)
+### 2. Run Dry-Run Scan
 
 ```bash
-# Using uv (recommended)
-uv run python3 auto_block_attackers.py \
+python3 auto_block_attackers.py \
   --lb-name-pattern "alb-*" \
-  --region ap-southeast-2 \
   --lookback 1h \
   --threshold 50 \
   --debug
+```
+
+### 3. Run Live Blocking
 
-# Or directly with python (if using pip install)
+```bash
 python3 auto_block_attackers.py \
-  --lb-name-pattern "alb-*" \
-  --region ap-southeast-2 \
+  --lb-name-pattern "prod-*" \
   --lookback 1h \
   --threshold 50 \
-  --debug
+  --live-run
 ```
 
-### 4. Deploy to Production
+### 4. Production Deployment (Cron)
 
 ```bash
-# Add to crontab for automated execution every 15 minutes
-crontab -e
-
-# Using uv (recommended):
-*/15 * * * * cd /opt/aws-auto-block-attackers && /usr/local/bin/uv run python3 auto_block_attackers.py \
-  --lb-name-pattern "alb-prod-*" \
+# Run every 15 minutes
+*/15 * * * * cd /opt/auto-block && python3 auto_block_attackers.py \
+  --lb-name-pattern "prod-*" \
   --threshold 75 \
   --lookback 90m \
-  --live-run \
-  >> /var/log/auto-block-attackers.log 2>&1
-
-# Or using systemd timer (see examples/systemd-timer-example.timer)
+  --storage-backend dynamodb \
+  --dynamodb-table block-registry \
+  --enable-cloudwatch-metrics \
+  --enhanced-slack \
+  --live-run >> /var/log/auto-block.log 2>&1
 ```
 
-## ⚙️ Configuration
+## Configuration
 
-### Environment Variables
+### Command-Line Arguments
 
-```bash
-# Slack (optional but recommended)
-export SLACK_BOT_TOKEN="xoxb-your-token"
-export SLACK_CHANNEL="C04ABCDEFG"
+| Argument | Default | Description |
+|----------|---------|-------------|
+| `--lb-name-pattern` | `alb-*` | Pattern to match load balancer names |
+| `--region` | `ap-southeast-2` | AWS region |
+| `--lookback` | `60m` | Lookback period (30m, 2h, 1d) |
+| `--threshold` | `50` | Minimum hits to trigger block |
+| `--start-rule` | `80` | Starting NACL rule number (IPv4) |
+| `--limit` | `20` | Maximum DENY rules (IPv4) |
+| `--start-rule-ipv6` | `180` | Starting NACL rule number (IPv6) |
+| `--limit-ipv6` | `20` | Maximum DENY rules (IPv6) |
+| `--live-run` | `False` | Actually make changes |
+| `--debug` | `False` | Verbose logging |
+
+### Storage Options
+
+| Argument | Default | Description |
+|----------|---------|-------------|
+| `--storage-backend` | `local` | Storage type: local, dynamodb, s3 |
+| `--dynamodb-table` | - | DynamoDB table name |
+| `--create-dynamodb-table` | `False` | Auto-create DynamoDB table |
+| `--s3-state-bucket` | - | S3 bucket for state |
+| `--s3-state-key` | - | S3 key for state |
+
+### WAF Options
+
+| Argument | Default | Description |
+|----------|---------|-------------|
+| `--waf-ip-set-name` | - | WAF IP Set name |
+| `--waf-ip-set-scope` | `REGIONAL` | REGIONAL or CLOUDFRONT |
+| `--create-waf-ip-set` | `False` | Auto-create IP Set |
+
+### Observability Options
+
+| Argument | Default | Description |
+|----------|---------|-------------|
+| `--json-logging` | `False` | JSON log format |
+| `--enable-cloudwatch-metrics` | `False` | Publish metrics |
+| `--cloudwatch-namespace` | `AutoBlockAttackers` | Metrics namespace |
+| `--enhanced-slack` | `False` | Rich Slack notifications |
+
+### Multi-Signal Options
+
+| Argument | Default | Description |
+|----------|---------|-------------|
+| `--disable-multi-signal` | `False` | Disable multi-signal detection |
+| `--min-threat-score` | `40` | Minimum score (0-100) |
+
+### Athena Options
+
+| Argument | Default | Description |
+|----------|---------|-------------|
+| `--athena` | `False` | Enable Athena queries |
+| `--athena-database` | `alb_logs` | Athena database name |
+| `--athena-output-location` | - | S3 path for results |
 
-# IPInfo (optional)
-export IPINFO_TOKEN="your-ipinfo-token"
+### Environment Variables
 
-# AWS (if not using IAM role)
-export AWS_ACCESS_KEY_ID="your-key"
-export AWS_SECRET_ACCESS_KEY="your-secret"
-export AWS_DEFAULT_REGION="ap-southeast-2"
+```bash
+SLACK_BOT_TOKEN="xoxb-your-token"
+SLACK_CHANNEL="C04ABCDEFG"
+IPINFO_TOKEN="your-ipinfo-token"
+STORAGE_BACKEND="dynamodb"
+DYNAMODB_TABLE="block-registry"
 ```
 
-### Command-Line Arguments
-
-| Argument               | Default               | Description                                     |
-| ---------------------- | --------------------- | ----------------------------------------------- |
-| `--lb-name-pattern`    | `alb-*`               | Pattern to match load balancer names            |
-| `--region`             | `ap-southeast-2`      | AWS region                                      |
-| `--lookback`           | `60m`                 | Lookback period (format: 30m, 2h, 1d)           |
-| `--threshold`          | `50`                  | Minimum malicious requests to trigger block     |
-| `--start-rule`         | `80`                  | Starting NACL rule number                       |
-| `--limit`              | `20`                  | Maximum number of DENY rules to manage          |
-| `--whitelist-file`     | `whitelist.txt`       | Path to whitelist file                          |
-| `--aws-ip-ranges-file` | `ip-ranges.json`      | Path to AWS IP ranges JSON                      |
-| `--registry-file`      | `block_registry.json` | Path to block registry                          |
-| `--live-run`           | `False`               | Actually create NACL rules (default is dry-run) |
-| `--debug`              | `False`               | Enable verbose debug logging                    |
-
-### Whitelist File Format
-
-```text
-# Comments start with #
-203.0.113.1
-203.0.113.2
-# Corporate office
-198.51.100.0/24
-```
+See [docs/CLI_GUIDE.md](docs/CLI_GUIDE.md) for complete reference.
 
-## 🎯 Tier System
+## Tier System
 
-The script automatically categorizes attackers into tiers based on request volume:
+Attackers are classified into tiers based on malicious request volume:
 
-| Tier         | Hit Count | Block Duration | Priority | Description               |
-| ------------ | --------- | -------------- | -------- | ------------------------- |
-| **Critical** | 2000+     | 7 days         | 4        | Major coordinated attacks |
-| **High**     | 1000-1999 | 3 days         | 3        | Severe automated scanning |
-| **Medium**   | 500-999   | 48 hours       | 2        | Moderate attack attempts  |
-| **Low**      | 100-499   | 24 hours       | 1        | Light scanning activity   |
-| **Minimal**  | <100      | 1 hour         | 0        | Minor probes              |
+| Tier | Hit Count | Block Duration | Priority |
+|------|-----------|----------------|----------|
+| **Critical** | 2000+ | 7 days | 4 |
+| **High** | 1000-1999 | 3 days | 3 |
+| **Medium** | 500-999 | 48 hours | 2 |
+| **Low** | 100-499 | 24 hours | 1 |
+| **Minimal** | <100 | 1 hour | 0 |
 
-### Example Scenarios
+### Tier Upgrade
 
-#### Scenario 1: High-Volume Attacker
-```
-IP: 1.2.3.4 sends 1,568 malicious requests
-→ Classified as "High" tier
-→ Blocked for 3 days
-→ Entry saved to registry with expiration
-→ Slack notification: "Blocked 1.2.3.4 (1568 hits, tier: HIGH, blocked for 3d)"
-```
+When an IP reoffends, its tier is upgraded and block duration extended:
 
-#### Scenario 2: Tier Upgrade
 ```
 T+0:  IP sends 150 requests → Blocked as "Low" (24 hours)
-T+2h: Same IP returns with 600 more → Upgraded to "Medium" (48 hours)
-      → Block duration extended from T+2h
+T+2h: Same IP returns with 600 more → Upgraded to "Medium" (48 hours from T+2h)
 ```
 
-#### Scenario 3: Priority Protection
-```
-NACL Full: 20 IPs blocked (5 High, 10 Medium, 5 Low)
-New Critical attacker (2500 hits) arrives
-→ Replaces lowest priority IP (one of the "Low" tier)
-→ High/Medium tier IPs remain protected
-```
-
-## 🏗️ Architecture
+## Storage Backends
 
-### System Flow
+### Local File (Default)
 
-```
-┌─────────────────────────────────────────────────────────────┐
-│ 1. Scan ALB Logs (S3)                                        │
-│    └─> Date-based filtering (fast!)                          │
-└─────────────────────────────────────────────────────────────┘
-                           ↓
-┌─────────────────────────────────────────────────────────────┐
-│ 2. Detect Malicious Patterns                                 │
-│    └─> Regex: LFI, XSS, SQLi, Command Injection, etc.       │
-└─────────────────────────────────────────────────────────────┘
-                           ↓
-┌─────────────────────────────────────────────────────────────┐
-│ 3. Apply Filters                                             │
-│    ├─> Whitelist check                                       │
-│    ├─> AWS IP exclusion                                      │
-│    └─> Threshold validation                                  │
-└─────────────────────────────────────────────────────────────┘
-                           ↓
-┌─────────────────────────────────────────────────────────────┐
-│ 4. Tier Classification                                       │
-│    └─> Determine block duration based on hit count          │
-└─────────────────────────────────────────────────────────────┘
-                           ↓
-┌─────────────────────────────────────────────────────────────┐
-│ 5. Registry Management                                       │
-│    ├─> Load existing blocks                                  │
-│    ├─> Check expirations                                     │
-│    ├─> Update/merge new blocks                               │
-│    └─> Save to JSON                                          │
-└─────────────────────────────────────────────────────────────┘
-                           ↓
-┌─────────────────────────────────────────────────────────────┐
-│ 6. NACL Updates                                              │
-│    ├─> Remove expired blocks                                 │
-│    ├─> Add new blocks (priority-based)                       │
-│    └─> Handle slot exhaustion                                │
-└─────────────────────────────────────────────────────────────┘
-                           ↓
-┌─────────────────────────────────────────────────────────────┐
-│ 7. Notifications                                             │
-│    └─> Slack summary with tier breakdown                    │
-└─────────────────────────────────────────────────────────────┘
+```bash
+--storage-backend local
+--registry-file ./block_registry.json
 ```
 
-### File Structure
+### DynamoDB
 
-```
-aws-auto-block-attackers/
-├── .github/
-│   └── workflows/
-│       └── ci.yml                      # CI/CD pipeline with uv
-├── examples/
-│   ├── .env.example                    # Environment variables template
-│   ├── config.example.yaml             # Full configuration reference
-│   ├── cron-example.txt                # Cron job examples
-│   ├── systemd-example.service         # Systemd service file
-│   ├── systemd-timer-example.timer     # Systemd timer
-│   └── whitelist.example.txt           # IP whitelist template
-├── scripts/
-│   ├── README.md                       # Scripts documentation
-│   └── update_aws_ip_ranges.sh         # AWS IP ranges updater
-├── tests/
-│   ├── test_auto_block_attackers.py    # Main script tests
-│   ├── test_integration.py             # Integration tests
-│   ├── test_ipinfo_integration.py      # IPInfo tests
-│   ├── test_notification_logic.py      # Notification tests
-│   ├── test_slack_client.py            # Slack client tests
-│   ├── test_tiered_blocking.py         # Tiered blocking tests
-│   └── test_timestamp_fix.py           # Timestamp tests
-├── .gitignore                          # Git ignore patterns
-├── auto_block_attackers.py             # Main script
-├── CONTRIBUTING.md                     # Contribution guidelines
-├── LICENSE                             # MIT License
-├── pyproject.toml                      # Project configuration (uv)
-├── README.md                           # This file
-├── SECURITY.md                         # Security policy
-├── slack_client.py                     # Slack integration module
-└── uv.lock                             # Dependency lock file
+```bash
+--storage-backend dynamodb
+--dynamodb-table my-block-registry
+--create-dynamodb-table
 ```
 
-## 📊 Monitoring
+**Benefits**: Multi-AZ, concurrent access, automatic scaling
 
-### Log Files
+### S3
 
 ```bash
-# View real-time logs
-tail -f /var/log/auto-block-attackers.log
-
-# Check for errors
-grep -i error /var/log/auto-block-attackers.log
-
-# View blocked IPs
-grep "ACTIVE BLOCK" /var/log/auto-block-attackers.log
+--storage-backend s3
+--s3-state-bucket my-bucket
+--s3-state-key security/registry.json
 ```
 
-### Registry File
+**Benefits**: 11 9's durability, versioning, cross-region replication
 
-```bash
-# View current blocks
-cat ./block_registry.json | jq '.'
+## AWS WAF Integration
 
-# Check when an IP will be unblocked
-cat block_registry.json | jq '.["1.2.3.4"]'
+Block attackers at the edge in addition to VPC-level NACL blocking:
 
-# Count active blocks by tier
-cat block_registry.json | jq '[.[] | .tier] | group_by(.) | map({tier: .[0], count: length})'
+```bash
+python3 auto_block_attackers.py \
+  --lb-name-pattern "prod-*" \
+  --waf-ip-set-name "blocked-attackers" \
+  --waf-ip-set-scope REGIONAL \
+  --create-waf-ip-set \
+  --live-run
 ```
 
-### CloudWatch Metrics (Optional)
+**Use Cases**:
+- Block at CloudFront edge before requests reach origin
+- Consistent blocking across multiple ALBs
+- Complement NACL blocking for defense in depth
 
-```bash
-# Send custom metrics
-aws cloudwatch put-metric-data \
-  --namespace "Security/AutoBlock" \
-  --metric-name "IPsBlocked" \
-  --value 5 \
-  --dimensions Tier=High
-```
+## Multi-Signal Detection
 
-## 🔍 Troubleshooting
+Reduces false positives by correlating multiple threat indicators:
 
-### Common Issues
+| Signal | Weight | Description |
+|--------|--------|-------------|
+| Attack Patterns | 50% | ATTACK_PATTERNS regex matches |
+| Scanner UA | 20% | Known scanner user-agents |
+| Error Rate | 15% | 4xx/5xx response percentage |
+| Path Diversity | 15% | Unique paths (scanner behavior) |
 
-#### 1. No IPs Being Blocked
+**Threat Score Calculation**:
 
-**Symptoms**: Script runs but no blocks created
+```
+Score = (0.5 × attack_rate) + (0.2 × scanner_rate) +
+        (0.15 × error_rate) + (0.15 × diversity_score)
+```
 
-**Possible Causes**:
-- Threshold too high
-- All IPs whitelisted
-- ALB logs not recent
-- Attack patterns not matched
+IPs with score < `--min-threat-score` are considered false positives.
 
-**Solutions**:
-```bash
-# Lower threshold temporarily
---threshold 10
+## Athena Integration
 
-# Check what's being detected
---debug
+For large-scale log analysis (>1000 files), use Athena:
 
-# Verify ALB logs exist
-aws s3 ls s3://your-bucket/your-prefix/ --recursive | tail -20
+```bash
+python3 auto_block_attackers.py \
+  --lb-name-pattern "prod-*" \
+  --athena \
+  --athena-database "security_logs" \
+  --athena-output-location "s3://my-bucket/athena-results/" \
+  --lookback 24h \
+  --live-run
 ```
 
-#### 2. Registry File Growing Large
+**Benefits**:
+- SQL-based filtering at scale
+- Historical analysis across days/weeks
+- Cost-effective for large datasets
+
+## Observability
 
-**Symptoms**: block_registry.json is several MB
+### Structured Logging
 
-**Solution**: Script auto-cleans entries >30 days old. If still large:
 ```bash
-# Backup and reset
-cp block_registry.json block_registry.json.bak
-echo "{}" > block_registry.json
+python3 auto_block_attackers.py --json-logging 2>&1 | tee logs.json
 ```
 
-#### 3. IPInfo Rate Limit
-
-**Symptoms**: Warnings about IPInfo API failures
-
-**Solution**: Script has built-in caching. For high volume:
-- Upgrade IPInfo plan
-- Disable IPInfo: Don't set `IPINFO_TOKEN`
+Output:
+```json
+{"timestamp": "2026-01-09T10:30:00Z", "level": "INFO", "message": "Blocked 5 IPs"}
+```
 
-#### 4. NACL Slots Full
+### CloudWatch Metrics
 
-**Symptoms**: "Cannot add IP: all existing rules have higher priority"
+```bash
+--enable-cloudwatch-metrics
+--cloudwatch-namespace "Security/AutoBlock"
+```
 
-**Solutions**:
-- Increase `--limit` (max 20 with default start-rule 80)
-- Manually remove low-priority blocks
-- Adjust tier thresholds
+**Metrics Published**:
+- `LogFilesProcessed`
+- `MaliciousIPsDetected`
+- `IPsBlocked`
+- `IPsUnblocked`
+- `ProcessingTimeMs`
+- `AverageThreatScore`
 
-### Debug Mode
+### Enhanced Slack Notifications
 
 ```bash
-# Enable detailed logging
-uv run python3 auto_block_attackers.py --debug
-
-# Check what patterns are matching
-uv run python3 auto_block_attackers.py --debug 2>&1 | grep "malicious"
+--enhanced-slack
 ```
 
-## 🤝 Contributing
+Features:
+- Severity-based color coding (green→red)
+- Incident threading
+- Tier breakdown fields
+- Top offenders by tier
 
-We welcome contributions! Please see [CONTRIBUTING.md](CONTRIBUTING.md) for details.
+## Architecture
 
-### Quick Contribution Guide
+```
+┌─────────────────────────────────────────────────────────────────┐
+│                    AWS Auto Block Attackers                      │
+├─────────────────────────────────────────────────────────────────┤
+│                                                                  │
+│  ┌──────────────┐                        ┌──────────────┐       │
+│  │   S3 Logs    │───────┬───────────────▶│  CloudWatch  │       │
+│  └──────────────┘       │                │   Metrics    │       │
+│                         ▼                └──────────────┘       │
+│  ┌──────────────┐  ┌──────────────┐                             │
+│  │    Athena    │──│    Threat    │                             │
+│  │   (Optional) │  │   Detection  │                             │
+│  └──────────────┘  └──────┬───────┘                             │
+│                          │                                       │
+│                          ▼                                       │
+│                   ┌──────────────┐                               │
+│                   │    Tier      │                               │
+│                   │Classification│                               │
+│                   └──────┬───────┘                               │
+│                          │                                       │
+│          ┌───────────────┼───────────────┐                      │
+│          ▼               ▼               ▼                      │
+│   ┌─────────────┐ ┌─────────────┐ ┌─────────────┐              │
+│   │    NACL     │ │   WAF IP    │ │   Storage   │              │
+│   │   Manager   │ │    Sets     │ │   Backend   │              │
+│   └──────┬──────┘ └──────┬──────┘ └──────┬──────┘              │
+│          │               │               │                      │
+└──────────┼───────────────┼───────────────┼──────────────────────┘
+           │               │               │
+           ▼               ▼               ▼
+    ┌─────────────┐ ┌─────────────┐ ┌─────────────┐
+    │  EC2 NACLs  │ │  AWS WAF    │ │ DynamoDB/S3 │
+    │  (IPv4/v6)  │ │  IP Sets    │ │   /Local    │
+    └─────────────┘ └─────────────┘ └─────────────┘
+```
 
-1. Fork the repository
-2. Create a feature branch (`git checkout -b feature/amazing-feature`)
-3. Commit your changes (`git commit -m 'Add amazing feature'`)
-4. Push to the branch (`git push origin feature/amazing-feature`)
-5. Open a Pull Request
+See [docs/TECHNICAL_DESIGN.md](docs/TECHNICAL_DESIGN.md) for detailed architecture.
 
-### Development Setup
+## Troubleshooting
 
-```bash
-# Clone your fork
-git clone https://github.com/your-username/aws-auto-block-attackers.git
-cd aws-auto-block-attackers
+### No IPs Being Blocked
 
-# Install uv if not already installed
-curl -LsSf https://astral.sh/uv/install.sh | sh
+```bash
+# Lower threshold and enable debug
+python3 auto_block_attackers.py --threshold 10 --debug
 
-# Install all dependencies including dev extras
-uv sync --all-extras
+# Verify logs exist
+aws s3 ls s3://your-bucket/your-prefix/ --recursive | tail -20
+```
 
-# Run tests
-uv run pytest tests/ -v
+### Multi-Signal Filtering Too Aggressive
 
-# Run linting
-uv run black auto_block_attackers.py slack_client.py
-uv run pylint auto_block_attackers.py slack_client.py
+```bash
+# Lower the minimum threat score
+--min-threat-score 30
 
-# Run type checking
-uv run mypy auto_block_attackers.py slack_client.py
+# Or disable multi-signal entirely
+--disable-multi-signal
 ```
 
-## 📄 License
+### NACL Slots Full
 
-This project is licensed under the MIT License - see the [LICENSE](LICENSE) file for details.
+```bash
+# Increase limit (ensure rule range is available)
+--start-rule 70 --limit 30
+```
 
-## 🔒 Security
+### DynamoDB Throttling
+
+```bash
+# Use on-demand capacity mode
+aws dynamodb update-table \
+  --table-name my-block-registry \
+  --billing-mode PAY_PER_REQUEST
+```
 
-### IAM Permissions
+## IAM Permissions
 
-Minimum required IAM policy:
+Minimum required policy:
 
 ```json
 {
@@ -514,38 +481,41 @@ Minimum required IAM policy:
 }
 ```
 
-### Security Best Practices
+See [docs/TECHNICAL_DESIGN.md](docs/TECHNICAL_DESIGN.md#10-security-considerations) for full IAM policies including optional features.
 
-- ✅ Use IAM roles instead of access keys when possible
-- ✅ Enable CloudTrail logging for audit trails
-- ✅ Regularly review blocked IPs and patterns
-- ✅ Keep whitelist updated with legitimate IPs
-- ✅ Use separate AWS accounts for dev/prod
-- ✅ Rotate Slack tokens regularly
-- ✅ Monitor script execution logs
+## Documentation
 
-### Reporting Security Issues
+- [CLI Reference Guide](docs/CLI_GUIDE.md) - Complete command-line reference
+- [Technical Design](docs/TECHNICAL_DESIGN.md) - Architecture and implementation details
+- [Contributing Guide](CONTRIBUTING.md) - How to contribute
+- [Security Policy](SECURITY.md) - Security practices and reporting
 
-Please report security vulnerabilities to: security@yourorg.com
+## Contributing
 
-**Do not** open public issues for security vulnerabilities.
+```bash
+# Clone and setup
+git clone https://github.com/davidlu1001/aws-auto-block-attackers.git
+cd aws-auto-block-attackers
+uv sync --all-extras
+
+# Run tests
+uv run pytest tests/ -v
 
-## 📚 Additional Resources
+# Run linting
+uv run black auto_block_attackers.py slack_client.py
+```
 
-- [AWS Network ACL Documentation](https://docs.aws.amazon.com/vpc/latest/userguide/vpc-network-acls.html)
-- [ALB Access Logs](https://docs.aws.amazon.com/elasticloadbalancing/latest/application/load-balancer-access-logs.html)
-- [IPInfo API Documentation](https://ipinfo.io/developers)
+See [CONTRIBUTING.md](CONTRIBUTING.md) for details.
 
-## 💬 Support
+## License
 
-- **Issues**: [GitHub Issues](https://github.com/davidlu1001/aws-auto-block-attackers/issues)
-- **Discussions**: [GitHub Discussions](https://github.com/davidlu1001/aws-auto-block-attackers/discussions)
-- **Email**: support@yourorg.com
+MIT License - see [LICENSE](LICENSE) for details.
 
-## 🌟 Star History
+## Support
 
-[![Star History Chart](https://api.star-history.com/svg?repos=davidlu1001/aws-auto-block-attackers&type=Date)](https://star-history.com/#davidlu1001/aws-auto-block-attackers&Date)
+- **Issues**: [GitHub Issues](https://github.com/davidlu1001/aws-auto-block-attackers/issues)
+- **Discussions**: [GitHub Discussions](https://github.com/davidlu1001/aws-auto-block-attackers/discussions)
 
 ---
 
-**Made with ❤️ for the security community**
+**Made with security in mind**
diff --git a/auto_block_attackers.py b/auto_block_attackers.py
index 5e97d9e..144aaef 100644
--- a/auto_block_attackers.py
+++ b/auto_block_attackers.py
@@ -112,7 +112,7 @@
     See README.md for detailed documentation and examples
 """
 
-__version__ = "1.0.0"
+__version__ = "2.0.0"
 __author__ = "AWS Auto Block Attackers Contributors"
 __license__ = "MIT"
 
@@ -126,21 +126,48 @@
 import argparse
 from datetime import datetime, timedelta, timezone
 from botocore.config import Config
+from botocore.exceptions import ClientError
 from concurrent.futures import ThreadPoolExecutor, as_completed
 import ipaddress
 import fnmatch
-from typing import Set, List, Dict, Tuple, Optional
+from typing import Set, List, Dict, Tuple, Optional, Any
+from collections import defaultdict
+from dataclasses import dataclass, field
+from urllib.parse import urlparse
+import bisect
 import os
 import sys
 import ipinfo
+import requests
 
 # Import SlackClient from the same directory
 try:
-    from slack_client import SlackClient
+    from slack_client import SlackClient, SlackSeverity, TIER_TO_SEVERITY
 except ImportError:
     # If running from a different directory
     sys.path.insert(0, os.path.dirname(os.path.abspath(__file__)))
-    from slack_client import SlackClient
+    from slack_client import SlackClient, SlackSeverity, TIER_TO_SEVERITY
+
+# Import storage backends
+try:
+    from storage_backends import (
+        StorageBackend,
+        LocalFileBackend,
+        DynamoDBBackend,
+        S3Backend,
+        create_storage_backend,
+        StorageError,
+    )
+except ImportError:
+    sys.path.insert(0, os.path.dirname(os.path.abspath(__file__)))
+    from storage_backends import (
+        StorageBackend,
+        LocalFileBackend,
+        DynamoDBBackend,
+        S3Backend,
+        create_storage_backend,
+        StorageError,
+    )
 
 # --- ENHANCED REGULAR EXPRESSIONS TO DETECT COMMON ATTACK PATTERNS ---
 # FIX: All patterns are now combined into a single string separated by '|'
@@ -162,6 +189,752 @@
     re.IGNORECASE,
 )
 
+# --- KNOWN MALICIOUS USER AGENTS ---
+SCANNER_USER_AGENTS = re.compile(
+    r"(zgrab|nmap|nikto|sqlmap|dirbuster|gobuster|nuclei|wpscan|"
+    r"masscan|shodan|censys|zmap|httpx|feroxbuster|ffuf|"
+    r"python-requests|go-http-client|curl/|wget/|"
+    r"scanner|crawler|spider|bot|scraper|"
+    r"java/\d|libwww-perl|lwp-trivial)",
+    re.IGNORECASE,
+)
+
+# --- SUSPICIOUS USER AGENT PATTERNS (lower confidence than scanners) ---
+SUSPICIOUS_UA_PATTERNS = re.compile(
+    r"(python|java|php|ruby|perl|curl|wget|libwww|"
+    r"httpclient|okhttp|apache-http|axios|node-fetch)",
+    re.IGNORECASE,
+)
+
+# --- AWS IP RANGES CONFIGURATION ---
+AWS_IP_RANGES_URL = "https://ip-ranges.amazonaws.com/ip-ranges.json"
+IP_RANGES_MAX_AGE_DAYS = 7  # Re-download if older than 7 days
+
+# AWS service names from ip-ranges.json
+# See: https://docs.aws.amazon.com/vpc/latest/userguide/aws-ip-ranges.html
+AWS_SERVICE_ROUTE53_HEALTHCHECKS = 'ROUTE53_HEALTHCHECKS'
+AWS_SERVICE_CLOUDFRONT = 'CLOUDFRONT'
+AWS_SERVICE_ELB = 'ELB'
+AWS_SERVICE_EC2 = 'EC2'
+AWS_SERVICE_AMAZON = 'AMAZON'
+
+# --- KNOWN LEGITIMATE SERVICES CONFIGURATION ---
+# SECURITY NOTE: No hardcoded IPs! AWS services verified via ip-ranges.json service tags.
+KNOWN_LEGITIMATE_SERVICES = {
+    'Route53-Health-Check': {
+        'ua_pattern': re.compile(r'^Amazon-Route53-Health-Check', re.IGNORECASE),
+        # Verify IP is from ROUTE53_HEALTHCHECKS service in ip-ranges.json
+        'aws_service': AWS_SERVICE_ROUTE53_HEALTHCHECKS,
+        'require_service_match': True,
+    },
+    'ELB-HealthChecker': {
+        'ua_pattern': re.compile(r'^ELB-HealthChecker', re.IGNORECASE),
+        'aws_service': AWS_SERVICE_ELB,
+        'require_service_match': True,
+    },
+    'CloudFront': {
+        'ua_pattern': re.compile(r'^Amazon CloudFront', re.IGNORECASE),
+        'aws_service': AWS_SERVICE_CLOUDFRONT,
+        'require_service_match': True,
+    },
+    # Non-AWS services: require path matching since we can't verify IPs
+    # These only get -15 (vs -25 for AWS), so even if spoofed, won't bypass threshold alone
+    'Datadog': {
+        'ua_pattern': re.compile(r'Datadog', re.IGNORECASE),
+        'expected_paths': ['/health', '/metrics', '/status', '/api/v1', '/info'],
+        'require_path_match': True,
+    },
+    'NewRelic': {
+        'ua_pattern': re.compile(r'NewRelic', re.IGNORECASE),
+        'expected_paths': ['/health', '/status', '/ping'],
+        'require_path_match': True,
+    },
+    'Pingdom': {
+        'ua_pattern': re.compile(r'Pingdom', re.IGNORECASE),
+        'expected_paths': ['/health', '/status', '/ping', '/'],
+        'require_path_match': True,
+    },
+    'UptimeRobot': {
+        'ua_pattern': re.compile(r'UptimeRobot', re.IGNORECASE),
+        'expected_paths': ['/health', '/status', '/'],
+        'require_path_match': True,
+    },
+}
+
+
+def get_ip_ranges_path() -> str:
+    """
+    Get appropriate path for ip-ranges.json based on environment.
+
+    - Lambda: /tmp (re-download on cold start, ~500ms, acceptable)
+    - ECS with EFS: /mnt/efs (persistent)
+    - EC2/VM: ./ip-ranges.json (persistent)
+
+    Note: We intentionally skip S3 caching to avoid IAM complexity.
+    The ~500ms download time on Lambda cold start is acceptable.
+    """
+    # Lambda environment
+    if os.environ.get('AWS_LAMBDA_FUNCTION_NAME'):
+        return '/tmp/ip-ranges.json'
+
+    # ECS with EFS mount
+    if os.path.exists('/mnt/efs') and os.access('/mnt/efs', os.W_OK):
+        return '/mnt/efs/cache/ip-ranges.json'
+
+    # Default: current directory
+    return './ip-ranges.json'
+
+
+def download_aws_ip_ranges(
+    file_path: str,
+    max_age_days: int = IP_RANGES_MAX_AGE_DAYS
+) -> Optional[Dict]:
+    """
+    Download AWS IP ranges if missing or stale.
+
+    Args:
+        file_path: Path to save the ip-ranges.json file
+        max_age_days: Re-download if file is older than this many days
+
+    Returns:
+        Parsed JSON data if successful, None otherwise
+    """
+    path = Path(file_path)
+    is_lambda = os.environ.get('AWS_LAMBDA_FUNCTION_NAME') is not None
+
+    # Check freshness (Lambda always re-downloads on cold start)
+    if path.exists() and not is_lambda:
+        file_age = datetime.now() - datetime.fromtimestamp(path.stat().st_mtime)
+        if file_age < timedelta(days=max_age_days):
+            logging.debug(f"AWS IP ranges fresh ({file_age.days}d old), loading from cache")
+            try:
+                with open(path) as f:
+                    return json.load(f)
+            except json.JSONDecodeError:
+                logging.warning("Cached IP ranges corrupted, re-downloading")
+
+    # Download using requests
+    logging.info(f"Downloading AWS IP ranges from {AWS_IP_RANGES_URL}...")
+    try:
+        response = requests.get(
+            AWS_IP_RANGES_URL,
+            timeout=30,
+            headers={'User-Agent': 'aws-auto-block-attackers/2.0'}
+        )
+        response.raise_for_status()
+        data = response.json()
+
+        # Save for future use (skip on Lambda - /tmp is ephemeral anyway)
+        if not is_lambda:
+            path.parent.mkdir(parents=True, exist_ok=True)
+            with open(path, 'w') as f:
+                json.dump(data, f)
+            logging.info(
+                f"Successfully downloaded AWS IP ranges ({len(response.content) / 1024:.1f} KB) "
+                f"to {file_path}"
+            )
+        else:
+            logging.info(
+                f"Downloaded AWS IP ranges ({len(response.content) / 1024:.1f} KB) "
+                f"(Lambda env, not caching)"
+            )
+
+        return data
+
+    except requests.exceptions.Timeout:
+        logging.warning("Timeout downloading AWS IP ranges (30s)")
+    except requests.exceptions.RequestException as e:
+        logging.warning(f"Failed to download AWS IP ranges: {e}")
+    except json.JSONDecodeError as e:
+        logging.warning(f"Downloaded AWS IP ranges file is invalid JSON: {e}")
+    except Exception as e:
+        logging.warning(f"Unexpected error downloading AWS IP ranges: {e}")
+
+    # Fallback: try loading stale cache
+    if path.exists():
+        logging.info("Using stale cached IP ranges as fallback")
+        try:
+            with open(path) as f:
+                return json.load(f)
+        except Exception:
+            pass
+
+    logging.warning(
+        "No AWS IP ranges available. AWS IPs will not be excluded. "
+        "Some legitimate AWS service traffic may be blocked."
+    )
+    return None
+
+
+@dataclass
+class AWSIPRangeIndex:
+    """
+    Sorted index for O(log N) AWS IP lookups with service mapping.
+
+    Features:
+    - Binary search for fast IP-in-range checks
+    - Service-based verification (e.g., is IP from ROUTE53_HEALTHCHECKS?)
+    - No hardcoded IPs - all data from ip-ranges.json
+
+    Performance: O(log N) per lookup, where N ≈ 10,000 ranges
+    """
+    # For general "is AWS IP" checks: List of (start_int, end_int, cidr_str)
+    ipv4_ranges: List[Tuple[int, int, str]] = field(default_factory=list)
+    ipv6_ranges: List[Tuple[int, int, str]] = field(default_factory=list)
+
+    # For service-specific checks: service_name -> List of (start_int, end_int)
+    service_ranges_v4: Dict[str, List[Tuple[int, int]]] = field(default_factory=lambda: defaultdict(list))
+    service_ranges_v6: Dict[str, List[Tuple[int, int]]] = field(default_factory=lambda: defaultdict(list))
+
+    # Statistics
+    total_ipv4: int = 0
+    total_ipv6: int = 0
+    services: Set[str] = field(default_factory=set)
+
+    # Lookup statistics
+    _lookup_hits: int = 0
+    _lookup_misses: int = 0
+
+    @classmethod
+    def from_json_data(cls, data: Dict) -> 'AWSIPRangeIndex':
+        """Build index from ip-ranges.json data."""
+        index = cls()
+
+        # Process IPv4 prefixes
+        for prefix in data.get('prefixes', []):
+            ip_prefix = prefix.get('ip_prefix')
+            service = prefix.get('service', 'UNKNOWN')
+
+            if not ip_prefix:
+                continue
+
+            try:
+                network = ipaddress.ip_network(ip_prefix, strict=False)
+                start_int = int(network.network_address)
+                end_int = int(network.broadcast_address)
+
+                index.ipv4_ranges.append((start_int, end_int, ip_prefix))
+                index.service_ranges_v4[service].append((start_int, end_int))
+                index.services.add(service)
+            except ValueError:
+                continue
+
+        # Process IPv6 prefixes
+        for prefix in data.get('ipv6_prefixes', []):
+            ip_prefix = prefix.get('ipv6_prefix')
+            service = prefix.get('service', 'UNKNOWN')
+
+            if not ip_prefix:
+                continue
+
+            try:
+                network = ipaddress.ip_network(ip_prefix, strict=False)
+                start_int = int(network.network_address)
+                end_int = int(network.broadcast_address)
+
+                index.ipv6_ranges.append((start_int, end_int, ip_prefix))
+                index.service_ranges_v6[service].append((start_int, end_int))
+                index.services.add(service)
+            except ValueError:
+                continue
+
+        # Sort all ranges for binary search
+        index.ipv4_ranges.sort(key=lambda x: x[0])
+        index.ipv6_ranges.sort(key=lambda x: x[0])
+
+        for service in index.service_ranges_v4:
+            index.service_ranges_v4[service].sort(key=lambda x: x[0])
+        for service in index.service_ranges_v6:
+            index.service_ranges_v6[service].sort(key=lambda x: x[0])
+
+        index.total_ipv4 = len(index.ipv4_ranges)
+        index.total_ipv6 = len(index.ipv6_ranges)
+
+        # Log summary of services
+        top_services = sorted(index.services)[:5]
+        logging.info(
+            f"Built AWS IP index: {index.total_ipv4} IPv4, {index.total_ipv6} IPv6 ranges, "
+            f"{len(index.services)} services ({', '.join(top_services)}...)"
+        )
+
+        return index
+
+    def is_aws_ip(self, ip_str: str) -> bool:
+        """
+        O(log N) check if IP belongs to any AWS range.
+
+        Args:
+            ip_str: IP address string (IPv4 or IPv6)
+
+        Returns:
+            True if IP is from AWS
+        """
+        result = self._bisect_lookup(ip_str) is not None
+        if result:
+            self._lookup_hits += 1
+        else:
+            self._lookup_misses += 1
+        return result
+
+    def is_from_service(self, ip_str: str, service_name: str) -> bool:
+        """
+        Check if IP belongs to a specific AWS service.
+
+        This enables dynamic verification without hardcoded IPs.
+        Service names come from ip-ranges.json (e.g., 'ROUTE53_HEALTHCHECKS', 'CLOUDFRONT').
+
+        Handles overlapping ranges by searching backwards from bisect position.
+
+        Args:
+            ip_str: IP address to check
+            service_name: AWS service name from ip-ranges.json
+
+        Returns:
+            True if IP belongs to the specified service
+        """
+        try:
+            ip = ipaddress.ip_address(ip_str)
+            ip_int = int(ip)
+
+            if ip.version == 4:
+                ranges = self.service_ranges_v4.get(service_name, [])
+            else:
+                ranges = self.service_ranges_v6.get(service_name, [])
+
+            if not ranges:
+                return False
+
+            # Binary search in service-specific ranges
+            starts = [r[0] for r in ranges]
+            initial_idx = bisect.bisect_right(starts, ip_int) - 1
+
+            if initial_idx < 0:
+                return False
+
+            # Check current and previous ranges for overlapping ranges
+            # Limit search to 100 ranges back to avoid O(n) worst case
+            idx = initial_idx
+            while idx >= 0 and idx > initial_idx - 100:
+                start_int, end_int = ranges[idx]
+
+                if start_int <= ip_int <= end_int:
+                    return True
+
+                idx -= 1
+
+            return False
+
+        except ValueError:
+            return False
+
+    def get_service_for_ip(self, ip_str: str) -> Optional[str]:
+        """
+        Get the AWS service name for an IP address.
+
+        Handles overlapping ranges by searching backwards from bisect position.
+
+        Args:
+            ip_str: IP address to check
+
+        Returns:
+            Service name if found, None otherwise
+        """
+        try:
+            ip = ipaddress.ip_address(ip_str)
+            ip_int = int(ip)
+
+            service_ranges = self.service_ranges_v4 if ip.version == 4 else self.service_ranges_v6
+
+            for service_name, ranges in service_ranges.items():
+                if not ranges:
+                    continue
+
+                starts = [r[0] for r in ranges]
+                initial_idx = bisect.bisect_right(starts, ip_int) - 1
+
+                if initial_idx < 0:
+                    continue
+
+                # Check current and previous ranges for overlapping ranges
+                # Limit search to 100 ranges back to avoid O(n) worst case
+                idx = initial_idx
+                while idx >= 0 and idx > initial_idx - 100:
+                    start_int, end_int = ranges[idx]
+
+                    if start_int <= ip_int <= end_int:
+                        return service_name
+
+                    idx -= 1
+
+            return None
+
+        except ValueError:
+            return None
+
+    def _bisect_lookup(self, ip_str: str) -> Optional[str]:
+        """
+        Binary search for IP in all ranges.
+
+        Handles overlapping ranges (e.g., /16 and /26 subnets) by searching
+        backwards from the bisect position. AWS IP ranges contain overlapping
+        CIDRs where a /16 may be followed by smaller /26 subnets with higher
+        start addresses but lower end addresses.
+
+        Returns matching CIDR or None.
+        """
+        try:
+            ip = ipaddress.ip_address(ip_str)
+            ip_int = int(ip)
+
+            ranges = self.ipv4_ranges if ip.version == 4 else self.ipv6_ranges
+
+            if not ranges:
+                return None
+
+            # Binary search: find rightmost range where start <= ip_int
+            starts = [r[0] for r in ranges]
+            idx = bisect.bisect_right(starts, ip_int) - 1
+
+            if idx < 0:
+                return None
+
+            # Check current and previous ranges for overlapping ranges
+            # We must check backwards because a /16 (with lower start but higher end)
+            # may be before a /26 (with higher start but lower end)
+            # Track the maximum end seen - if we see a range where end >= ip_int,
+            # there's potential for earlier ranges to contain the IP
+            max_end_seen = 0
+            while idx >= 0:
+                start_int, end_int, cidr = ranges[idx]
+
+                if start_int <= ip_int <= end_int:
+                    return cidr
+
+                max_end_seen = max(max_end_seen, end_int)
+
+                # We can stop if ALL ranges from here backwards have start > ip_int
+                # But since ranges are sorted by start and we started at rightmost start <= ip_int,
+                # earlier ranges also have start <= ip_int. So we need a different exit condition:
+                # If max_end_seen < ip_int and current start is far enough from ip_int that
+                # no /8 or larger could contain it, we can stop.
+                # For simplicity, limit the backwards search to avoid O(n) worst case.
+                # AWS ranges are dense, so checking ~100 ranges back should cover most overlaps.
+                if idx < (bisect.bisect_right(starts, ip_int) - 1) - 100:
+                    break
+
+                idx -= 1
+
+            return None
+
+        except ValueError:
+            return None
+
+    def get_lookup_stats(self) -> Tuple[int, int, float]:
+        """
+        Get lookup statistics.
+
+        Returns:
+            Tuple of (hits, misses, hit_rate_percent)
+        """
+        total = self._lookup_hits + self._lookup_misses
+        hit_rate = (self._lookup_hits / total * 100) if total > 0 else 0.0
+        return self._lookup_hits, self._lookup_misses, hit_rate
+
+
+# Module-level index (singleton)
+_aws_ip_index: Optional[AWSIPRangeIndex] = None
+
+
+def _clean_path(url_or_path: str) -> str:
+    """
+    Extract and clean the path component from a URL or path string.
+
+    Removes query parameters and fragments to prevent bypass attempts like:
+    /login?redirect=/health  (would incorrectly match '/health' if not cleaned)
+
+    Args:
+        url_or_path: Full URL or path string
+
+    Returns:
+        Clean path without query params or fragments
+    """
+    # Handle full URLs
+    if '://' in url_or_path:
+        parsed = urlparse(url_or_path)
+        path = parsed.path
+    else:
+        # Just a path - split off query string
+        path = url_or_path.split('?')[0].split('#')[0]
+
+    # Normalize: ensure leading slash, remove trailing slash (except for root)
+    if not path.startswith('/'):
+        path = '/' + path
+    if path != '/' and path.endswith('/'):
+        path = path.rstrip('/')
+
+    return path
+
+
+def _path_matches(req_path: str, expected_path: str) -> bool:
+    """
+    Check if request path matches expected path (prefix match).
+
+    More secure than simple 'in' check:
+    - /health matches /health, /health/check, /healthz
+    - /health does NOT match /login?ref=/health
+
+    Args:
+        req_path: Actual request path (will be cleaned)
+        expected_path: Expected path pattern
+
+    Returns:
+        True if path matches
+    """
+    clean_req = _clean_path(req_path)
+    clean_expected = expected_path.rstrip('/')
+
+    # Exact match
+    if clean_req == clean_expected:
+        return True
+
+    # Prefix match (e.g., /health matches /health/check)
+    if clean_expected and clean_req.startswith(clean_expected + '/'):
+        return True
+
+    # Root path special case
+    if clean_expected == '/' and clean_req == '/':
+        return True
+
+    return False
+
+
+def verify_legitimate_service(
+    ip: str,
+    ua: str,
+    request_paths: List[str],
+    aws_index: Optional[AWSIPRangeIndex] = None
+) -> Tuple[int, Optional[str], Optional[str]]:
+    """
+    Verify if traffic is from a known legitimate service.
+
+    SECURITY: NEVER trusts UA alone. Requires secondary verification:
+    - AWS services: IP must belong to correct AWS service (dynamic lookup via ip-ranges.json)
+    - Non-AWS services: Request paths must match expected patterns (cleaned, no query params)
+
+    FAIL-CLOSED: If aws_index is unavailable, AWS services cannot be verified.
+    This may cause false positives but maintains security.
+
+    Args:
+        ip: Client IP address
+        ua: User-Agent string
+        request_paths: List of request paths/URLs from this IP
+        aws_index: AWSIPRangeIndex for service verification (built from ip-ranges.json)
+
+    Returns:
+        (score_adjustment, service_name, verification_method)
+        - score_adjustment: Negative value to reduce threat score (-25 for AWS, -15 for path match)
+        - service_name: Name of verified service, or None
+        - verification_method: How it was verified ('aws_service', 'path_match', None)
+    """
+    if not ua:
+        return 0, None, None
+
+    for service_name, config in KNOWN_LEGITIMATE_SERVICES.items():
+        # Step 1: Check UA pattern (anchored patterns prevent injection like "Evil-Amazon-Route53...")
+        if not config['ua_pattern'].search(ua):
+            continue
+
+        # UA matched - now REQUIRE secondary verification (don't trust UA alone!)
+
+        # Step 2a: AWS service verification (dynamic, no hardcoded IPs)
+        if config.get('require_service_match'):
+            aws_service = config.get('aws_service')
+
+            if aws_index is None:
+                # FAIL-CLOSED: Can't verify without index - don't give negative score
+                # This is intentional: security over availability
+                logging.warning(
+                    f"UA matches {service_name} but AWS IP index unavailable. "
+                    f"Cannot verify IP {ip}. This may cause false positive. "
+                    f"Check if ip-ranges.json download failed."
+                )
+                continue
+
+            if aws_service and aws_index.is_from_service(ip, aws_service):
+                # VERIFIED: UA + IP matches AWS service
+                logging.debug(
+                    f"Verified legitimate AWS service: {service_name} "
+                    f"(IP {ip} confirmed in {aws_service} range)"
+                )
+                return -25, service_name, 'aws_service'
+            else:
+                # SUSPICIOUS: UA claims to be AWS service but IP doesn't match!
+                logging.warning(
+                    f"SPOOFING ALERT: UA claims to be {service_name} but IP {ip} "
+                    f"is NOT in {aws_service} range. Possible attack vector."
+                )
+                # Don't give negative score - likely spoofing attempt
+                continue
+
+        # Step 2b: Path-based verification (for non-AWS services like Datadog)
+        # Uses cleaned paths to prevent bypass via query params
+        if config.get('require_path_match'):
+            expected_paths = config.get('expected_paths', [])
+
+            # Check if any request path matches expected patterns
+            path_matched = False
+            matched_path = None
+            for req_path in request_paths:
+                for expected in expected_paths:
+                    if _path_matches(req_path, expected):
+                        path_matched = True
+                        matched_path = expected
+                        break
+                if path_matched:
+                    break
+
+            if path_matched:
+                logging.debug(
+                    f"Verified legitimate service: {service_name} "
+                    f"(UA + path '{matched_path}' match)"
+                )
+                return -15, service_name, 'path_match'
+            else:
+                # UA matches but paths don't - be cautious
+                sample_paths = [_clean_path(p) for p in request_paths[:3]]
+                logging.debug(
+                    f"UA claims {service_name} but paths {sample_paths} "
+                    f"don't match expected {expected_paths}. Not giving negative score."
+                )
+                continue
+
+    return 0, None, None
+
+
+# --- MULTI-SIGNAL THREAT DETECTION CONFIGURATION ---
+DEFAULT_THREAT_SIGNALS_CONFIG = {
+    # Weights for different threat signals (sum should ideally be around 100)
+    "attack_pattern_weight": 40,  # Pattern match in request
+    "scanner_ua_weight": 25,  # Known scanner user agent
+    "error_rate_weight": 20,  # High 4xx/5xx response rate
+    "path_diversity_weight": 10,  # Many unique paths (scanning behavior)
+    "rate_weight": 5,  # High request rate
+
+    # Thresholds
+    "error_rate_threshold": 0.7,  # 70% error responses
+    "path_diversity_threshold": 0.8,  # 80% unique paths
+    "rate_threshold": 100,  # 100+ requests in time window
+
+    # Minimum score to be considered malicious (out of 100)
+    "min_threat_score": 40,
+
+    # Enable/disable multi-signal mode
+    "enabled": True,
+}
+
+
+class ThreatSignals:
+    """
+    Tracks multiple threat signals for an IP address.
+    Used for multi-signal threat detection to reduce false positives.
+    """
+
+    def __init__(self):
+        self.attack_pattern_hits: int = 0
+        self.scanner_ua_hits: int = 0
+        self.error_responses: int = 0  # 4xx/5xx responses
+        self.total_requests: int = 0
+        self.unique_paths: Set[str] = set()
+        self.first_seen: Optional[datetime] = None
+        self.last_seen: Optional[datetime] = None
+
+    def add_request(
+        self,
+        has_attack_pattern: bool,
+        has_scanner_ua: bool,
+        status_code: int,
+        path: str,
+        timestamp: Optional[datetime] = None,
+    ):
+        """Record a request and its signals."""
+        self.total_requests += 1
+
+        if has_attack_pattern:
+            self.attack_pattern_hits += 1
+
+        if has_scanner_ua:
+            self.scanner_ua_hits += 1
+
+        if status_code >= 400:
+            self.error_responses += 1
+
+        self.unique_paths.add(path)
+
+        if timestamp:
+            if self.first_seen is None or timestamp < self.first_seen:
+                self.first_seen = timestamp
+            if self.last_seen is None or timestamp > self.last_seen:
+                self.last_seen = timestamp
+
+    def calculate_threat_score(self, config: Dict) -> Tuple[float, Dict[str, float]]:
+        """
+        Calculate overall threat score based on multiple signals.
+
+        Returns:
+            Tuple of (total_score, breakdown_dict)
+        """
+        if self.total_requests == 0:
+            return 0.0, {}
+
+        breakdown = {}
+
+        # 1. Attack pattern signal
+        pattern_ratio = self.attack_pattern_hits / self.total_requests
+        pattern_score = pattern_ratio * config["attack_pattern_weight"]
+        breakdown["attack_pattern"] = pattern_score
+
+        # 2. Scanner user agent signal
+        scanner_ratio = self.scanner_ua_hits / self.total_requests
+        scanner_score = scanner_ratio * config["scanner_ua_weight"]
+        breakdown["scanner_ua"] = scanner_score
+
+        # 3. Error response rate signal
+        error_ratio = self.error_responses / self.total_requests
+        if error_ratio >= config["error_rate_threshold"]:
+            error_score = config["error_rate_weight"]
+        else:
+            error_score = (error_ratio / config["error_rate_threshold"]) * config["error_rate_weight"]
+        breakdown["error_rate"] = error_score
+
+        # 4. Path diversity signal (scanning behavior)
+        path_diversity = len(self.unique_paths) / self.total_requests if self.total_requests > 0 else 0
+        if path_diversity >= config["path_diversity_threshold"]:
+            diversity_score = config["path_diversity_weight"]
+        else:
+            diversity_score = (path_diversity / config["path_diversity_threshold"]) * config["path_diversity_weight"]
+        breakdown["path_diversity"] = diversity_score
+
+        # 5. Request rate signal
+        if self.total_requests >= config["rate_threshold"]:
+            rate_score = config["rate_weight"]
+        else:
+            rate_score = (self.total_requests / config["rate_threshold"]) * config["rate_weight"]
+        breakdown["rate"] = rate_score
+
+        total_score = sum(breakdown.values())
+        return total_score, breakdown
+
+    def is_malicious(self, config: Dict) -> Tuple[bool, float, Dict[str, float]]:
+        """
+        Determine if this IP should be considered malicious based on threat score.
+
+        Returns:
+            Tuple of (is_malicious, score, breakdown)
+        """
+        score, breakdown = self.calculate_threat_score(config)
+        return score >= config["min_threat_score"], score, breakdown
+
+
 # --- TIERED BLOCKING CONFIGURATION ---
 # Each tier: (min_hits, block_duration, tier_name, priority)
 # Priority: Higher number = higher priority (won't be displaced by lower priority)
@@ -174,15 +947,195 @@
 ]
 
 
-def setup_logging(debug: bool = False):
-    """Configures logging level."""
+class JsonFormatter(logging.Formatter):
+    """
+    JSON formatter for structured logging (CloudWatch Logs compatible).
+    """
+
+    def format(self, record: logging.LogRecord) -> str:
+        log_dict = {
+            "timestamp": datetime.now(timezone.utc).isoformat(),
+            "level": record.levelname,
+            "logger": record.name,
+            "message": record.getMessage(),
+            "module": record.module,
+            "function": record.funcName,
+            "line": record.lineno,
+        }
+
+        # Add exception info if present
+        if record.exc_info:
+            log_dict["exception"] = self.formatException(record.exc_info)
+
+        # Add extra fields if provided
+        if hasattr(record, "extra_fields"):
+            log_dict.update(record.extra_fields)
+
+        return json.dumps(log_dict)
+
+
+def setup_logging(debug: bool = False, json_format: bool = False):
+    """
+    Configures logging level and format.
+
+    Args:
+        debug: Enable debug level logging
+        json_format: Use JSON structured logging format (for CloudWatch Logs)
+    """
     log_level = logging.DEBUG if debug else logging.INFO
-    # Force reconfiguration even if basicConfig was already called
-    logging.basicConfig(
-        level=log_level,
-        format="%(asctime)s - %(levelname)s - %(message)s",
-        force=True,  # Python 3.8+ - forces reconfiguration
-    )
+
+    # Remove all existing handlers
+    root_logger = logging.getLogger()
+    for handler in root_logger.handlers[:]:
+        root_logger.removeHandler(handler)
+
+    # Create console handler
+    handler = logging.StreamHandler()
+    handler.setLevel(log_level)
+
+    if json_format:
+        handler.setFormatter(JsonFormatter())
+    else:
+        handler.setFormatter(
+            logging.Formatter("%(asctime)s - %(levelname)s - %(message)s")
+        )
+
+    root_logger.setLevel(log_level)
+    root_logger.addHandler(handler)
+
+
+class CloudWatchMetrics:
+    """
+    CloudWatch metrics publisher for monitoring the blocker's activity.
+
+    Publishes custom metrics to AWS CloudWatch for:
+    - IPs blocked/unblocked
+    - Attack patterns detected
+    - Processing performance
+    - Error rates
+    """
+
+    def __init__(
+        self,
+        namespace: str = "AutoBlockAttackers",
+        region: str = "us-east-1",
+        enabled: bool = True,
+        dry_run: bool = False,
+    ):
+        """
+        Initialize CloudWatch metrics publisher.
+
+        Args:
+            namespace: CloudWatch metrics namespace
+            region: AWS region
+            enabled: Whether to publish metrics
+            dry_run: If True, log metrics instead of publishing
+        """
+        self.namespace = namespace
+        self.enabled = enabled
+        self.dry_run = dry_run
+        self._metric_buffer: List[Dict] = []
+        self._buffer_size = 20  # AWS CloudWatch limit per API call
+        self._cloudwatch = None
+
+        if enabled:
+            try:
+                boto_config = Config(
+                    connect_timeout=5,
+                    read_timeout=10,
+                    retries={"max_attempts": 3, "mode": "adaptive"},
+                )
+                self._cloudwatch = boto3.client(
+                    "cloudwatch", region_name=region, config=boto_config
+                )
+                logging.info(f"CloudWatch metrics enabled (namespace: {namespace})")
+            except Exception as e:
+                logging.warning(f"Failed to initialize CloudWatch metrics: {e}")
+                self.enabled = False
+
+    def put_metric(
+        self,
+        metric_name: str,
+        value: float,
+        unit: str = "Count",
+        dimensions: Optional[Dict[str, str]] = None,
+    ):
+        """
+        Queue a metric for publishing to CloudWatch.
+
+        Args:
+            metric_name: Name of the metric
+            value: Metric value
+            unit: Metric unit (Count, Seconds, Bytes, etc.)
+            dimensions: Optional dimension key-value pairs
+        """
+        if not self.enabled:
+            return
+
+        metric_data = {
+            "MetricName": metric_name,
+            "Value": value,
+            "Unit": unit,
+            "Timestamp": datetime.now(timezone.utc),
+        }
+
+        if dimensions:
+            metric_data["Dimensions"] = [
+                {"Name": k, "Value": v} for k, v in dimensions.items()
+            ]
+
+        self._metric_buffer.append(metric_data)
+
+        # Flush if buffer is full
+        if len(self._metric_buffer) >= self._buffer_size:
+            self.flush()
+
+    def put_count(
+        self,
+        metric_name: str,
+        count: int = 1,
+        dimensions: Optional[Dict[str, str]] = None,
+    ):
+        """Convenience method for count metrics."""
+        self.put_metric(metric_name, float(count), "Count", dimensions)
+
+    def put_timing(
+        self,
+        metric_name: str,
+        seconds: float,
+        dimensions: Optional[Dict[str, str]] = None,
+    ):
+        """Convenience method for timing metrics in seconds."""
+        self.put_metric(metric_name, seconds, "Seconds", dimensions)
+
+    def flush(self):
+        """Publish all buffered metrics to CloudWatch."""
+        if not self._metric_buffer:
+            return
+
+        if self.dry_run:
+            logging.debug(
+                f"[DRY-RUN] Would publish {len(self._metric_buffer)} metrics to CloudWatch"
+            )
+            self._metric_buffer.clear()
+            return
+
+        if not self.enabled or not self._cloudwatch:
+            self._metric_buffer.clear()
+            return
+
+        try:
+            # Split into chunks of 20 (AWS limit)
+            for i in range(0, len(self._metric_buffer), self._buffer_size):
+                chunk = self._metric_buffer[i : i + self._buffer_size]
+                self._cloudwatch.put_metric_data(
+                    Namespace=self.namespace, MetricData=chunk
+                )
+            logging.debug(f"Published {len(self._metric_buffer)} metrics to CloudWatch")
+        except ClientError as e:
+            logging.warning(f"Failed to publish CloudWatch metrics: {e}")
+        finally:
+            self._metric_buffer.clear()
 
 
 def is_valid_public_ipv4(ip_str: str) -> bool:
@@ -201,54 +1154,235 @@ def is_valid_public_ipv4(ip_str: str) -> bool:
         return False
 
 
-def load_aws_ip_ranges(file_path: Optional[str]) -> Set[ipaddress.IPv4Network]:
+def is_valid_public_ip(ip_str: str) -> Tuple[bool, int]:
+    """
+    Checks if a string is a valid, public IP address (IPv4 or IPv6).
+
+    Args:
+        ip_str: String representation of an IP address
+
+    Returns:
+        Tuple of (is_valid, version) where version is 4 or 6.
+        Returns (False, 0) for invalid addresses.
+    """
+    try:
+        ip = ipaddress.ip_address(ip_str)
+
+        # Check if it's a public IP (not private, loopback, etc.)
+        is_public = (
+            not ip.is_private
+            and not ip.is_loopback
+            and not ip.is_link_local
+            and not ip.is_multicast
+            and not ip.is_reserved
+        )
+
+        # Additional check for IPv6 site-local addresses (deprecated but still exist)
+        if ip.version == 6:
+            # Check for unique local addresses (fc00::/7) - similar to private IPv4
+            if ip_str.lower().startswith(('fc', 'fd')):
+                is_public = False
+
+        return (is_public, ip.version) if is_public else (False, ip.version)
+    except ValueError:
+        return (False, 0)
+
+
+def load_aws_ip_ranges(
+    file_path: Optional[str],
+) -> Tuple[Set[ipaddress.IPv4Network], Set[ipaddress.IPv6Network]]:
     """
     Loads AWS IP ranges from ip-ranges.json file.
-    Returns a set of IPv4Network objects for efficient IP membership testing.
+
+    Args:
+        file_path: Path to the AWS ip-ranges.json file
+
+    Returns:
+        Tuple of (IPv4 networks set, IPv6 networks set) for efficient IP membership testing.
+
+    Note:
+        This function is maintained for backward compatibility.
+        For O(log N) lookups with service verification, use load_aws_ip_ranges_with_index().
     """
     if not file_path:
-        return set()
+        return set(), set()
 
     try:
         json_path = Path(file_path)
         if not json_path.exists():
             logging.warning(f"AWS IP ranges file not found: {file_path}")
-            return set()
+            return set(), set()
 
         with open(json_path, "r") as f:
             data = json.load(f)
 
-        aws_networks = set()
-        for prefix in data.get("prefixes", []):
-            ip_prefix = prefix.get("ip_prefix")
-            if ip_prefix and "/" in ip_prefix:
-                try:
-                    network = ipaddress.ip_network(ip_prefix, strict=False)
-                    if network.version == 4:  # Only IPv4
-                        aws_networks.add(network)
-                except ValueError:
-                    continue
+        aws_ipv4_networks = set()
+        aws_ipv6_networks = set()
+
+        # Load IPv4 prefixes
+        for prefix in data.get("prefixes", []):
+            ip_prefix = prefix.get("ip_prefix")
+            if ip_prefix and "/" in ip_prefix:
+                try:
+                    network = ipaddress.ip_network(ip_prefix, strict=False)
+                    if network.version == 4:
+                        aws_ipv4_networks.add(network)
+                except ValueError:
+                    continue
+
+        # Load IPv6 prefixes
+        for prefix in data.get("ipv6_prefixes", []):
+            ip_prefix = prefix.get("ipv6_prefix")
+            if ip_prefix and "/" in ip_prefix:
+                try:
+                    network = ipaddress.ip_network(ip_prefix, strict=False)
+                    if network.version == 6:
+                        aws_ipv6_networks.add(network)
+                except ValueError:
+                    continue
+
+        logging.info(
+            f"Loaded {len(aws_ipv4_networks)} AWS IPv4 and {len(aws_ipv6_networks)} AWS IPv6 ranges from {file_path}"
+        )
+        return aws_ipv4_networks, aws_ipv6_networks
+
+    except Exception as e:
+        logging.warning(f"Error loading AWS IP ranges from {file_path}: {e}")
+        return set(), set()
+
+
+def load_aws_ip_ranges_with_index(
+    file_path: Optional[str] = None,
+    auto_download: bool = True,
+) -> Tuple[Optional[AWSIPRangeIndex], Set[ipaddress.IPv4Network], Set[ipaddress.IPv6Network]]:
+    """
+    Load AWS IP ranges with O(log N) index and optional auto-download.
+
+    This function provides:
+    - Auto-download of ip-ranges.json if missing or stale
+    - O(log N) bisect-based lookups via AWSIPRangeIndex
+    - Service-based IP verification (Route53 health checks, CloudFront, etc.)
+    - Backward-compatible network sets for legacy code
+
+    Args:
+        file_path: Path to ip-ranges.json file. If None, uses environment-appropriate default.
+        auto_download: If True, download the file if missing or stale (default: True).
+                       Set to False for air-gapped environments.
+
+    Returns:
+        Tuple of (AWSIPRangeIndex, IPv4 network set, IPv6 network set)
+        - AWSIPRangeIndex: For O(log N) lookups and service verification. None if loading failed.
+        - IPv4 networks: Set for backward compatibility
+        - IPv6 networks: Set for backward compatibility
+    """
+    global _aws_ip_index
+
+    # Determine file path
+    if file_path is None:
+        file_path = get_ip_ranges_path()
+
+    # Try to load or download data
+    data = None
+    if auto_download:
+        data = download_aws_ip_ranges(file_path)
+    else:
+        # Load without downloading
+        path = Path(file_path)
+        if path.exists():
+            try:
+                with open(path) as f:
+                    data = json.load(f)
+                logging.info(f"Loaded AWS IP ranges from {file_path}")
+            except Exception as e:
+                logging.warning(f"Failed to load {file_path}: {e}")
+        else:
+            logging.warning(
+                f"AWS IP ranges file not found: {file_path}. "
+                f"Use --no-auto-download-ip-ranges=false to auto-download."
+            )
+
+    if not data:
+        return None, set(), set()
+
+    # Build the index
+    _aws_ip_index = AWSIPRangeIndex.from_json_data(data)
 
-        logging.info(f"Loaded {len(aws_networks)} AWS IPv4 ranges from {file_path}")
-        return aws_networks
+    # Also build network sets for backward compatibility
+    aws_ipv4_networks = set()
+    aws_ipv6_networks = set()
 
-    except Exception as e:
-        logging.warning(f"Error loading AWS IP ranges from {file_path}: {e}")
-        return set()
+    for prefix in data.get("prefixes", []):
+        ip_prefix = prefix.get("ip_prefix")
+        if ip_prefix and "/" in ip_prefix:
+            try:
+                network = ipaddress.ip_network(ip_prefix, strict=False)
+                if network.version == 4:
+                    aws_ipv4_networks.add(network)
+            except ValueError:
+                continue
+
+    for prefix in data.get("ipv6_prefixes", []):
+        ip_prefix = prefix.get("ipv6_prefix")
+        if ip_prefix and "/" in ip_prefix:
+            try:
+                network = ipaddress.ip_network(ip_prefix, strict=False)
+                if network.version == 6:
+                    aws_ipv6_networks.add(network)
+            except ValueError:
+                continue
+
+    return _aws_ip_index, aws_ipv4_networks, aws_ipv6_networks
 
 
-def is_aws_ip(ip_str: str, aws_networks: Set[ipaddress.IPv4Network]) -> bool:
+def is_aws_ip_fast(ip_str: str, aws_index: Optional[AWSIPRangeIndex] = None) -> bool:
     """
-    Checks if an IP address belongs to AWS IP ranges.
-    Uses early termination for efficiency.
+    O(log N) check if IP belongs to AWS ranges using bisect-based index.
+
+    This is the preferred method for production use. Falls back to False if
+    no index is available.
+
+    Args:
+        ip_str: IP address string to check
+        aws_index: Optional AWSIPRangeIndex. If None, uses global _aws_ip_index.
+
+    Returns:
+        True if the IP belongs to AWS, False otherwise.
     """
-    if not aws_networks:
+    index = aws_index or _aws_ip_index
+    if index is None:
         return False
+    return index.is_aws_ip(ip_str)
 
+
+def is_aws_ip(
+    ip_str: str,
+    aws_ipv4_networks: Set[ipaddress.IPv4Network],
+    aws_ipv6_networks: Optional[Set[ipaddress.IPv6Network]] = None,
+) -> bool:
+    """
+    Checks if an IP address belongs to AWS IP ranges.
+
+    Args:
+        ip_str: IP address string to check
+        aws_ipv4_networks: Set of AWS IPv4 networks
+        aws_ipv6_networks: Optional set of AWS IPv6 networks
+
+    Returns:
+        True if the IP belongs to AWS, False otherwise.
+    """
     try:
         ip = ipaddress.ip_address(ip_str)
-        # Iterate through networks - will return True immediately on first match
-        return any(ip in network for network in aws_networks)
+
+        if ip.version == 4:
+            if not aws_ipv4_networks:
+                return False
+            return any(ip in network for network in aws_ipv4_networks)
+        elif ip.version == 6:
+            if not aws_ipv6_networks:
+                return False
+            return any(ip in network for network in aws_ipv6_networks)
+
+        return False
     except ValueError:
         return False
 
@@ -275,33 +1409,108 @@ def __init__(
         ipinfo_token: Optional[str] = None,
         registry_file: Optional[str] = None,
         tier_config: Optional[List[Tuple]] = None,
+        storage_backend: Optional[str] = None,
+        dynamodb_table: Optional[str] = None,
+        s3_state_bucket: Optional[str] = None,
+        s3_state_key: Optional[str] = None,
+        create_dynamodb_table: bool = False,
+        # IPv6 support parameters
+        start_rule_ipv6: int = 180,
+        limit_ipv6: int = 20,
+        enable_ipv6: bool = True,
+        # Incremental processing
+        force_reprocess: bool = False,
+        # AWS WAF IP Set integration
+        waf_ip_set_name: Optional[str] = None,
+        waf_ip_set_scope: str = "REGIONAL",  # "REGIONAL" or "CLOUDFRONT"
+        waf_ip_set_id: Optional[str] = None,
+        create_waf_ip_set: bool = False,
+        # Structured logging & CloudWatch metrics
+        json_logging: bool = False,
+        enable_cloudwatch_metrics: bool = False,
+        cloudwatch_namespace: str = "AutoBlockAttackers",
+        # Multi-signal threat detection
+        enable_multi_signal: bool = True,
+        threat_signals_config: Optional[Dict] = None,
+        # Enhanced Slack notifications
+        enhanced_slack: bool = False,
+        # Athena integration for large-scale log analysis
+        athena_enabled: bool = False,
+        athena_database: str = "alb_logs",
+        athena_output_location: Optional[str] = None,
+        # Auto-download AWS IP ranges
+        auto_download_ip_ranges: bool = True,
     ):
-        setup_logging(debug)
+        setup_logging(debug, json_format=json_logging)
         logging.info("Initializing NaclAutoBlocker...")
+
+        # Multi-signal threat detection configuration
+        self._enable_multi_signal = enable_multi_signal
+        self._threat_signals_config = threat_signals_config or DEFAULT_THREAT_SIGNALS_CONFIG.copy()
+        if enable_multi_signal:
+            logging.info(
+                f"Multi-signal threat detection enabled (min score: {self._threat_signals_config['min_threat_score']})"
+            )
         self.lb_name_pattern = lb_name_pattern
         self.region = region
         self.lookback_delta = self._parse_lookback_period(lookback_str)
         self.threshold = threshold
-        # Calculate end rule based on start_rule and limit
+
+        # IPv4 NACL rule range
         end_rule = min(start_rule + limit, 100)
-        self.deny_rule_range = range(start_rule, end_rule)  # Managed DENY rules
+        self.deny_rule_range = range(start_rule, end_rule)  # Managed IPv4 DENY rules
         self.nacl_limit = limit
+
+        # IPv6 NACL rule range (separate from IPv4)
+        self.enable_ipv6 = enable_ipv6
+        end_rule_ipv6 = min(start_rule_ipv6 + limit_ipv6, 200)
+        self.deny_rule_range_ipv6 = range(start_rule_ipv6, end_rule_ipv6)
+        self.nacl_limit_ipv6 = limit_ipv6
+
+        if enable_ipv6:
+            logging.info(f"IPv6 blocking enabled: rules {start_rule_ipv6}-{end_rule_ipv6 - 1}")
+
         logging.info("Loading whitelist and AWS IP ranges...")
         self.whitelist = self._load_whitelist(whitelist_file)
-        self.aws_networks = load_aws_ip_ranges(aws_ip_ranges_file)
+
+        # Load AWS IP ranges with O(log N) index and optional auto-download
+        self._auto_download_ip_ranges = auto_download_ip_ranges
+        self.aws_ip_index, self.aws_ipv4_networks, self.aws_ipv6_networks = load_aws_ip_ranges_with_index(
+            file_path=aws_ip_ranges_file,
+            auto_download=auto_download_ip_ranges,
+        )
+        # Keep backward compatibility
+        self.aws_networks = self.aws_ipv4_networks
+
+        # Store debug mode for logging control
+        self._debug = debug
+
         self.dry_run = dry_run
 
         # Block registry for persistent time-based blocking
         self.registry_file = registry_file or "./block_registry.json"
         self.tier_config = tier_config or DEFAULT_TIER_CONFIG
         self.block_registry: Dict[str, Dict] = {}
-        logging.info(f"Using block registry file: {self.registry_file}")
+
+        # Initialize storage backend
+        self._storage_backend_type = storage_backend or "local"
+        self._storage_backend = self._init_storage_backend(
+            backend_type=self._storage_backend_type,
+            registry_file=self.registry_file,
+            dynamodb_table=dynamodb_table,
+            s3_bucket=s3_state_bucket,
+            s3_key=s3_state_key or "block_registry.json",
+            region=region,
+            create_dynamodb_table=create_dynamodb_table,
+        )
         self._load_block_registry()
 
         # Initialize Slack client if credentials provided
         self.slack_client = None
+        self._enhanced_slack = enhanced_slack
         if slack_token and slack_channel:
-            logging.info("Initializing Slack notifications...")
+            notification_type = "enhanced" if enhanced_slack else "basic"
+            logging.info(f"Initializing Slack notifications ({notification_type})...")
             self.slack_client = SlackClient(token=slack_token, channel=slack_channel)
         elif slack_token or slack_channel:
             logging.warning(
@@ -318,14 +1527,94 @@ def __init__(
         else:
             logging.info("No IPInfo token provided. IP geolocation disabled.")
 
+        # IPInfo circuit breaker state
+        self._ipinfo_failures = 0
+        self._ipinfo_circuit_open = False
+        self._ipinfo_failure_threshold = 3
+
+        # Failed Slack messages queue for retry
+        self._failed_slack_messages: List[Tuple[str, bool]] = []
+
+        # S3 processing error tracking
+        self._s3_processing_errors = 0
+
+        # Skipped IPs tracking (for dry-run summary)
+        self._skipped_ips: List[Tuple[str, float, Dict[str, Any]]] = []
+
+        # Incremental log processing state
+        self._force_reprocess = force_reprocess
+        self._processed_files: Dict[str, str] = {}  # key -> etag
+        self._processed_files_cache_key = "_processed_files_cache"
+        self._skipped_files_count = 0
+        self._new_files_count = 0
+
+        # Load processed files cache (only if not force_reprocess)
+        if not force_reprocess:
+            self._load_processed_files_cache()
+        else:
+            logging.info("Force reprocess enabled - ignoring processed files cache")
+
+        # Athena integration for large-scale log analysis
+        self._athena_enabled = athena_enabled
+        self._athena_database = athena_database
+        self._athena_output_location = athena_output_location
+        self._athena = None  # Lazy initialization
+        if athena_enabled:
+            if not athena_output_location:
+                logging.warning(
+                    "Athena enabled but no output location specified. "
+                    "Use --athena-output-location to specify S3 path for query results."
+                )
+                self._athena_enabled = False
+            else:
+                logging.info(
+                    f"Athena integration enabled (database: {athena_database}, "
+                    f"output: {athena_output_location})"
+                )
+
         logging.info("Initializing AWS clients (boto3)...")
+        # Enhanced boto config with adaptive retries for production stability
         boto_config = Config(
-            connect_timeout=10, read_timeout=15, retries={"max_attempts": 3}
+            connect_timeout=10,
+            read_timeout=30,
+            retries={
+                "max_attempts": 5,
+                "mode": "adaptive",  # Exponential backoff with jitter
+            },
         )
         self.ec2 = boto3.client("ec2", region_name=self.region, config=boto_config)
         self.elbv2 = boto3.client("elbv2", region_name=self.region, config=boto_config)
         self.s3 = boto3.client("s3", region_name=self.region, config=boto_config)
         self.sts = boto3.client("sts", region_name=self.region, config=boto_config)
+
+        # AWS WAF IP Set integration
+        self._waf_ip_set_name = waf_ip_set_name
+        self._waf_ip_set_scope = waf_ip_set_scope.upper()
+        self._waf_ip_set_id = waf_ip_set_id
+        self._create_waf_ip_set = create_waf_ip_set
+        self._waf_enabled = bool(waf_ip_set_name or waf_ip_set_id)
+        self._waf_ip_set_lock_token: Optional[str] = None
+        self._waf_max_addresses = 10000  # AWS WAF limit per IP set
+
+        if self._waf_enabled:
+            # CloudFront WAF must use us-east-1 region
+            waf_region = "us-east-1" if self._waf_ip_set_scope == "CLOUDFRONT" else self.region
+            self.wafv2 = boto3.client("wafv2", region_name=waf_region, config=boto_config)
+            logging.info(
+                f"AWS WAF integration enabled (scope: {self._waf_ip_set_scope}, region: {waf_region})"
+            )
+            self._init_waf_ip_set()
+        else:
+            self.wafv2 = None
+
+        # Initialize CloudWatch metrics
+        self._metrics = CloudWatchMetrics(
+            namespace=cloudwatch_namespace,
+            region=self.region,
+            enabled=enable_cloudwatch_metrics,
+            dry_run=dry_run,
+        )
+
         logging.info("Initialization complete. Ready to run.")
 
     def _parse_lookback_period(self, lookback_str: str) -> timedelta:
@@ -342,6 +1631,52 @@ def _parse_lookback_period(self, lookback_str: str) -> timedelta:
         else:  # unit == "d"
             return timedelta(days=value)
 
+    def _init_storage_backend(
+        self,
+        backend_type: str,
+        registry_file: str,
+        dynamodb_table: Optional[str],
+        s3_bucket: Optional[str],
+        s3_key: str,
+        region: str,
+        create_dynamodb_table: bool,
+    ) -> StorageBackend:
+        """
+        Initialize the appropriate storage backend based on configuration.
+
+        Args:
+            backend_type: Type of backend ('local', 'dynamodb', 's3')
+            registry_file: Path to local registry file
+            dynamodb_table: DynamoDB table name
+            s3_bucket: S3 bucket name
+            s3_key: S3 object key
+            region: AWS region
+            create_dynamodb_table: Whether to create DynamoDB table if missing
+
+        Returns:
+            StorageBackend: Configured storage backend instance
+        """
+        try:
+            backend = create_storage_backend(
+                backend_type=backend_type,
+                local_file=registry_file,
+                dynamodb_table=dynamodb_table,
+                s3_bucket=s3_bucket,
+                s3_key=s3_key,
+                region=region,
+                create_dynamodb_table=create_dynamodb_table,
+            )
+            logging.info(f"Storage backend initialized: {backend_type}")
+            return backend
+        except ValueError as e:
+            logging.error(f"Invalid storage backend configuration: {e}")
+            raise
+        except Exception as e:
+            logging.error(f"Failed to initialize storage backend: {e}")
+            # Fall back to local storage
+            logging.warning("Falling back to local file storage")
+            return LocalFileBackend(file_path=registry_file)
+
     def _load_whitelist(self, file_path: Optional[str]) -> Set[str]:
         if not file_path:
             return set()
@@ -361,50 +1696,28 @@ def _load_whitelist(self, file_path: Optional[str]) -> Set[str]:
             return set()
 
     def _load_block_registry(self):
-        """Loads the block registry from JSON file. Creates new if not exists or corrupted."""
+        """Loads the block registry from the configured storage backend."""
         try:
-            if os.path.exists(self.registry_file):
-                with open(self.registry_file, "r") as f:
-                    data = json.load(f)
-                    # Validate structure
-                    if isinstance(data, dict):
-                        self.block_registry = data
-                        logging.info(
-                            f"Loaded block registry with {len(self.block_registry)} IPs"
-                        )
-                    else:
-                        logging.warning(
-                            "Block registry has invalid structure. Starting fresh."
-                        )
-                        self.block_registry = {}
-            else:
-                logging.info(
-                    "Block registry file not found. Starting with empty registry."
-                )
-                self.block_registry = {}
-        except json.JSONDecodeError as e:
-            logging.warning(f"Block registry JSON is corrupted: {e}. Starting fresh.")
+            self.block_registry = self._storage_backend.load()
+            logging.info(f"Loaded block registry with {len(self.block_registry)} IPs")
+        except StorageError as e:
+            logging.warning(f"Storage backend error: {e}. Starting fresh.")
             self.block_registry = {}
         except Exception as e:
             logging.warning(f"Error loading block registry: {e}. Starting fresh.")
             self.block_registry = {}
 
     def _save_block_registry(self):
-        """Saves the block registry to JSON file."""
+        """Saves the block registry to the configured storage backend."""
         if self.dry_run:
-            logging.info("[DRY RUN] Would save block registry to file")
+            logging.info("[DRY RUN] Would save block registry")
             return
 
         try:
-            # Ensure directory exists
-            os.makedirs(os.path.dirname(self.registry_file), exist_ok=True)
-
-            # Write to temp file first, then atomic rename
-            temp_file = f"{self.registry_file}.tmp"
-            with open(temp_file, "w") as f:
-                json.dump(self.block_registry, f, indent=2, default=str)
-            os.rename(temp_file, self.registry_file)
+            self._storage_backend.save(self.block_registry)
             logging.info(f"Saved block registry with {len(self.block_registry)} IPs")
+        except StorageError as e:
+            logging.error(f"Storage backend error saving registry: {e}")
         except Exception as e:
             logging.error(f"Failed to save block registry: {e}")
 
@@ -423,8 +1736,16 @@ def _get_registry_entry(self, ip: str) -> Optional[Dict]:
         """Gets registry entry for an IP, returns None if not found."""
         return self.block_registry.get(ip)
 
-    def _update_registry_entry(self, ip: str, hit_count: int, now: datetime):
-        """Updates or creates a registry entry for an IP."""
+    def _update_registry_entry(self, ip: str, hit_count: int, now: datetime, ip_version: int = 4):
+        """
+        Updates or creates a registry entry for an IP.
+
+        Args:
+            ip: IP address to register
+            hit_count: Number of malicious hits
+            now: Current UTC datetime
+            ip_version: IP version (4 or 6)
+        """
         tier_name, duration, priority = self._determine_tier(hit_count)
         block_until = now + duration
 
@@ -434,6 +1755,8 @@ def _update_registry_entry(self, ip: str, hit_count: int, now: datetime):
             old_tier = existing.get("tier", "unknown")
             old_priority = existing.get("priority", 0)
             old_block_until = existing.get("block_until")
+            # Preserve IP version from existing entry if not explicitly set
+            existing_version = existing.get("ip_version", ip_version)
 
             # Keep the earlier first_seen timestamp
             first_seen = existing.get("first_seen", now.isoformat())
@@ -441,7 +1764,7 @@ def _update_registry_entry(self, ip: str, hit_count: int, now: datetime):
             # Only extend block time if tier upgraded (priority increased)
             if priority > old_priority:
                 logging.info(
-                    f"Upgrading {ip} from {old_tier} to {tier_name} tier - extending block duration"
+                    f"Upgrading {ip} (v{ip_version}) from {old_tier} to {tier_name} tier - extending block duration"
                 )
                 # Tier upgraded - reset block time with new duration
                 final_block_until = block_until.isoformat()
@@ -461,9 +1784,11 @@ def _update_registry_entry(self, ip: str, hit_count: int, now: datetime):
                 "priority": priority,
                 "block_until": final_block_until,
                 "block_duration_hours": duration.total_seconds() / 3600,
+                "ip_version": existing_version,
             }
         else:
             # Create new entry
+            logging.info(f"New block for {ip} (IPv{ip_version}): tier={tier_name}, hits={hit_count}")
             self.block_registry[ip] = {
                 "first_seen": now.isoformat(),
                 "last_seen": now.isoformat(),
@@ -472,6 +1797,7 @@ def _update_registry_entry(self, ip: str, hit_count: int, now: datetime):
                 "priority": priority,
                 "block_until": block_until.isoformat(),
                 "block_duration_hours": duration.total_seconds() / 3600,
+                "ip_version": ip_version,
             }
 
     def _remove_registry_entry(self, ip: str):
@@ -479,6 +1805,505 @@ def _remove_registry_entry(self, ip: str):
         if ip in self.block_registry:
             del self.block_registry[ip]
 
+    def _load_processed_files_cache(self):
+        """
+        Load the processed files cache from storage backend.
+        Uses a special key prefix to store alongside block registry.
+        """
+        try:
+            if self._storage_backend_type == "local":
+                # Store in a separate file for local backend
+                cache_file = self.registry_file.replace(".json", "_processed.json")
+                if os.path.exists(cache_file):
+                    with open(cache_file, "r") as f:
+                        self._processed_files = json.load(f)
+                        logging.debug(f"Loaded {len(self._processed_files)} processed file records")
+            else:
+                # For cloud backends, retrieve from storage
+                cached = self._storage_backend.get(self._processed_files_cache_key)
+                if cached and isinstance(cached.get("files"), dict):
+                    self._processed_files = cached["files"]
+                    logging.debug(f"Loaded {len(self._processed_files)} processed file records")
+        except Exception as e:
+            logging.warning(f"Failed to load processed files cache: {e}")
+            self._processed_files = {}
+
+    def _save_processed_files_cache(self):
+        """Save the processed files cache to storage backend."""
+        if self.dry_run:
+            logging.debug("[DRY RUN] Would save processed files cache")
+            return
+
+        try:
+            if self._storage_backend_type == "local":
+                cache_file = self.registry_file.replace(".json", "_processed.json")
+                with open(cache_file, "w") as f:
+                    json.dump(self._processed_files, f, indent=2)
+            else:
+                self._storage_backend.put(
+                    self._processed_files_cache_key,
+                    {
+                        "files": self._processed_files,
+                        "updated_at": datetime.now(timezone.utc).isoformat(),
+                    },
+                )
+            logging.debug(f"Saved {len(self._processed_files)} processed file records")
+        except Exception as e:
+            logging.warning(f"Failed to save processed files cache: {e}")
+
+    def _cleanup_old_processed_files(self, lookback_hours: float):
+        """
+        Remove processed file records older than 2x lookback period.
+
+        Args:
+            lookback_hours: Current lookback period in hours
+        """
+        if not self._processed_files:
+            return
+
+        now = datetime.now(timezone.utc)
+        cutoff_hours = lookback_hours * 2  # Keep records for 2x lookback
+
+        keys_to_remove = []
+        for key, data in self._processed_files.items():
+            try:
+                # Parse the processed_at timestamp if it exists
+                if isinstance(data, dict):
+                    processed_at_str = data.get("processed_at")
+                    if processed_at_str:
+                        processed_at = datetime.fromisoformat(processed_at_str)
+                        if processed_at.tzinfo is None:
+                            processed_at = processed_at.replace(tzinfo=timezone.utc)
+                        age_hours = (now - processed_at).total_seconds() / 3600
+                        if age_hours > cutoff_hours:
+                            keys_to_remove.append(key)
+            except Exception:
+                pass
+
+        for key in keys_to_remove:
+            del self._processed_files[key]
+
+        if keys_to_remove:
+            logging.info(f"Cleaned up {len(keys_to_remove)} old processed file records")
+
+    def _is_file_already_processed(self, bucket: str, key: str, etag: str) -> bool:
+        """
+        Check if a file has already been processed (based on ETag).
+
+        Args:
+            bucket: S3 bucket name
+            key: S3 object key
+            etag: S3 object ETag
+
+        Returns:
+            True if file was already processed with same ETag
+        """
+        if self._force_reprocess:
+            return False
+
+        cache_key = f"{bucket}:{key}"
+        cached = self._processed_files.get(cache_key)
+
+        if cached:
+            if isinstance(cached, dict):
+                return cached.get("etag") == etag
+            else:
+                # Backward compatibility: cached value is just the etag
+                return cached == etag
+
+        return False
+
+    def _mark_file_processed(self, bucket: str, key: str, etag: str):
+        """
+        Mark a file as processed.
+
+        Args:
+            bucket: S3 bucket name
+            key: S3 object key
+            etag: S3 object ETag
+        """
+        cache_key = f"{bucket}:{key}"
+        self._processed_files[cache_key] = {
+            "etag": etag,
+            "processed_at": datetime.now(timezone.utc).isoformat(),
+        }
+
+    # -------------------------------------------------------------------------
+    # AWS WAF IP Set Integration Methods
+    # -------------------------------------------------------------------------
+
+    def _init_waf_ip_set(self):
+        """
+        Initialize AWS WAF IP Set - find existing or create new if configured.
+        """
+        if not self._waf_enabled:
+            return
+
+        try:
+            # If IP Set ID is provided, verify it exists
+            if self._waf_ip_set_id:
+                ip_set = self._get_waf_ip_set_by_id(self._waf_ip_set_id)
+                if ip_set:
+                    self._waf_ip_set_name = ip_set.get("Name", self._waf_ip_set_name)
+                    logging.info(f"Using existing WAF IP Set: {self._waf_ip_set_name} ({self._waf_ip_set_id})")
+                    return
+                else:
+                    logging.error(f"WAF IP Set ID {self._waf_ip_set_id} not found")
+                    self._waf_enabled = False
+                    return
+
+            # Search by name
+            if self._waf_ip_set_name:
+                ip_set_id = self._find_waf_ip_set_by_name(self._waf_ip_set_name)
+                if ip_set_id:
+                    self._waf_ip_set_id = ip_set_id
+                    logging.info(f"Found existing WAF IP Set: {self._waf_ip_set_name} ({ip_set_id})")
+                    return
+
+                # Create new IP set if requested
+                if self._create_waf_ip_set:
+                    self._create_waf_ip_set_resource()
+                else:
+                    logging.warning(
+                        f"WAF IP Set '{self._waf_ip_set_name}' not found. "
+                        "Use --create-waf-ip-set to create it."
+                    )
+                    self._waf_enabled = False
+
+        except ClientError as e:
+            logging.error(f"Error initializing WAF IP Set: {e}")
+            self._waf_enabled = False
+
+    def _get_waf_ip_set_by_id(self, ip_set_id: str) -> Optional[Dict]:
+        """
+        Get WAF IP Set details by ID.
+
+        Args:
+            ip_set_id: The WAF IP Set ID
+
+        Returns:
+            IP Set details dict or None if not found
+        """
+        try:
+            response = self.wafv2.get_ip_set(
+                Name=self._waf_ip_set_name or "unknown",
+                Scope=self._waf_ip_set_scope,
+                Id=ip_set_id,
+            )
+            self._waf_ip_set_lock_token = response.get("LockToken")
+            return response.get("IPSet")
+        except ClientError as e:
+            if e.response["Error"]["Code"] == "WAFNonexistentItemException":
+                return None
+            raise
+
+    def _find_waf_ip_set_by_name(self, name: str) -> Optional[str]:
+        """
+        Find WAF IP Set by name.
+
+        Args:
+            name: The IP Set name to search for
+
+        Returns:
+            IP Set ID if found, None otherwise
+        """
+        try:
+            paginator = self.wafv2.get_paginator("list_ip_sets")
+            for page in paginator.paginate(Scope=self._waf_ip_set_scope):
+                for ip_set in page.get("IPSets", []):
+                    if ip_set.get("Name") == name:
+                        # Get the full IP set to retrieve lock token
+                        full_ip_set = self.wafv2.get_ip_set(
+                            Name=name,
+                            Scope=self._waf_ip_set_scope,
+                            Id=ip_set["Id"],
+                        )
+                        self._waf_ip_set_lock_token = full_ip_set.get("LockToken")
+                        return ip_set["Id"]
+            return None
+        except ClientError as e:
+            logging.error(f"Error listing WAF IP Sets: {e}")
+            return None
+
+    def _create_waf_ip_set_resource(self):
+        """
+        Create a new WAF IP Set.
+        """
+        if self.dry_run:
+            logging.info(f"[DRY-RUN] Would create WAF IP Set: {self._waf_ip_set_name}")
+            self._waf_enabled = False
+            return
+
+        try:
+            response = self.wafv2.create_ip_set(
+                Name=self._waf_ip_set_name,
+                Scope=self._waf_ip_set_scope,
+                Description=f"Auto-blocked attackers managed by aws-auto-block-attackers (v{__version__})",
+                IPAddressVersion="IPV4",  # We'll handle IPv6 separately if needed
+                Addresses=[],
+                Tags=[
+                    {"Key": "ManagedBy", "Value": "aws-auto-block-attackers"},
+                    {"Key": "Version", "Value": __version__},
+                ],
+            )
+            self._waf_ip_set_id = response["Summary"]["Id"]
+            self._waf_ip_set_lock_token = response["Summary"]["LockToken"]
+            logging.info(f"Created WAF IP Set: {self._waf_ip_set_name} ({self._waf_ip_set_id})")
+
+            # Create IPv6 IP set if enabled
+            if self.enable_ipv6:
+                self._create_waf_ipv6_ip_set()
+
+        except ClientError as e:
+            logging.error(f"Failed to create WAF IP Set: {e}")
+            self._waf_enabled = False
+
+    def _create_waf_ipv6_ip_set(self):
+        """
+        Create a companion IPv6 WAF IP Set.
+        """
+        ipv6_name = f"{self._waf_ip_set_name}-ipv6"
+        try:
+            response = self.wafv2.create_ip_set(
+                Name=ipv6_name,
+                Scope=self._waf_ip_set_scope,
+                Description=f"Auto-blocked IPv6 attackers managed by aws-auto-block-attackers (v{__version__})",
+                IPAddressVersion="IPV6",
+                Addresses=[],
+                Tags=[
+                    {"Key": "ManagedBy", "Value": "aws-auto-block-attackers"},
+                    {"Key": "Version", "Value": __version__},
+                ],
+            )
+            self._waf_ipv6_ip_set_id = response["Summary"]["Id"]
+            self._waf_ipv6_ip_set_lock_token = response["Summary"]["LockToken"]
+            logging.info(f"Created WAF IPv6 IP Set: {ipv6_name} ({self._waf_ipv6_ip_set_id})")
+        except ClientError as e:
+            logging.warning(f"Failed to create WAF IPv6 IP Set: {e}")
+
+    def _get_waf_current_addresses(self) -> Set[str]:
+        """
+        Get current addresses in the WAF IP Set.
+
+        Returns:
+            Set of CIDR addresses currently in the IP set
+        """
+        if not self._waf_enabled or not self._waf_ip_set_id:
+            return set()
+
+        try:
+            response = self.wafv2.get_ip_set(
+                Name=self._waf_ip_set_name,
+                Scope=self._waf_ip_set_scope,
+                Id=self._waf_ip_set_id,
+            )
+            self._waf_ip_set_lock_token = response.get("LockToken")
+            return set(response.get("IPSet", {}).get("Addresses", []))
+        except ClientError as e:
+            logging.error(f"Error getting WAF IP Set addresses: {e}")
+            return set()
+
+    def _sync_waf_ip_set(self, blocked_ips: Set[str]):
+        """
+        Synchronize blocked IPs with WAF IP Set.
+
+        Args:
+            blocked_ips: Set of IPs to block (will be converted to /32 CIDR)
+        """
+        if not self._waf_enabled or not self._waf_ip_set_id:
+            return
+
+        now = datetime.now(timezone.utc)
+
+        # Get active blocks from registry (not expired)
+        active_blocked_ips = set()
+        for ip in blocked_ips:
+            if ip in self.block_registry:
+                data = self.block_registry[ip]
+                block_until_str = data.get("block_until")
+                if block_until_str:
+                    try:
+                        block_until = datetime.fromisoformat(block_until_str)
+                        if block_until.tzinfo is None:
+                            block_until = block_until.replace(tzinfo=timezone.utc)
+                        if now < block_until:
+                            active_blocked_ips.add(ip)
+                    except Exception:
+                        pass
+            else:
+                # New block, include it
+                active_blocked_ips.add(ip)
+
+        # Separate IPv4 and IPv6
+        ipv4_ips = set()
+        ipv6_ips = set()
+
+        for ip in active_blocked_ips:
+            try:
+                ip_obj = ipaddress.ip_address(ip)
+                if ip_obj.version == 4:
+                    ipv4_ips.add(f"{ip}/32")
+                else:
+                    ipv6_ips.add(f"{ip}/128")
+            except ValueError:
+                logging.warning(f"Invalid IP address for WAF sync: {ip}")
+
+        # Sync IPv4 IP Set
+        self._update_waf_ip_set_addresses(ipv4_ips, is_ipv6=False)
+
+        # Sync IPv6 IP Set if we have IPv6 addresses and IPv6 is enabled
+        if ipv6_ips and self.enable_ipv6 and hasattr(self, "_waf_ipv6_ip_set_id"):
+            self._update_waf_ip_set_addresses(ipv6_ips, is_ipv6=True)
+
+    def _update_waf_ip_set_addresses(self, target_addresses: Set[str], is_ipv6: bool = False):
+        """
+        Update WAF IP Set with target addresses (add missing, remove stale).
+
+        Args:
+            target_addresses: Set of CIDR addresses that should be in the IP set
+            is_ipv6: Whether this is for the IPv6 IP set
+        """
+        if is_ipv6:
+            if not hasattr(self, "_waf_ipv6_ip_set_id") or not self._waf_ipv6_ip_set_id:
+                return
+            ip_set_id = self._waf_ipv6_ip_set_id
+            ip_set_name = f"{self._waf_ip_set_name}-ipv6"
+            lock_token_attr = "_waf_ipv6_ip_set_lock_token"
+        else:
+            ip_set_id = self._waf_ip_set_id
+            ip_set_name = self._waf_ip_set_name
+            lock_token_attr = "_waf_ip_set_lock_token"
+
+        try:
+            # Get current addresses
+            response = self.wafv2.get_ip_set(
+                Name=ip_set_name,
+                Scope=self._waf_ip_set_scope,
+                Id=ip_set_id,
+            )
+            current_addresses = set(response.get("IPSet", {}).get("Addresses", []))
+            lock_token = response.get("LockToken")
+            setattr(self, lock_token_attr, lock_token)
+
+            # Calculate changes
+            to_add = target_addresses - current_addresses
+            to_remove = current_addresses - target_addresses
+
+            if not to_add and not to_remove:
+                logging.debug(f"WAF IP Set {ip_set_name} already in sync")
+                return
+
+            # Merge current with changes
+            new_addresses = (current_addresses | to_add) - to_remove
+
+            # Check WAF limits
+            if len(new_addresses) > self._waf_max_addresses:
+                logging.warning(
+                    f"WAF IP Set would exceed {self._waf_max_addresses} addresses. "
+                    f"Truncating to limit."
+                )
+                # Prioritize keeping newer/higher-priority blocks
+                # For simplicity, just truncate (in production, implement smarter logic)
+                new_addresses = set(list(new_addresses)[: self._waf_max_addresses])
+
+            ip_version = "IPv6" if is_ipv6 else "IPv4"
+            if self.dry_run:
+                logging.info(
+                    f"[DRY-RUN] Would update WAF {ip_version} IP Set: "
+                    f"+{len(to_add)} -{len(to_remove)} addresses"
+                )
+                return
+
+            # Update IP set
+            self.wafv2.update_ip_set(
+                Name=ip_set_name,
+                Scope=self._waf_ip_set_scope,
+                Id=ip_set_id,
+                Addresses=list(new_addresses),
+                LockToken=lock_token,
+            )
+
+            logging.info(
+                f"Updated WAF {ip_version} IP Set: +{len(to_add)} -{len(to_remove)} addresses "
+                f"(total: {len(new_addresses)})"
+            )
+
+            # Send Slack notification for significant changes
+            if self.slack_client and (len(to_add) >= 5 or len(to_remove) >= 5):
+                self._send_slack_message(
+                    f"WAF {ip_version} IP Set updated: +{len(to_add)} -{len(to_remove)} addresses "
+                    f"(total: {len(new_addresses)})",
+                    is_error=False,
+                )
+
+        except ClientError as e:
+            error_code = e.response["Error"]["Code"]
+            if error_code == "WAFOptimisticLockException":
+                logging.warning("WAF IP Set was modified concurrently, retrying...")
+                # Retry once
+                self._update_waf_ip_set_addresses(target_addresses, is_ipv6)
+            else:
+                logging.error(f"Failed to update WAF IP Set: {e}")
+
+    def _cleanup_expired_waf_entries(self, expired_ips: Set[str]):
+        """
+        Remove expired IPs from WAF IP Set.
+
+        Args:
+            expired_ips: Set of IPs whose blocks have expired
+        """
+        if not self._waf_enabled or not expired_ips:
+            return
+
+        # Get current active blocks from registry
+        now = datetime.now(timezone.utc)
+        active_ips = set()
+
+        for ip, data in self.block_registry.items():
+            if ip in expired_ips:
+                continue
+            block_until_str = data.get("block_until")
+            if block_until_str:
+                try:
+                    block_until = datetime.fromisoformat(block_until_str)
+                    if block_until.tzinfo is None:
+                        block_until = block_until.replace(tzinfo=timezone.utc)
+                    if now < block_until:
+                        active_ips.add(ip)
+                except Exception:
+                    pass
+
+        # Sync with remaining active IPs
+        self._sync_waf_ip_set(active_ips)
+
+    def _get_waf_statistics(self) -> Dict:
+        """
+        Get statistics about WAF IP Set usage.
+
+        Returns:
+            Dict with WAF statistics
+        """
+        if not self._waf_enabled:
+            return {"enabled": False}
+
+        stats = {
+            "enabled": True,
+            "scope": self._waf_ip_set_scope,
+            "ip_set_id": self._waf_ip_set_id,
+            "ip_set_name": self._waf_ip_set_name,
+        }
+
+        try:
+            current = self._get_waf_current_addresses()
+            stats["ipv4_count"] = len([a for a in current if "." in a])
+            stats["capacity_used"] = len(current)
+            stats["capacity_max"] = self._waf_max_addresses
+            stats["capacity_percent"] = round(len(current) / self._waf_max_addresses * 100, 1)
+        except Exception as e:
+            stats["error"] = str(e)
+
+        return stats
+
     def _get_expired_blocks(self, now: datetime) -> Set[str]:
         """Returns set of IPs whose blocks have expired."""
         expired = set()
@@ -498,6 +2323,11 @@ def _get_expired_blocks(self, now: datetime) -> Set[str]:
 
     def _cleanup_old_registry_entries(self, now: datetime, days_old: int = 30):
         """Remove very old expired entries from registry to prevent unbounded growth."""
+        # For DynamoDB backend, TTL handles cleanup automatically
+        if self._storage_backend_type == "dynamodb":
+            logging.debug("DynamoDB TTL handles automatic cleanup - skipping manual cleanup")
+            return
+
         cutoff_time = now - timedelta(days=days_old)
         old_entries = []
 
@@ -520,6 +2350,12 @@ def _cleanup_old_registry_entries(self, now: datetime, days_old: int = 30):
             )
             for ip in old_entries:
                 del self.block_registry[ip]
+                # Also delete from storage backend if using S3 (to keep in sync)
+                if self._storage_backend_type == "s3":
+                    try:
+                        self._storage_backend.delete(ip)
+                    except Exception:
+                        pass  # Will be cleaned up on next full save
 
     def _get_active_blocks(self, now: datetime) -> Dict[str, Dict]:
         """Returns dict of IPs that should still be blocked (not expired)."""
@@ -540,12 +2376,25 @@ def _get_active_blocks(self, now: datetime) -> Dict[str, Dict]:
 
     def run(self):
         """Executes the entire blocking process."""
+        import time
+
+        run_start_time = time.time()
+
         logging.info(
             "--- Starting Automated Attacker Blocking Script (Tiered Persistence Mode) ---"
         )
         if self.dry_run:
             logging.warning("*** RUNNING IN DRY RUN MODE. NO CHANGES WILL BE MADE. ***")
 
+        # Reset error counters for this run
+        self._s3_processing_errors = 0
+        self._ipinfo_failures = 0
+        self._ipinfo_circuit_open = False
+        self._failed_slack_messages.clear()
+
+        # Track metrics dimensions
+        metrics_dimensions = {"Region": self.region}
+
         now = datetime.now(timezone.utc)
 
         logging.info("Step 1/7: Discovering target load balancers...")
@@ -593,46 +2442,126 @@ def run(self):
             # Now remove from registry
             for ip in expired_ips:
                 self._remove_registry_entry(ip)
+
+            # Cleanup WAF IP Set as well
+            if self._waf_enabled:
+                self._cleanup_expired_waf_entries(expired_ips)
+
+            # Emit metric for expired blocks
+            self._metrics.put_count("BlocksExpired", len(expired_ips), metrics_dimensions)
         else:
             logging.info("No expired blocks found.")
+            self._metrics.put_count("BlocksExpired", 0, metrics_dimensions)
 
         # Periodic cleanup of very old entries (prevents unbounded growth)
         self._cleanup_old_registry_entries(now, days_old=30)
 
         logging.info("Step 5/7: Scanning S3 for ALB log files...")
         start_scan_time = now - self.lookback_delta
+
+        # Cleanup old processed file records (2x lookback period)
+        lookback_hours = self.lookback_delta.total_seconds() / 3600
+        self._cleanup_old_processed_files(lookback_hours)
+
         all_log_keys = []
+        files_with_etags: Dict[str, str] = {}  # key -> etag mapping for marking processed
+
         for bucket, prefix in unique_log_locations:
-            keys = self._find_log_files_in_window(bucket, prefix, start_scan_time)
-            all_log_keys.extend([(bucket, key) for key in keys])
+            file_tuples = self._find_log_files_in_window(bucket, prefix, start_scan_time)
+            for key, etag in file_tuples:
+                all_log_keys.append((bucket, key))
+                files_with_etags[f"{bucket}:{key}"] = etag
 
         logging.info(f"Step 6/7: Processing {len(all_log_keys)} log file(s)...")
 
+        # Emit metric for files processed
+        self._metrics.put_count("LogFilesProcessed", len(all_log_keys), metrics_dimensions)
+
         # Process logs and get new offenders
         new_offenders = set()
-        ip_counts = Counter()
+        ip_counts: Counter = Counter()
+        ip_versions: Dict[str, int] = {}  # Track IP version for each IP
 
         if all_log_keys:
-            all_malicious_ips = self._process_logs_in_parallel(all_log_keys)
-            if all_malicious_ips:
-                ip_counts = Counter(all_malicious_ips)
-                new_offenders = {
-                    ip
-                    for ip, count in ip_counts.items()
-                    if count >= self.threshold
-                    and ip not in self.whitelist
-                    and not is_aws_ip(ip, self.aws_networks)
-                }
+            all_malicious_ips_with_version = self._process_logs_in_parallel(all_log_keys)
+            if all_malicious_ips_with_version:
+                # Count IPs and track versions
+                for ip, version in all_malicious_ips_with_version:
+                    ip_counts[ip] += 1
+                    ip_versions[ip] = version  # Store the version
+
+                # Identify new offenders (both IPv4 and IPv6)
+                new_offenders = set()
+                for ip, count in ip_counts.items():
+                    if count < self.threshold:
+                        continue
+                    if ip in self.whitelist:
+                        continue
+
+                    # Check AWS IP with appropriate network list
+                    version = ip_versions.get(ip, 4)
+                    if version == 4:
+                        if is_aws_ip(ip, self.aws_ipv4_networks, None):
+                            continue
+                    elif version == 6:
+                        if is_aws_ip(ip, set(), self.aws_ipv6_networks):
+                            continue
+
+                    new_offenders.add(ip)
+
+                # Multi-signal threat filtering (when enabled)
+                if self._enable_multi_signal and new_offenders:
+                    logging.info("Applying multi-signal threat detection...")
+                    multi_signal_offenders = self._filter_by_multi_signal(
+                        new_offenders, all_log_keys, metrics_dimensions
+                    )
+                    filtered_count = len(new_offenders) - len(multi_signal_offenders)
+                    if filtered_count > 0:
+                        logging.info(
+                            f"Multi-signal filtering: {filtered_count} potential false positive(s) removed"
+                        )
+                        self._metrics.put_count("FalsePositivesFiltered", filtered_count, metrics_dimensions)
+                    new_offenders = multi_signal_offenders
+
+                # Emit metric for total malicious hits detected
+                self._metrics.put_count(
+                    "MaliciousHitsDetected",
+                    len(all_malicious_ips_with_version),
+                    metrics_dimensions,
+                )
 
                 if new_offenders:
+                    ipv4_count = sum(1 for ip in new_offenders if ip_versions.get(ip, 4) == 4)
+                    ipv6_count = sum(1 for ip in new_offenders if ip_versions.get(ip, 4) == 6)
                     logging.warning(
-                        f"Identified {len(new_offenders)} new offender(s) from recent logs."
+                        f"Identified {len(new_offenders)} new offender(s) from recent logs "
+                        f"(IPv4: {ipv4_count}, IPv6: {ipv6_count})"
                     )
-                    # Update registry with new offenders
+
+                    # Emit metrics for new offenders
+                    self._metrics.put_count("NewOffendersIPv4", ipv4_count, metrics_dimensions)
+                    self._metrics.put_count("NewOffendersIPv6", ipv6_count, metrics_dimensions)
+                    self._metrics.put_count("NewOffendersTotal", len(new_offenders), metrics_dimensions)
+
+                    # Update registry with new offenders (including IP version)
                     for ip in new_offenders:
-                        self._update_registry_entry(ip, ip_counts[ip], now)
+                        version = ip_versions.get(ip, 4)
+                        self._update_registry_entry(ip, ip_counts[ip], now, version)
+                else:
+                    self._metrics.put_count("NewOffendersTotal", 0, metrics_dimensions)
+
+                # Mark processed files (even if no malicious activity found)
+                for cache_key, etag in files_with_etags.items():
+                    parts = cache_key.split(":", 1)
+                    if len(parts) == 2:
+                        self._mark_file_processed(parts[0], parts[1], etag)
             else:
                 logging.info("No malicious activity found in recent log files.")
+                # Still mark files as processed
+                for cache_key, etag in files_with_etags.items():
+                    parts = cache_key.split(":", 1)
+                    if len(parts) == 2:
+                        self._mark_file_processed(parts[0], parts[1], etag)
         else:
             logging.info("No relevant log files found in lookback window.")
 
@@ -643,27 +2572,65 @@ def run(self):
         logging.info(f"Total active blocks in registry: {len(ips_to_block)}")
 
         logging.info("Step 7/7: Updating NACL rules with time-based blocks...")
-        self._update_nacl_rules_with_registry(nacl_id, ips_to_block, active_blocks)
+        ips_to_add, ips_to_remove = self._update_nacl_rules_with_registry(nacl_id, ips_to_block, active_blocks)
+
+        # Sync blocked IPs to WAF IP Set (if enabled)
+        if self._waf_enabled:
+            logging.info("Syncing blocked IPs to WAF IP Set...")
+            self._sync_waf_ip_set(ips_to_block)
 
-        # Save registry
+        # Save registry and processed files cache
         self._save_block_registry()
+        self._save_processed_files_cache()
 
         final_deny_rules, _ = self._get_nacl_rules(nacl_id)
         final_blocked_ips = {cidr.split("/")[0] for cidr in final_deny_rules.values()}
         self._generate_report(
-            ip_counts, new_offenders, final_blocked_ips, active_blocks
+            ip_counts, new_offenders, final_blocked_ips, active_blocks,
+            ips_to_add=ips_to_add, ips_to_remove=ips_to_remove
         )
 
         # Send summary notification to Slack (only if there were changes)
-        self._send_summary_notification_with_registry(
-            new_offenders,
-            final_blocked_ips,
-            ip_counts,
-            initially_blocked_ips,
-            active_blocks,
-        )
+        if self._enhanced_slack:
+            self._send_enhanced_slack_notification(
+                new_offenders,
+                final_blocked_ips,
+                ip_counts,
+                initially_blocked_ips,
+                active_blocks,
+            )
+        else:
+            self._send_summary_notification_with_registry(
+                new_offenders,
+                final_blocked_ips,
+                ip_counts,
+                initially_blocked_ips,
+                active_blocks,
+            )
 
-        logging.info("--- Script Finished ---")
+        # Retry any failed Slack notifications
+        self._retry_failed_slack_messages()
+
+        # Emit metrics for active blocks
+        self._metrics.put_count("ActiveBlocksTotal", len(ips_to_block), metrics_dimensions)
+        self._metrics.put_count("NACLBlockedIPs", len(final_blocked_ips), metrics_dimensions)
+
+        # Log execution summary with error counts
+        if self._s3_processing_errors > 0:
+            logging.warning(f"S3 processing errors during this run: {self._s3_processing_errors} file(s) skipped")
+            self._metrics.put_count("S3ProcessingErrors", self._s3_processing_errors, metrics_dimensions)
+        if self._ipinfo_circuit_open:
+            logging.warning("IPInfo was disabled during this run due to repeated failures")
+            self._metrics.put_count("IPInfoCircuitBreakerTripped", 1, metrics_dimensions)
+
+        # Emit run timing metric
+        run_duration = time.time() - run_start_time
+        self._metrics.put_timing("RunDuration", run_duration, metrics_dimensions)
+
+        # Flush all buffered metrics
+        self._metrics.flush()
+
+        logging.info(f"--- Script Finished (duration: {run_duration:.2f}s) ---")
 
     def _discover_target_lbs(self) -> Optional[Dict[str, Dict]]:
         """Finds all LBs matching the pattern and their details."""
@@ -764,7 +2731,18 @@ def _find_nacl_for_subnets(self, target_lbs: Dict[str, Dict]) -> Optional[str]:
 
     def _find_log_files_in_window(
         self, bucket: str, prefix: str, start_time: datetime
-    ) -> List[str]:
+    ) -> List[Tuple[str, str]]:
+        """
+        Find log files within the lookback window.
+
+        Args:
+            bucket: S3 bucket name
+            prefix: S3 prefix for logs
+            start_time: Start of lookback window
+
+        Returns:
+            List of tuples (key, etag) for each log file found.
+        """
         try:
             paginator = self.s3.get_paginator("list_objects_v2")
             account_id = self.sts.get_caller_identity().get("Account")
@@ -778,91 +2756,944 @@ def _find_log_files_in_window(
             current_date = start_time.date()
             end_date = datetime.now(timezone.utc).date()
 
-            while current_date <= end_date:
-                date_prefix = f"{base_prefix}{current_date.year:04d}/{current_date.month:02d}/{current_date.day:02d}/"
-                date_prefixes.append(date_prefix)
-                current_date += timedelta(days=1)
+            while current_date <= end_date:
+                date_prefix = f"{base_prefix}{current_date.year:04d}/{current_date.month:02d}/{current_date.day:02d}/"
+                date_prefixes.append(date_prefix)
+                current_date += timedelta(days=1)
+
+            logging.info(
+                f"Searching for logs in s3://{bucket}/{base_prefix} "
+                f"across {len(date_prefixes)} date(s) from {start_time.date()} to {end_date}"
+            )
+
+            all_files = []
+            new_files = []
+            skipped_files = 0
+
+            # Scan each date prefix separately (much faster than scanning all dates)
+            for date_prefix in date_prefixes:
+                pages = paginator.paginate(
+                    Bucket=bucket,
+                    Prefix=date_prefix,
+                    PaginationConfig={"MaxItems": 10000},  # Per-date limit
+                )
+
+                for page in pages:
+                    if "Contents" in page:
+                        for obj in page["Contents"]:
+                            if (
+                                not obj["Key"].endswith("/")
+                                and obj["LastModified"] >= start_time
+                            ):
+                                key = obj["Key"]
+                                etag = obj.get("ETag", "").strip('"')
+
+                                all_files.append((key, etag))
+
+                                # Check if already processed (incremental processing)
+                                if self._is_file_already_processed(bucket, key, etag):
+                                    skipped_files += 1
+                                else:
+                                    new_files.append((key, etag))
+
+            # Update counters for metrics
+            self._new_files_count = len(new_files)
+            self._skipped_files_count = skipped_files
+
+            if skipped_files > 0:
+                logging.info(
+                    f"S3 scan complete: found {len(all_files)} file(s), "
+                    f"skipping {skipped_files} already-processed, "
+                    f"processing {len(new_files)} new file(s)"
+                )
+            else:
+                logging.info(
+                    f"S3 scan complete: found {len(new_files)} file(s) to process "
+                    f"across {len(date_prefixes)} date(s)."
+                )
+
+            return new_files
+        except Exception as e:
+            logging.error(f"Error listing S3 objects for prefix {prefix}: {e}")
+            return []
+
+    def _process_logs_in_parallel(
+        self, bucket_key_pairs: List[Tuple[str, str]]
+    ) -> List[Tuple[str, int]]:
+        """
+        Uses a thread pool to download and parse logs concurrently.
+
+        Returns:
+            List of tuples (ip_address, ip_version) for all malicious IPs found.
+        """
+        all_malicious_ips: List[Tuple[str, int]] = []
+        total_files = len(bucket_key_pairs)
+        completed_files = 0
+
+        with ThreadPoolExecutor(max_workers=10) as executor:
+            future_to_key = {
+                executor.submit(self._download_and_parse_log, bucket, key): (
+                    bucket,
+                    key,
+                )
+                for bucket, key in bucket_key_pairs
+            }
+            for future in as_completed(future_to_key):
+                completed_files += 1
+                try:
+                    ips_from_file = future.result()
+                    all_malicious_ips.extend(ips_from_file)
+
+                    # Progress update every 10 files or at completion
+                    if completed_files % 10 == 0 or completed_files == total_files:
+                        logging.info(
+                            f"Log processing progress: {completed_files}/{total_files} files "
+                            f"({completed_files * 100 // total_files}%) - found {len(all_malicious_ips)} malicious requests so far"
+                        )
+                except Exception as e:
+                    logging.error(f"Error processing a log file in thread: {e}")
+        return all_malicious_ips
+
+    def _download_and_parse_log(self, bucket: str, key: str) -> List[Tuple[str, int]]:
+        """
+        Download and parse a single ALB log file from S3.
+
+        Args:
+            bucket: S3 bucket name
+            key: S3 object key
+
+        Returns:
+            List of tuples (ip_address, ip_version) for malicious IPs found.
+            Returns empty list on error (logged but not raised).
+        """
+        filename = key.split("/")[-1]
+        logging.debug(f"Starting processing for file: {filename}")
+
+        try:
+            response = self.s3.get_object(Bucket=bucket, Key=key)
+        except ClientError as e:
+            error_code = e.response.get("Error", {}).get("Code", "")
+            if error_code in ("NoSuchKey", "AccessDenied"):
+                logging.warning(f"S3 access error for {filename}: {error_code} - skipping file")
+            else:
+                logging.error(f"S3 error fetching {filename}: {e} - skipping file")
+            self._s3_processing_errors += 1
+            return []
+        except Exception as e:
+            logging.error(f"Unexpected error fetching {filename} from S3: {e} - skipping file")
+            self._s3_processing_errors += 1
+            return []
+
+        try:
+            with gzip.open(response["Body"], "rt") as f:
+                malicious_ips = []
+                for line in f:
+                    if ATTACK_PATTERNS.search(line):
+                        parts = line.split()
+                        if len(parts) > 3:
+                            # Client IP:port is in field 4 (index 3)
+                            client_field = parts[3]
+
+                            # Handle IPv6 addresses which may be in brackets [::1]:port
+                            if client_field.startswith('['):
+                                # IPv6 format: [::1]:port
+                                bracket_end = client_field.find(']')
+                                if bracket_end > 0:
+                                    ip_str = client_field[1:bracket_end]
+                                else:
+                                    continue
+                            else:
+                                # IPv4 format: 1.2.3.4:port
+                                ip_str = client_field.split(":")[0]
+
+                            # Check if it's a valid public IP (v4 or v6)
+                            is_valid, ip_version = is_valid_public_ip(ip_str)
+                            if is_valid:
+                                # If IPv6 disabled, skip IPv6 addresses
+                                if ip_version == 6 and not self.enable_ipv6:
+                                    continue
+                                malicious_ips.append((ip_str, ip_version))
+                            elif is_valid_public_ipv4(ip_str):
+                                # Fallback for backward compatibility
+                                malicious_ips.append((ip_str, 4))
+
+            logging.debug(
+                f"Finished processing file: {filename}, found {len(malicious_ips)} malicious IPs."
+            )
+            return malicious_ips
+        except gzip.BadGzipFile as e:
+            logging.warning(f"Corrupted gzip file {filename}: {e} - skipping file")
+            self._s3_processing_errors += 1
+            return []
+        except Exception as e:
+            logging.error(f"Error parsing log file {filename}: {e} - skipping file")
+            self._s3_processing_errors += 1
+            return []
+
+    def _download_and_parse_log_multi_signal(
+        self, bucket: str, key: str
+    ) -> Dict[str, ThreatSignals]:
+        """
+        Download and parse a log file with multi-signal threat detection.
+
+        Extracts additional signals beyond attack patterns:
+        - HTTP status codes (4xx/5xx)
+        - User-agent analysis
+        - Request paths for diversity scoring
+
+        Args:
+            bucket: S3 bucket name
+            key: S3 object key
+
+        Returns:
+            Dict mapping IP addresses to their ThreatSignals objects.
+        """
+        filename = key.split("/")[-1]
+        logging.debug(f"Multi-signal processing for file: {filename}")
+
+        ip_signals: Dict[str, ThreatSignals] = {}
+
+        try:
+            response = self.s3.get_object(Bucket=bucket, Key=key)
+        except ClientError as e:
+            error_code = e.response.get("Error", {}).get("Code", "")
+            if error_code in ("NoSuchKey", "AccessDenied"):
+                logging.warning(f"S3 access error for {filename}: {error_code} - skipping file")
+            else:
+                logging.error(f"S3 error fetching {filename}: {e} - skipping file")
+            self._s3_processing_errors += 1
+            return {}
+        except Exception as e:
+            logging.error(f"Unexpected error fetching {filename} from S3: {e} - skipping file")
+            self._s3_processing_errors += 1
+            return {}
+
+        try:
+            with gzip.open(response["Body"], "rt") as f:
+                for line in f:
+                    # Parse ALB log line
+                    # ALB log format fields:
+                    # 0: type, 1: timestamp, 2: elb, 3: client:port, 4: target:port,
+                    # 5: request_processing_time, 6: target_processing_time,
+                    # 7: response_processing_time, 8: elb_status_code,
+                    # 9: target_status_code, 10: received_bytes, 11: sent_bytes,
+                    # 12: "request", 13: "user_agent", ...
+
+                    parts = line.split()
+                    if len(parts) < 14:
+                        continue
+
+                    # Extract client IP
+                    client_field = parts[3]
+                    if client_field.startswith('['):
+                        bracket_end = client_field.find(']')
+                        if bracket_end > 0:
+                            ip_str = client_field[1:bracket_end]
+                        else:
+                            continue
+                    else:
+                        ip_str = client_field.split(":")[0]
+
+                    # Check if valid public IP
+                    is_valid, ip_version = is_valid_public_ip(ip_str)
+                    if not is_valid:
+                        continue
+
+                    # Skip IPv6 if disabled
+                    if ip_version == 6 and not self.enable_ipv6:
+                        continue
+
+                    # Parse status code (ELB status code at index 8)
+                    try:
+                        status_code = int(parts[8])
+                    except (ValueError, IndexError):
+                        status_code = 0
+
+                    # Parse request (at index 12, quoted)
+                    # Format: "GET /path HTTP/1.1"
+                    request_field = ""
+                    try:
+                        # Find quoted request field
+                        quote_start = line.find('"')
+                        if quote_start >= 0:
+                            quote_end = line.find('"', quote_start + 1)
+                            if quote_end > quote_start:
+                                request_field = line[quote_start + 1 : quote_end]
+                    except Exception:
+                        pass
+
+                    # Extract path from request
+                    path = "/"
+                    if request_field:
+                        request_parts = request_field.split()
+                        if len(request_parts) >= 2:
+                            path = request_parts[1].split("?")[0]  # Remove query string
+
+                    # Parse user agent (second quoted field after request)
+                    user_agent = ""
+                    try:
+                        first_quote_end = line.find('"', line.find('"') + 1)
+                        if first_quote_end >= 0:
+                            ua_start = line.find('"', first_quote_end + 1)
+                            if ua_start >= 0:
+                                ua_end = line.find('"', ua_start + 1)
+                                if ua_end > ua_start:
+                                    user_agent = line[ua_start + 1 : ua_end]
+                    except Exception:
+                        pass
+
+                    # Check for attack patterns
+                    has_attack_pattern = bool(ATTACK_PATTERNS.search(line))
+
+                    # Check for scanner user agent
+                    has_scanner_ua = bool(SCANNER_USER_AGENTS.search(user_agent)) if user_agent else False
+
+                    # Create or update threat signals for this IP
+                    if ip_str not in ip_signals:
+                        ip_signals[ip_str] = ThreatSignals()
+
+                    ip_signals[ip_str].add_request(
+                        has_attack_pattern=has_attack_pattern,
+                        has_scanner_ua=has_scanner_ua,
+                        status_code=status_code,
+                        path=path,
+                    )
+
+            logging.debug(f"Multi-signal processed {filename}: {len(ip_signals)} unique IPs")
+            return ip_signals
+
+        except gzip.BadGzipFile as e:
+            logging.warning(f"Corrupted gzip file {filename}: {e} - skipping file")
+            self._s3_processing_errors += 1
+            return {}
+        except Exception as e:
+            logging.error(f"Error parsing log file {filename}: {e} - skipping file")
+            self._s3_processing_errors += 1
+            return {}
+
+    def _log_threat_score_details(
+        self,
+        ip: str,
+        score: float,
+        details: Dict[str, Any],
+        blocked: bool
+    ):
+        """
+        Log threat score details at appropriate verbosity level.
+
+        Logging Strategy:
+        - BLOCKED: Always INFO + full details
+        - High-traffic skipped (>=100 hits OR >=2x threshold): INFO + full details + WARNING
+        - Borderline skipped (score within ±20 of threshold): INFO + full details
+        - Other skipped: DEBUG only (prevent log explosion)
+
+        Args:
+            ip: IP address being evaluated
+            score: Final threat score
+            details: Dict with breakdown details including:
+                - hit_count: Total requests from IP
+                - reasons: List of reason strings
+                - breakdown: Score component breakdown
+                - base_score: Score before service adjustment
+                - final_score: Score after service adjustment
+                - service_name: Verified legitimate service (if any)
+            blocked: Whether the IP will be blocked
+        """
+        # Get breakdown components safely
+        breakdown = details.get('breakdown', {})
+        reasons_str = ', '.join(details.get('reasons', [])) if details.get('reasons') else 'no_specific_signals'
+        hit_count = details.get('hit_count', 0)
+        service_name = details.get('service_name')
+
+        # Build status string with service name for skipped IPs
+        if blocked:
+            status = "BLOCKED"
+        elif service_name:
+            status = f"SKIPPED (score={score:.0f}, {service_name})"
+        else:
+            status = f"SKIPPED (score={score:.0f})"
+
+        # Determine logging level and detail requirements
+        min_score = self._threat_signals_config.get('min_threat_score', 40)
+        is_borderline = abs(score - min_score) <= 20
+        is_high_traffic = hit_count >= 100 or hit_count >= self.threshold * 2
+
+        # Determine if we should log details
+        should_log_details = blocked or is_high_traffic or is_borderline or self._debug
+
+        # Log at appropriate level
+        if blocked or is_high_traffic or is_borderline:
+            logging.info(
+                f"IP {ip}: score={score:.1f}, hits={hit_count}, "
+                f"status={status}, reasons=[{reasons_str}]"
+            )
+        else:
+            # Low-traffic, non-borderline skipped IPs - DEBUG only
+            logging.debug(
+                f"IP {ip}: score={score:.1f}, hits={hit_count}, "
+                f"status={status}, reasons=[{reasons_str}]"
+            )
+
+        # Log detailed breakdown for relevant cases
+        if should_log_details:
+            service_adj = details.get('service_adjustment', 0)
+
+            logging.info(
+                f"  → Score breakdown: "
+                f"pattern={breakdown.get('attack_pattern', 0):.1f}, "
+                f"scanner_ua={breakdown.get('scanner_ua', 0):.1f}, "
+                f"error_rate={breakdown.get('error_rate', 0):.1f}, "
+                f"path_diversity={breakdown.get('path_diversity', 0):.1f}, "
+                f"rate={breakdown.get('rate', 0):.1f}"
+            )
+
+            if service_adj != 0:
+                svc_name = details.get('service_name', 'unknown')
+                verification_method = details.get('verification_method', 'unknown')
+                logging.info(
+                    f"  → Verified service: {svc_name} (via {verification_method})"
+                )
+
+            aws_service = details.get('aws_service')
+            if aws_service:
+                logging.info(f"  → AWS service detected: {aws_service}")
+
+            # Log attack pattern and scanner details
+            attack_hits = details.get('attack_pattern_hits', 0)
+            scanner_hits = details.get('scanner_ua_hits', 0)
+            error_count = details.get('error_responses', 0)
+            if attack_hits > 0 or scanner_hits > 0:
+                logging.info(
+                    f"  → Attack patterns: {attack_hits}, Scanner UAs: {scanner_hits}, "
+                    f"Errors: {error_count}/{hit_count}"
+                )
+
+        # Warn for high-hit IPs that were skipped (potential false negative)
+        if not blocked and is_high_traffic:
+            logging.warning(
+                f"⚠️  High-traffic IP {ip} ({hit_count} hits) was NOT blocked. "
+                f"Score {score:.1f} < threshold {min_score}. "
+                f"Review if this is expected."
+            )
+
+    def _aggregate_threat_signals(
+        self, signal_dicts: List[Dict[str, ThreatSignals]]
+    ) -> Dict[str, ThreatSignals]:
+        """
+        Aggregate threat signals from multiple log files.
+
+        Args:
+            signal_dicts: List of dicts mapping IPs to ThreatSignals
+
+        Returns:
+            Combined dict with aggregated signals
+        """
+        aggregated: Dict[str, ThreatSignals] = {}
+
+        for signals in signal_dicts:
+            for ip, signals_obj in signals.items():
+                if ip not in aggregated:
+                    aggregated[ip] = ThreatSignals()
+
+                # Merge signals
+                agg = aggregated[ip]
+                agg.attack_pattern_hits += signals_obj.attack_pattern_hits
+                agg.scanner_ua_hits += signals_obj.scanner_ua_hits
+                agg.error_responses += signals_obj.error_responses
+                agg.total_requests += signals_obj.total_requests
+                agg.unique_paths.update(signals_obj.unique_paths)
+
+                if signals_obj.first_seen:
+                    if agg.first_seen is None or signals_obj.first_seen < agg.first_seen:
+                        agg.first_seen = signals_obj.first_seen
+                if signals_obj.last_seen:
+                    if agg.last_seen is None or signals_obj.last_seen > agg.last_seen:
+                        agg.last_seen = signals_obj.last_seen
+
+        return aggregated
+
+    def _filter_by_multi_signal(
+        self,
+        candidate_ips: Set[str],
+        log_keys: List[Tuple[str, str]],
+        metrics_dimensions: Dict[str, str],
+    ) -> Set[str]:
+        """
+        Filter candidate IPs using multi-signal threat detection.
+
+        Only IPs that meet the threat score threshold are returned.
+
+        Args:
+            candidate_ips: Set of IPs that passed initial pattern matching
+            log_keys: List of (bucket, key) tuples for log files to analyze
+            metrics_dimensions: Dimensions for CloudWatch metrics
+
+        Returns:
+            Set of IPs that pass the multi-signal threshold
+        """
+        if not candidate_ips:
+            return set()
+
+        # Process logs with multi-signal extraction
+        all_signals: List[Dict[str, ThreatSignals]] = []
+
+        with ThreadPoolExecutor(max_workers=10) as executor:
+            futures = {
+                executor.submit(self._download_and_parse_log_multi_signal, bucket, key): (bucket, key)
+                for bucket, key in log_keys
+            }
+            for future in as_completed(futures):
+                try:
+                    result = future.result()
+                    if result:
+                        all_signals.append(result)
+                except Exception as e:
+                    bucket, key = futures[future]
+                    logging.warning(f"Error in multi-signal processing for {key}: {e}")
+
+        # Aggregate signals across all files
+        aggregated = self._aggregate_threat_signals(all_signals)
+
+        # Filter candidates based on threat scores
+        confirmed_offenders = set()
+        skipped_ips: List[Tuple[str, float, Dict[str, Any]]] = []
+
+        for ip in candidate_ips:
+            if ip not in aggregated:
+                # No multi-signal data - use original pattern-match decision
+                # This shouldn't happen normally, but be safe
+                confirmed_offenders.add(ip)
+                continue
+
+            signals = aggregated[ip]
+            is_malicious_base, base_score, breakdown = signals.is_malicious(self._threat_signals_config)
+
+            # Enhanced details for logging
+            details: Dict[str, Any] = {
+                'base_score': base_score,
+                'breakdown': breakdown,
+                'hit_count': signals.total_requests,
+                'reasons': [],
+                'top_user_agents': list(signals.unique_paths)[:3] if hasattr(signals, 'unique_paths') else [],
+                'attack_pattern_hits': signals.attack_pattern_hits,
+                'scanner_ua_hits': signals.scanner_ua_hits,
+                'error_responses': signals.error_responses,
+            }
+
+            # Add reasons based on signal breakdown
+            if breakdown.get('attack_pattern', 0) > 0:
+                details['reasons'].append(f"attack_patterns ({signals.attack_pattern_hits} hits)")
+            if breakdown.get('scanner_ua', 0) > 0:
+                details['reasons'].append(f"scanner_ua ({signals.scanner_ua_hits} hits)")
+            if breakdown.get('error_rate', 0) > 0:
+                error_ratio = signals.error_responses / signals.total_requests if signals.total_requests else 0
+                details['reasons'].append(f"high_error_rate ({error_ratio:.0%})")
+            if breakdown.get('path_diversity', 0) > 0:
+                details['reasons'].append(f"path_scanning ({len(signals.unique_paths)} unique paths)")
+
+            # Check for legitimate service verification (reduces false positives)
+            service_adjustment = 0
+            service_name = None
+            verification_method = None
+
+            # Get sample request data for service verification
+            sample_paths = list(signals.unique_paths)[:20] if hasattr(signals, 'unique_paths') else []
+            # For service verification, we need to check if this looks like a legitimate service
+            # Since we don't have the actual UA here, we check using basic heuristics
+            # The full verification would happen at request parsing time
+            if self.aws_ip_index is not None:
+                # Check if IP belongs to any known AWS service
+                aws_service = self.aws_ip_index.get_service_for_ip(ip)
+                if aws_service:
+                    details['aws_service'] = aws_service
+                    # Only give score reduction for health check services
+                    if aws_service in [AWS_SERVICE_ROUTE53_HEALTHCHECKS, AWS_SERVICE_ELB]:
+                        service_adjustment = -15
+                        service_name = aws_service
+                        verification_method = 'aws_service_ip'
+                        details['reasons'].append(f"aws_service_ip ({aws_service})")
+                        details['service_adjustment'] = service_adjustment
+
+            # Calculate final score with service adjustment
+            final_score = max(0, base_score + service_adjustment)
+            details['final_score'] = final_score
+            details['service_name'] = service_name
+            details['verification_method'] = verification_method
+
+            # Determine if malicious based on final score
+            min_score = self._threat_signals_config['min_threat_score']
+            is_malicious_final = final_score >= min_score
+
+            if is_malicious_final:
+                confirmed_offenders.add(ip)
+                self._log_threat_score_details(ip, final_score, details, blocked=True)
+            else:
+                skipped_ips.append((ip, final_score, details))
+                self._log_threat_score_details(ip, final_score, details, blocked=False)
+
+        # Store skipped IPs for dry-run summary
+        self._skipped_ips = skipped_ips
+
+        # Emit metrics for threat scores
+        if aggregated:
+            avg_score = sum(
+                signals.calculate_threat_score(self._threat_signals_config)[0]
+                for ip, signals in aggregated.items()
+                if ip in candidate_ips
+            ) / len(candidate_ips) if candidate_ips else 0
+            self._metrics.put_metric(
+                "AverageThreatScore", avg_score, "None", metrics_dimensions
+            )
+
+        return confirmed_offenders
+
+    # -------------------------------------------------------------------------
+    # Athena Integration for Large-Scale Log Analysis
+    # -------------------------------------------------------------------------
+
+    def _init_athena(self):
+        """Initialize Athena client if not already done."""
+        if not hasattr(self, '_athena') or self._athena is None:
+            self._athena = boto3.client("athena", region_name=self.region)
+
+    def _setup_athena_table(
+        self,
+        database: str,
+        table_name: str,
+        s3_log_location: str,
+        output_location: str,
+    ) -> bool:
+        """
+        Create or verify the Athena table for ALB logs.
+
+        Uses the standard ALB log format as defined by AWS.
+
+        Args:
+            database: Athena database name
+            table_name: Table name to create
+            s3_log_location: S3 location of ALB logs (s3://bucket/prefix/)
+            output_location: S3 location for query results
+
+        Returns:
+            bool: True if table exists or was created successfully
+        """
+        self._init_athena()
+
+        # ALB log table DDL (standard AWS format)
+        create_table_query = f"""
+        CREATE EXTERNAL TABLE IF NOT EXISTS {database}.{table_name} (
+            type string,
+            time string,
+            elb string,
+            client_ip string,
+            client_port int,
+            target_ip string,
+            target_port int,
+            request_processing_time double,
+            target_processing_time double,
+            response_processing_time double,
+            elb_status_code int,
+            target_status_code string,
+            received_bytes bigint,
+            sent_bytes bigint,
+            request_verb string,
+            request_url string,
+            request_proto string,
+            user_agent string,
+            ssl_cipher string,
+            ssl_protocol string,
+            target_group_arn string,
+            trace_id string,
+            domain_name string,
+            chosen_cert_arn string,
+            matched_rule_priority string,
+            request_creation_time string,
+            actions_executed string,
+            redirect_url string,
+            lambda_error_reason string,
+            target_port_list string,
+            target_status_code_list string,
+            classification string,
+            classification_reason string
+        )
+        ROW FORMAT SERDE 'org.apache.hadoop.hive.serde2.RegexSerDe'
+        WITH SERDEPROPERTIES (
+            'serialization.format' = '1',
+            'input.regex' =
+            '([^ ]*) ([^ ]*) ([^ ]*) ([^ ]*):([0-9]*) ([^ ]*)[:-]([0-9]*) ([-.0-9]*) ([-.0-9]*) ([-.0-9]*) (|[-0-9]*) (-|[-0-9]*) ([-0-9]*) ([-0-9]*) \"([^ ]*) (.*) (- |[^ ]*)\" \"([^\"]*)\" ([A-Z0-9-_]+) ([A-Za-z0-9.-]*) ([^ ]*) \"([^\"]*)\" \"([^\"]*)\" \"([^\"]*)\" ([-.0-9]*) ([^ ]*) \"([^\"]*)\" \"([^\"]*)\" \"([^ ]*)\" \"([^\\s]+?)\" \"([^\\s]+)\" \"([^ ]*)\" \"([^ ]*)\"'
+        )
+        LOCATION '{s3_log_location}'
+        """
+
+        try:
+            # Create database if not exists
+            self._execute_athena_query(
+                f"CREATE DATABASE IF NOT EXISTS {database}",
+                output_location,
+                wait=True,
+            )
+
+            # Create table
+            self._execute_athena_query(
+                create_table_query,
+                output_location,
+                wait=True,
+            )
+
+            logging.info(f"Athena table {database}.{table_name} ready")
+            return True
+
+        except Exception as e:
+            logging.error(f"Failed to set up Athena table: {e}")
+            return False
+
+    def _execute_athena_query(
+        self,
+        query: str,
+        output_location: str,
+        database: Optional[str] = None,
+        wait: bool = True,
+        timeout_seconds: int = 300,
+    ) -> Optional[str]:
+        """
+        Execute an Athena query and optionally wait for completion.
+
+        Args:
+            query: SQL query to execute
+            output_location: S3 location for results
+            database: Optional database context
+            wait: If True, poll until query completes
+            timeout_seconds: Max time to wait for query
+
+        Returns:
+            str: Query execution ID if successful, None on failure
+        """
+        self._init_athena()
+
+        try:
+            params = {
+                "QueryString": query,
+                "ResultConfiguration": {
+                    "OutputLocation": output_location,
+                },
+            }
+            if database:
+                params["QueryExecutionContext"] = {"Database": database}
+
+            response = self._athena.start_query_execution(**params)
+            query_id = response["QueryExecutionId"]
+            logging.debug(f"Started Athena query: {query_id}")
+
+            if wait:
+                return self._wait_for_athena_query(query_id, timeout_seconds)
+            return query_id
+
+        except Exception as e:
+            logging.error(f"Failed to execute Athena query: {e}")
+            return None
+
+    def _wait_for_athena_query(
+        self,
+        query_id: str,
+        timeout_seconds: int = 300,
+    ) -> Optional[str]:
+        """
+        Wait for an Athena query to complete.
+
+        Args:
+            query_id: Query execution ID
+            timeout_seconds: Max time to wait
+
+        Returns:
+            str: Query ID if successful, None on failure
+        """
+        import time
+
+        start_time = time.time()
+        poll_interval = 1  # Start with 1 second
+
+        while time.time() - start_time < timeout_seconds:
+            try:
+                response = self._athena.get_query_execution(
+                    QueryExecutionId=query_id
+                )
+                state = response["QueryExecution"]["Status"]["State"]
+
+                if state == "SUCCEEDED":
+                    return query_id
+                elif state in ("FAILED", "CANCELLED"):
+                    reason = response["QueryExecution"]["Status"].get(
+                        "StateChangeReason", "Unknown"
+                    )
+                    logging.error(f"Athena query {state}: {reason}")
+                    return None
+
+                # Exponential backoff (max 30s)
+                time.sleep(poll_interval)
+                poll_interval = min(poll_interval * 1.5, 30)
+
+            except Exception as e:
+                logging.error(f"Error polling Athena query status: {e}")
+                return None
+
+        logging.error(f"Athena query timed out after {timeout_seconds}s")
+        return None
+
+    def _query_athena_for_attackers(
+        self,
+        database: str,
+        table_name: str,
+        output_location: str,
+        lookback_hours: float,
+        attack_patterns: List[str],
+        min_count: int,
+    ) -> Optional[Counter]:
+        """
+        Query Athena for IPs matching attack patterns with hit counts.
+
+        This is more efficient than processing individual log files for
+        large-scale analysis across many log files.
+
+        Args:
+            database: Athena database name
+            table_name: Table name
+            output_location: S3 location for query results
+            lookback_hours: How far back to look
+            attack_patterns: SQL LIKE patterns for attacks
+            min_count: Minimum hit count to include
+
+        Returns:
+            Counter: IP -> hit count mapping, or None on failure
+        """
+        self._init_athena()
+
+        # Build WHERE clause for attack patterns
+        pattern_conditions = " OR ".join([
+            f"request_url LIKE '%{pattern}%'"
+            for pattern in attack_patterns
+        ])
+
+        # Calculate time boundary
+        cutoff_time = datetime.now(timezone.utc) - timedelta(hours=lookback_hours)
+        time_filter = cutoff_time.strftime("%Y-%m-%dT%H:%M:%S")
+
+        query = f"""
+        SELECT
+            client_ip,
+            COUNT(*) as hit_count
+        FROM {database}.{table_name}
+        WHERE
+            time >= '{time_filter}'
+            AND ({pattern_conditions})
+        GROUP BY client_ip
+        HAVING COUNT(*) >= {min_count}
+        ORDER BY hit_count DESC
+        LIMIT 10000
+        """
+
+        query_id = self._execute_athena_query(
+            query,
+            output_location,
+            database=database,
+            wait=True,
+            timeout_seconds=600,  # 10 minutes for large queries
+        )
+
+        if not query_id:
+            return None
+
+        return self._get_athena_results_as_counter(query_id)
+
+    def _get_athena_results_as_counter(self, query_id: str) -> Optional[Counter]:
+        """
+        Get Athena query results and convert to Counter.
+
+        Args:
+            query_id: Completed query execution ID
 
-            logging.info(
-                f"Searching for logs in s3://{bucket}/{base_prefix} "
-                f"across {len(date_prefixes)} date(s) from {start_time.date()} to {end_date}"
-            )
+        Returns:
+            Counter: IP -> count mapping, or None on failure
+        """
+        self._init_athena()
 
-            log_files_to_process = []
+        try:
+            paginator = self._athena.get_paginator("get_query_results")
+            results = Counter()
 
-            # Scan each date prefix separately (much faster than scanning all dates)
-            for date_prefix in date_prefixes:
-                pages = paginator.paginate(
-                    Bucket=bucket,
-                    Prefix=date_prefix,
-                    PaginationConfig={"MaxItems": 10000},  # Per-date limit
-                )
+            for page in paginator.paginate(QueryExecutionId=query_id):
+                for row in page["ResultSet"]["Rows"][1:]:  # Skip header
+                    data = row["Data"]
+                    if len(data) >= 2:
+                        ip = data[0].get("VarCharValue", "")
+                        count_str = data[1].get("VarCharValue", "0")
+                        if ip and count_str.isdigit():
+                            results[ip] = int(count_str)
 
-                for page in pages:
-                    if "Contents" in page:
-                        for obj in page["Contents"]:
-                            if (
-                                not obj["Key"].endswith("/")
-                                and obj["LastModified"] >= start_time
-                            ):
-                                log_files_to_process.append(obj["Key"])
+            logging.info(f"Athena query returned {len(results)} IPs")
+            return results
 
-            logging.info(
-                f"S3 scan complete: found {len(log_files_to_process)} matching log file(s) across {len(date_prefixes)} date(s)."
-            )
-            return log_files_to_process
         except Exception as e:
-            logging.error(f"Error listing S3 objects for prefix {prefix}: {e}")
-            return []
+            logging.error(f"Failed to get Athena results: {e}")
+            return None
 
-    def _process_logs_in_parallel(
-        self, bucket_key_pairs: List[Tuple[str, str]]
-    ) -> List[str]:
-        """Uses a thread pool to download and parse logs concurrently."""
-        all_malicious_ips = []
-        total_files = len(bucket_key_pairs)
-        completed_files = 0
+    def _process_logs_via_athena(
+        self,
+        log_location: str,
+        lookback_hours: float,
+    ) -> Optional[Counter]:
+        """
+        Process ALB logs using Athena for large-scale analysis.
 
-        with ThreadPoolExecutor(max_workers=10) as executor:
-            future_to_key = {
-                executor.submit(self._download_and_parse_log, bucket, key): (
-                    bucket,
-                    key,
-                )
-                for bucket, key in bucket_key_pairs
-            }
-            for future in as_completed(future_to_key):
-                completed_files += 1
-                try:
-                    ips_from_file = future.result()
-                    all_malicious_ips.extend(ips_from_file)
+        This method is an alternative to _process_logs_in_parallel() for
+        scenarios with many log files where S3 GetObject would be too slow.
 
-                    # Progress update every 10 files or at completion
-                    if completed_files % 10 == 0 or completed_files == total_files:
-                        logging.info(
-                            f"Log processing progress: {completed_files}/{total_files} files "
-                            f"({completed_files * 100 // total_files}%) - found {len(all_malicious_ips)} malicious requests so far"
-                        )
-                except Exception as e:
-                    logging.error(f"Error processing a log file in thread: {e}")
-        return all_malicious_ips
+        Args:
+            log_location: S3 URI for ALB logs (s3://bucket/prefix/)
+            lookback_hours: How far back to analyze
 
-    def _download_and_parse_log(self, bucket: str, key: str) -> List[str]:
-        logging.debug(f"Starting processing for file: {key.split('/')[-1]}")
-        response = self.s3.get_object(Bucket=bucket, Key=key)
-        with gzip.open(response["Body"], "rt") as f:
-            malicious_ips = []
-            for line in f:
-                if ATTACK_PATTERNS.search(line):
-                    parts = line.split()
-                    if len(parts) > 3:
-                        ip_str = parts[3].split(":")[0]
-                        if is_valid_public_ipv4(ip_str):
-                            malicious_ips.append(ip_str)
-        logging.debug(
-            f"Finished processing file: {key.split('/')[-1]}, found {len(malicious_ips)} malicious IPs."
+        Returns:
+            Counter: IP -> hit count mapping, or None on failure
+        """
+        if not self._athena_enabled:
+            logging.warning("Athena integration not enabled")
+            return None
+
+        # Derive table name from LB pattern
+        safe_pattern = re.sub(r'[^a-zA-Z0-9]', '_', self.lb_name_pattern)
+        table_name = f"alb_logs_{safe_pattern}_{self.region.replace('-', '_')}"
+
+        # Set up table if needed
+        if not self._setup_athena_table(
+            self._athena_database,
+            table_name,
+            log_location,
+            self._athena_output_location,
+        ):
+            return None
+
+        # Attack patterns for SQL LIKE queries
+        sql_patterns = [
+            "../",           # Path traversal
+            ".env",          # Environment file access
+            ".git",          # Git repository access
+            "wp-login",      # WordPress login
+            "wp-admin",      # WordPress admin
+            "phpmyadmin",    # phpMyAdmin
+            "<script",       # XSS
+            "UNION SELECT",  # SQL injection
+            "eval(",         # Code injection
+            "/etc/passwd",   # System file access
+            ".php?",         # PHP with params (often exploits)
+        ]
+
+        return self._query_athena_for_attackers(
+            self._athena_database,
+            table_name,
+            self._athena_output_location,
+            lookback_hours,
+            sql_patterns,
+            self.threshold,
         )
-        return malicious_ips
 
     def _get_nacl_rules(self, nacl_id: str) -> Tuple[Dict[int, str], Set[int]]:
         """Gets all rules for a given NACL and separates them."""
@@ -917,9 +3748,12 @@ def _update_nacl_rules(self, nacl_id: str, offenders: Set[str], ip_counts: Count
 
     def _update_nacl_rules_with_registry(
         self, nacl_id: str, ips_to_block: Set[str], active_blocks: Dict[str, Dict]
-    ):
+    ) -> Tuple[Set[str], Set[str]]:
         """
         Updates NACL rules based on the persistent registry with priority-based slot management.
+
+        Returns:
+            Tuple of (ips_to_add, ips_to_remove) for summary reporting
         """
         existing_deny_rules, all_rule_nums = self._get_nacl_rules(nacl_id)
         existing_blocked_ips = {
@@ -953,6 +3787,8 @@ def _update_nacl_rules_with_registry(
                 nacl_id, ips_to_add, active_blocks
             )
 
+        return ips_to_add, ips_to_remove
+
     def _manage_rule_limit_and_add_with_priority(
         self, nacl_id: str, ips_to_add: Set[str], active_blocks: Dict[str, Dict]
     ):
@@ -1100,6 +3936,10 @@ def _send_slack_notification(self, message: str, is_critical: bool = False):
         Args:
             message: The message to send
             is_critical: If True, adds warning emoji to the message
+
+        Note:
+            Failed notifications are queued for retry at end of run.
+            Notification failures never affect core blocking logic.
         """
         if not self.slack_client:
             return
@@ -1111,11 +3951,46 @@ def _send_slack_notification(self, message: str, is_critical: bool = False):
         try:
             success = self.slack_client.post_message(message=message)
             if success:
-                logging.debug(f"Slack notification sent: {message}")
+                logging.debug(f"Slack notification sent successfully")
             else:
-                logging.debug("Failed to send Slack notification")
+                # Queue for retry
+                self._failed_slack_messages.append((message, is_critical))
+                logging.debug("Slack notification failed - queued for retry")
         except Exception as e:
-            logging.warning(f"Error sending Slack notification: {e}")
+            # Queue for retry - don't let Slack failures affect blocking
+            self._failed_slack_messages.append((message, is_critical))
+            logging.warning(f"Error sending Slack notification (queued for retry): {e}")
+
+    def _retry_failed_slack_messages(self):
+        """
+        Retry sending failed Slack messages at end of run.
+        Called once after all blocking operations complete.
+        """
+        if not self._failed_slack_messages or not self.slack_client:
+            return
+
+        logging.info(f"Retrying {len(self._failed_slack_messages)} failed Slack notification(s)...")
+        retry_successes = 0
+
+        for message, is_critical in self._failed_slack_messages:
+            try:
+                # Remove emoji prefix if already added (to avoid duplication)
+                clean_message = message.replace(":warning: ", "") if is_critical else message
+                final_message = f":warning: {clean_message}" if is_critical else clean_message
+
+                success = self.slack_client.post_message(message=final_message)
+                if success:
+                    retry_successes += 1
+            except Exception as e:
+                logging.debug(f"Retry failed for Slack message: {e}")
+
+        if retry_successes > 0:
+            logging.info(f"Successfully sent {retry_successes}/{len(self._failed_slack_messages)} queued Slack notifications")
+        else:
+            logging.warning(f"All {len(self._failed_slack_messages)} Slack notification retries failed")
+
+        # Clear the queue
+        self._failed_slack_messages.clear()
 
     def _send_summary_notification(
         self,
@@ -1268,15 +4143,187 @@ def _send_summary_notification_with_registry(
         message = "\n".join(summary_lines)
         self._send_slack_notification(message, is_critical=bool(newly_blocked))
 
+    def _send_enhanced_slack_notification(
+        self,
+        new_offenders: Set[str],
+        final_blocked_ips: Set[str],
+        ip_counts: Counter,
+        initially_blocked_ips: Set[str],
+        active_blocks: Dict[str, Dict],
+        run_id: Optional[str] = None,
+    ):
+        """
+        Sends enhanced Slack notifications with:
+        - Severity-based color coding
+        - Incident threading (all messages grouped by run_id)
+        - Actionable information organized by threat tier
+
+        Args:
+            new_offenders: Set of newly detected offending IPs
+            final_blocked_ips: Set of IPs actually blocked in NACL
+            ip_counts: Counter of malicious hits per IP
+            initially_blocked_ips: Set of IPs that were blocked before this run
+            active_blocks: Current block registry with tier information
+            run_id: Optional run identifier for threading
+        """
+        if not self.slack_client or self.dry_run:
+            return
+
+        # Calculate actual changes
+        newly_blocked = final_blocked_ips - initially_blocked_ips
+        newly_unblocked = initially_blocked_ips - final_blocked_ips
+
+        # Skip if no changes
+        if not newly_blocked and not newly_unblocked:
+            logging.info("No changes to blocked IPs. Skipping enhanced Slack notification.")
+            return
+
+        # Generate run_id for threading if not provided
+        if not run_id:
+            run_id = datetime.now(timezone.utc).strftime("%Y%m%d_%H%M%S")
+
+        incident_id = f"block_run_{run_id}"
+
+        # Determine overall severity based on highest threat tier
+        max_severity = SlackSeverity.INFO
+        tier_breakdown = {"minimal": 0, "low": 0, "medium": 0, "high": 0, "critical": 0}
+
+        for ip in newly_blocked:
+            tier = active_blocks.get(ip, {}).get("tier", "low")
+            tier_breakdown[tier] = tier_breakdown.get(tier, 0) + 1
+            tier_severity = TIER_TO_SEVERITY.get(tier, SlackSeverity.LOW)
+            if tier_severity.value > max_severity.value:
+                max_severity = tier_severity
+
+        # Use critical severity if many IPs blocked
+        if len(newly_blocked) >= 10:
+            max_severity = SlackSeverity.CRITICAL
+        elif len(newly_blocked) >= 5 and max_severity.value < SlackSeverity.HIGH.value:
+            max_severity = SlackSeverity.HIGH
+
+        # Build summary fields
+        fields = [
+            ("Region", self.region),
+            ("Pattern", f"`{self.lb_name_pattern}`"),
+            ("Total Blocked", str(len(final_blocked_ips))),
+            ("Lookback", str(self.lookback_delta)),
+        ]
+
+        if newly_blocked:
+            fields.append(("Newly Blocked", str(len(newly_blocked))))
+        if newly_unblocked:
+            fields.append(("Unblocked", str(len(newly_unblocked))))
+
+        # Tier breakdown
+        active_tiers = [f"{t}: {c}" for t, c in tier_breakdown.items() if c > 0]
+        if active_tiers:
+            fields.append(("Tier Breakdown", ", ".join(active_tiers)))
+
+        # Build description with top offenders
+        description_parts = []
+        if newly_blocked:
+            # Group by tier and show top offenders
+            tier_groups = {"critical": [], "high": [], "medium": [], "low": [], "minimal": []}
+            for ip in newly_blocked:
+                tier = active_blocks.get(ip, {}).get("tier", "low")
+                hits = ip_counts.get(ip, active_blocks.get(ip, {}).get("total_hits", 0))
+                tier_groups[tier].append((ip, hits))
+
+            # Show critical/high first
+            for tier_name in ["critical", "high", "medium", "low", "minimal"]:
+                ips_in_tier = tier_groups[tier_name]
+                if ips_in_tier:
+                    ips_in_tier.sort(key=lambda x: x[1], reverse=True)
+                    emoji = self._get_tier_emoji(tier_name)
+                    description_parts.append(f"\n{emoji} *{tier_name.upper()} tier ({len(ips_in_tier)}):*")
+                    for ip, hits in ips_in_tier[:3]:  # Top 3 per tier
+                        duration = active_blocks.get(ip, {}).get("block_duration_hours", 0)
+                        duration_str = self._format_duration(duration)
+                        ip_info = self._get_ip_info(ip)
+                        location = ""
+                        if ip_info:
+                            location = f" ({ip_info.get('country_code', '')})"
+                        description_parts.append(f"  `{ip}`{location} - {hits} hits, blocked {duration_str}")
+                    if len(ips_in_tier) > 3:
+                        description_parts.append(f"  _...and {len(ips_in_tier) - 3} more_")
+
+        if newly_unblocked:
+            description_parts.append(f"\n:white_check_mark: *Unblocked ({len(newly_unblocked)}):*")
+            for ip in list(newly_unblocked)[:3]:
+                description_parts.append(f"  `{ip}`")
+            if len(newly_unblocked) > 3:
+                description_parts.append(f"  _...and {len(newly_unblocked) - 3} more_")
+
+        description = "\n".join(description_parts) if description_parts else "No details available"
+
+        # Build action buttons (informational - actual action requires external handling)
+        action_buttons = []
+        if newly_blocked:
+            # Add informational button
+            action_buttons.append({
+                "text": "View Details",
+                "action_id": f"view_details_{run_id}",
+                "value": json.dumps({
+                    "run_id": run_id,
+                    "newly_blocked": list(newly_blocked)[:10],
+                    "region": self.region,
+                }),
+            })
+
+        # Post the enhanced notification
+        try:
+            self.slack_client.post_incident_notification(
+                title=f":shield: Auto Block Attackers - {self.region}",
+                description=description,
+                fields=fields,
+                severity=max_severity,
+                incident_id=incident_id,
+                action_buttons=action_buttons if action_buttons else None,
+            )
+            logging.info(f"Enhanced Slack notification sent for run {run_id}")
+        except Exception as e:
+            logging.warning(f"Failed to send enhanced Slack notification: {e}")
+            # Fall back to basic notification
+            self._send_slack_notification(
+                f"Auto Block Attackers - {self.region}: {len(newly_blocked)} blocked, {len(newly_unblocked)} unblocked",
+                is_critical=bool(newly_blocked),
+            )
+
+    def _get_tier_emoji(self, tier: str) -> str:
+        """Get emoji for threat tier."""
+        emoji_map = {
+            "critical": ":rotating_light:",
+            "high": ":red_circle:",
+            "medium": ":large_orange_circle:",
+            "low": ":large_yellow_circle:",
+            "minimal": ":white_circle:",
+        }
+        return emoji_map.get(tier, ":question:")
+
+    def _format_duration(self, hours: float) -> str:
+        """Format duration in hours to human readable string."""
+        if hours >= 24:
+            days = int(hours / 24)
+            return f"{days}d"
+        elif hours >= 1:
+            return f"{int(hours)}h"
+        else:
+            return f"{int(hours * 60)}m"
+
     def _get_ip_info(self, ip: str) -> Optional[Dict]:
         """
         Fetches detailed geolocation and hosting information for an IP address.
         Returns None if ipinfo is not configured or if lookup fails.
         Uses in-memory caching to reduce API calls.
+        Implements circuit breaker to disable after repeated failures.
         """
         if not self.ipinfo_handler:
             return None
 
+        # Circuit breaker: skip if too many failures
+        if self._ipinfo_circuit_open:
+            return None
+
         # Check cache first
         now = datetime.now(timezone.utc)
         if ip in self.ipinfo_cache:
@@ -1312,9 +4359,21 @@ def _get_ip_info(self, ip: str) -> Optional[Dict]:
             # Store in cache
             self.ipinfo_cache[ip] = (now, info)
 
+            # Reset failure counter on success
+            self._ipinfo_failures = 0
+
             return info
         except Exception as e:
-            logging.warning(f"Failed to fetch IP info for {ip}: {e}")
+            self._ipinfo_failures += 1
+            logging.warning(f"Failed to fetch IP info for {ip}: {e} (failure {self._ipinfo_failures}/{self._ipinfo_failure_threshold})")
+
+            # Open circuit breaker after threshold failures
+            if self._ipinfo_failures >= self._ipinfo_failure_threshold:
+                self._ipinfo_circuit_open = True
+                logging.warning(
+                    f"IPInfo circuit breaker OPEN - disabled for rest of run after {self._ipinfo_failures} consecutive failures"
+                )
+
             return None
 
     def _format_ip_info(self, ip_info: Optional[Dict]) -> str:
@@ -1364,6 +4423,13 @@ def _delete_deny_rule(self, nacl_id: str, ip: str, rule_num: int):
                 self._send_slack_notification(
                     f"[{self.region}] Removed IP block: {ip} (rule {rule_num}) - no longer meets threshold"
                 )
+            except ClientError as e:
+                error_code = e.response.get("Error", {}).get("Code", "")
+                if error_code == "InvalidNetworkAclEntry.NotFound":
+                    # Rule already deleted (possibly manually) - treat as success
+                    logging.warning(f"Rule {rule_num} for {ip} was already deleted (not found)")
+                else:
+                    logging.error(f"Failed to delete rule {rule_num}: {e}")
             except Exception as e:
                 logging.error(f"Failed to delete rule {rule_num}: {e}")
         else:
@@ -1386,6 +4452,13 @@ def _delete_deny_rule_with_reason(
                 self._send_slack_notification(
                     f"[{self.region}] Removed IP block: {ip} (rule {rule_num}) - {reason}"
                 )
+            except ClientError as e:
+                error_code = e.response.get("Error", {}).get("Code", "")
+                if error_code == "InvalidNetworkAclEntry.NotFound":
+                    # Rule already deleted (possibly manually) - treat as success
+                    logging.warning(f"Rule {rule_num} for {ip} was already deleted (not found)")
+                else:
+                    logging.error(f"Failed to delete rule {rule_num}: {e}")
             except Exception as e:
                 logging.error(f"Failed to delete rule {rule_num}: {e}")
         else:
@@ -1495,30 +4568,70 @@ def _generate_report(
         offenders: Set[str],
         final_blocked_ips: Set[str],
         active_blocks: Optional[Dict[str, Dict]] = None,
+        ips_to_add: Optional[Set[str]] = None,
+        ips_to_remove: Optional[Set[str]] = None,
     ):
-        """Prints a final summary table of actions taken."""
+        """
+        Prints a final summary table of actions taken or planned.
+
+        In dry-run mode, shows expected state changes rather than current state.
+
+        Args:
+            ip_counts: Counter of IP addresses and their hit counts
+            offenders: Set of IPs that should be blocked
+            final_blocked_ips: Set of IPs currently blocked
+            active_blocks: Dict of active block registry entries
+            ips_to_add: IPs that will be added to blocklist (dry-run tracking)
+            ips_to_remove: IPs that will be removed from blocklist (dry-run tracking)
+        """
         print("\n--- SCRIPT EXECUTION SUMMARY ---")
+
+        if self.dry_run:
+            print("(DRY RUN - showing planned changes, no actual modifications made)\n")
+
+        # Use sets for comparison
+        ips_to_add = ips_to_add or set()
+        ips_to_remove = ips_to_remove or set()
+
+        # Build skipped IPs lookup
+        skipped_ip_details: Dict[str, Tuple[float, Dict]] = {}
+        for ip, score, details in self._skipped_ips:
+            skipped_ip_details[ip] = (score, details)
+
         if active_blocks:
             print(
-                f"{'IP Address':<20} {'Hits':<10} {'Tier':<12} {'Status':<25} {'Block Until':<20}"
+                f"{'IP Address':<20} {'Hits':<10} {'Tier':<12} {'Status':<30} {'Block Until':<20}"
             )
-            print("-" * 87)
+            print("-" * 92)
         else:
-            print(f"{'IP Address':<20} {'Malicious Hits':<15} {'Status':<20}")
-            print("-" * 55)
+            print(f"{'IP Address':<20} {'Malicious Hits':<15} {'Status':<30}")
+            print("-" * 65)
 
-        # Include IPs from recent detection and registry
-        all_detected_ips = {
-            ip for ip, count in ip_counts.items() if count >= self.threshold
-        }
-        report_ips = all_detected_ips.union(final_blocked_ips)
+        # Collect all IPs to report
+        report_ips = set()
+
+        # IPs detected in this run (above threshold)
+        detected_ips = {ip for ip, count in ip_counts.items() if count >= self.threshold}
+        report_ips.update(detected_ips)
+
+        # Currently blocked IPs
+        report_ips.update(final_blocked_ips)
 
-        # If using registry, include all active blocks
+        # IPs in active blocks registry
         if active_blocks:
-            report_ips = report_ips.union(set(active_blocks.keys()))
+            report_ips.update(active_blocks.keys())
+
+        # IPs that will be added/removed
+        report_ips.update(ips_to_add)
+        report_ips.update(ips_to_remove)
+
+        # Include skipped IPs in report
+        report_ips.update(skipped_ip_details.keys())
 
         sorted_report_ips = sorted(
-            list(report_ips), key=lambda ip: ip_counts.get(ip, 0), reverse=True
+            list(report_ips),
+            key=lambda ip: (ip_counts.get(ip, 0), ip),
+            reverse=True,
         )
 
         if not sorted_report_ips and ip_counts:
@@ -1527,46 +4640,141 @@ def _generate_report(
             )
 
         for ip in sorted_report_ips:
-            status = "NOT BLOCKED (Below Threshold)"
-            if ip in self.whitelist:
-                status = "WHITELISTED"
-            elif is_aws_ip(ip, self.aws_networks):
-                status = "AWS IP (Excluded)"
-            elif ip in final_blocked_ips:
-                status = "ACTIVE BLOCK"
-            elif ip in offenders:
-                status = "SHOULD BE BLOCKED"
+            # Determine status based on dry-run vs live-run
+            if self.dry_run:
+                status = self._get_dry_run_status(
+                    ip,
+                    ips_to_add=ips_to_add,
+                    ips_to_remove=ips_to_remove,
+                    final_blocked_ips=final_blocked_ips,
+                    skipped_ip_details=skipped_ip_details,
+                    hits=ip_counts.get(ip, 0),
+                )
+            else:
+                status = self._get_live_run_status(
+                    ip,
+                    final_blocked_ips=final_blocked_ips,
+                    offenders=offenders,
+                    hits=ip_counts.get(ip, 0),
+                )
 
             hits = ip_counts.get(ip, 0)
+            tier = ""
+            block_until_str = ""
 
             if active_blocks and ip in active_blocks:
                 # Enhanced display with tier info
                 tier = active_blocks[ip].get("tier", "unknown")
                 block_until = active_blocks[ip].get("block_until", "unknown")
 
-                # Format block_until
+                # Format block_until in local timezone
                 try:
                     block_until_dt = datetime.fromisoformat(block_until)
                     if block_until_dt.tzinfo is None:
                         block_until_dt = block_until_dt.replace(tzinfo=timezone.utc)
-                    block_until_str = block_until_dt.strftime("%Y-%m-%d %H:%M")
+                    # Show in local time with timezone indicator
+                    local_dt = block_until_dt.astimezone()
+                    block_until_str = local_dt.strftime("%Y-%m-%d %H:%M %Z")
                 except Exception:
-                    block_until_str = "unknown"
+                    block_until_str = str(block_until) if block_until else ""
 
                 # Show total hits from registry if no recent hits
                 if hits == 0:
                     hits = active_blocks[ip].get("total_hits", 0)
 
+            if active_blocks:
                 print(
-                    f"{ip:<20} {str(hits):<10} {tier:<12} {status:<25} {block_until_str:<20}"
+                    f"{ip:<20} {str(hits):<10} {tier:<12} {status:<30} {block_until_str:<20}"
                 )
             else:
-                print(f"{ip:<20} {str(hits):<15} {status:<20}")
+                print(f"{ip:<20} {str(hits):<15} {status:<30}")
 
+        # Print separator
         if active_blocks:
-            print("-" * 87)
+            print("-" * 92)
         else:
-            print("-" * 55)
+            print("-" * 65)
+
+        # Print legend for dry-run mode
+        if self.dry_run:
+            print("\nLegend:")
+            print("  → WILL BE BLOCKED    = New block to be added")
+            print("  → WILL BE UNBLOCKED  = Expired block to be removed")
+            print("  NO CHANGE (blocked)  = Currently blocked, no change needed")
+            print("  SKIPPED (score=XX)   = Below threat score threshold")
+
+        # Log AWS IP lookup stats if available
+        if self.aws_ip_index is not None:
+            hits, misses, hit_rate = self.aws_ip_index.get_lookup_stats()
+            if hits + misses > 0:
+                logging.info(
+                    f"AWS IP lookup stats: {hits} lookups performed, "
+                    f"{misses} unique IPs checked"
+                )
+
+    def _get_dry_run_status(
+        self,
+        ip: str,
+        ips_to_add: Set[str],
+        ips_to_remove: Set[str],
+        final_blocked_ips: Set[str],
+        skipped_ip_details: Dict[str, Tuple[float, Dict]],
+        hits: int,
+    ) -> str:
+        """Determine display status for dry-run mode."""
+
+        if ip in self.whitelist:
+            return "WHITELISTED"
+
+        if is_aws_ip_fast(ip, self.aws_ip_index):
+            return "AWS IP (excluded)"
+
+        if ip in ips_to_add:
+            return "→ WILL BE BLOCKED"
+
+        if ip in ips_to_remove:
+            return "→ WILL BE UNBLOCKED (expired)"
+
+        if ip in final_blocked_ips:
+            return "NO CHANGE (blocked)"
+
+        if ip in skipped_ip_details:
+            score, details = skipped_ip_details[ip]
+            service_name = details.get('service_name') if details else None
+            if service_name:
+                return f"SKIPPED (score={score:.0f}, {service_name})"
+            return f"SKIPPED (score={score:.0f})"
+
+        if hits < self.threshold:
+            return f"BELOW THRESHOLD ({hits}<{self.threshold})"
+
+        return "NOT BLOCKED"
+
+    def _get_live_run_status(
+        self,
+        ip: str,
+        final_blocked_ips: Set[str],
+        offenders: Set[str],
+        hits: int,
+    ) -> str:
+        """Determine display status for live-run mode."""
+
+        if ip in self.whitelist:
+            return "WHITELISTED"
+
+        if is_aws_ip_fast(ip, self.aws_ip_index):
+            return "AWS IP (excluded)"
+
+        if ip in final_blocked_ips:
+            return "ACTIVE BLOCK"
+
+        if ip in offenders:
+            return "SHOULD BE BLOCKED (slot full?)"
+
+        if hits < self.threshold:
+            return "BELOW THRESHOLD"
+
+        return "NOT BLOCKED"
 
 
 if __name__ == "__main__":
@@ -1624,6 +4832,12 @@ def _generate_report(
         default="ip-ranges.json",
         help="Path to AWS ip-ranges.json file. If provided, automatically excludes all AWS IPs from blocking.",
     )
+    parser.add_argument(
+        "--no-auto-download-ip-ranges",
+        action="store_true",
+        help="Disable automatic download of AWS IP ranges file. Use for air-gapped environments. "
+        "If disabled and file is missing, AWS IP exclusion will be unavailable.",
+    )
     parser.add_argument(
         "--live-run",
         action="store_true",
@@ -1642,6 +4856,29 @@ def _generate_report(
         default=None,
         help="Slack channel to send notifications to (also can use SLACK_CHANNEL env var).",
     )
+    parser.add_argument(
+        "--enhanced-slack",
+        action="store_true",
+        help="Enable enhanced Slack notifications with color coding, threading, and formatted fields.",
+    )
+
+    # Athena integration options
+    parser.add_argument(
+        "--athena",
+        action="store_true",
+        help="Enable Athena for large-scale log analysis. Recommended for >1000 log files.",
+    )
+    parser.add_argument(
+        "--athena-database",
+        default="alb_logs",
+        help="Athena database name for ALB log tables (default: alb_logs).",
+    )
+    parser.add_argument(
+        "--athena-output-location",
+        default=None,
+        help="S3 location for Athena query results (e.g., s3://my-bucket/athena-results/). Required if --athena is used.",
+    )
+
     parser.add_argument(
         "--ipinfo-token",
         default=None,
@@ -1653,6 +4890,123 @@ def _generate_report(
         help="Path to block registry JSON file for persistent time-based blocking (default: ./block_registry.json).",
     )
 
+    # Storage backend options
+    parser.add_argument(
+        "--storage-backend",
+        choices=["local", "dynamodb", "s3"],
+        default=None,
+        help="Storage backend type: 'local' (JSON file), 'dynamodb' (DynamoDB table), 's3' (S3 bucket). "
+        "Default: 'local'. Also can use STORAGE_BACKEND env var.",
+    )
+    parser.add_argument(
+        "--dynamodb-table",
+        default=None,
+        help="DynamoDB table name for block registry (required if storage-backend=dynamodb). "
+        "Also can use DYNAMODB_TABLE env var.",
+    )
+    parser.add_argument(
+        "--s3-state-bucket",
+        default=None,
+        help="S3 bucket name for block registry (required if storage-backend=s3). "
+        "Also can use S3_STATE_BUCKET env var.",
+    )
+    parser.add_argument(
+        "--s3-state-key",
+        default="block_registry.json",
+        help="S3 object key for block registry (default: block_registry.json). "
+        "Also can use S3_STATE_KEY env var.",
+    )
+    parser.add_argument(
+        "--create-dynamodb-table",
+        action="store_true",
+        help="Create the DynamoDB table if it doesn't exist (requires additional IAM permissions).",
+    )
+
+    # IPv6 support options
+    parser.add_argument(
+        "--enable-ipv6",
+        action="store_true",
+        default=True,
+        help="Enable IPv6 blocking (default: enabled). Use --no-ipv6 to disable.",
+    )
+    parser.add_argument(
+        "--no-ipv6",
+        action="store_true",
+        help="Disable IPv6 blocking (only block IPv4 addresses).",
+    )
+    parser.add_argument(
+        "--start-rule-ipv6",
+        type=int,
+        default=180,
+        help="Starting NACL rule number for IPv6 DENY rules (default: 180).",
+    )
+    parser.add_argument(
+        "--limit-ipv6",
+        type=int,
+        default=20,
+        help="Maximum number of IPv6 DENY rules to manage (default: 20).",
+    )
+    parser.add_argument(
+        "--force-reprocess",
+        action="store_true",
+        help="Force reprocessing of all log files, ignoring the processed files cache.",
+    )
+
+    # AWS WAF IP Set arguments
+    parser.add_argument(
+        "--waf-ip-set-name",
+        type=str,
+        help="Name of the AWS WAF IP Set to sync blocked IPs to (enables WAF integration).",
+    )
+    parser.add_argument(
+        "--waf-ip-set-id",
+        type=str,
+        help="ID of an existing AWS WAF IP Set to use (alternative to --waf-ip-set-name).",
+    )
+    parser.add_argument(
+        "--waf-ip-set-scope",
+        type=str,
+        choices=["REGIONAL", "CLOUDFRONT"],
+        default="REGIONAL",
+        help="WAF IP Set scope: REGIONAL (for ALB/API Gateway) or CLOUDFRONT (default: REGIONAL).",
+    )
+    parser.add_argument(
+        "--create-waf-ip-set",
+        action="store_true",
+        help="Create the WAF IP Set if it doesn't exist.",
+    )
+
+    # Structured logging & CloudWatch metrics
+    parser.add_argument(
+        "--json-logging",
+        action="store_true",
+        help="Enable JSON structured logging format (for CloudWatch Logs ingestion).",
+    )
+    parser.add_argument(
+        "--enable-cloudwatch-metrics",
+        action="store_true",
+        help="Enable publishing metrics to CloudWatch (requires IAM permissions).",
+    )
+    parser.add_argument(
+        "--cloudwatch-namespace",
+        type=str,
+        default="AutoBlockAttackers",
+        help="CloudWatch metrics namespace (default: AutoBlockAttackers).",
+    )
+
+    # Multi-signal threat detection
+    parser.add_argument(
+        "--disable-multi-signal",
+        action="store_true",
+        help="Disable multi-signal threat detection (use pattern matching only).",
+    )
+    parser.add_argument(
+        "--min-threat-score",
+        type=int,
+        default=40,
+        help="Minimum threat score (0-100) to block an IP (default: 40).",
+    )
+
     args = parser.parse_args()
 
     # Get Slack credentials from args or environment variables
@@ -1662,6 +5016,35 @@ def _generate_report(
     # Get IPInfo token from args or environment variable
     ipinfo_token = args.ipinfo_token or os.getenv("IPINFO_TOKEN")
 
+    # Get storage backend configuration from args or environment variables
+    storage_backend = args.storage_backend or os.getenv("STORAGE_BACKEND", "local")
+    dynamodb_table = args.dynamodb_table or os.getenv("DYNAMODB_TABLE")
+    s3_state_bucket = args.s3_state_bucket or os.getenv("S3_STATE_BUCKET")
+    s3_state_key = args.s3_state_key or os.getenv("S3_STATE_KEY", "block_registry.json")
+
+    # Get WAF configuration from args or environment variables
+    waf_ip_set_name = args.waf_ip_set_name or os.getenv("WAF_IP_SET_NAME")
+    waf_ip_set_id = args.waf_ip_set_id or os.getenv("WAF_IP_SET_ID")
+    waf_ip_set_scope = args.waf_ip_set_scope or os.getenv("WAF_IP_SET_SCOPE", "REGIONAL")
+    create_waf_ip_set = args.create_waf_ip_set or os.getenv("CREATE_WAF_IP_SET", "").lower() == "true"
+
+    # Get logging & metrics configuration
+    json_logging = args.json_logging or os.getenv("JSON_LOGGING", "").lower() == "true"
+    enable_cloudwatch_metrics = args.enable_cloudwatch_metrics or os.getenv("ENABLE_CLOUDWATCH_METRICS", "").lower() == "true"
+    cloudwatch_namespace = args.cloudwatch_namespace or os.getenv("CLOUDWATCH_NAMESPACE", "AutoBlockAttackers")
+
+    # Get multi-signal configuration
+    disable_multi_signal = args.disable_multi_signal or os.getenv("DISABLE_MULTI_SIGNAL", "").lower() == "true"
+    enable_multi_signal = not disable_multi_signal
+    min_threat_score_env = os.getenv("MIN_THREAT_SCORE")
+    min_threat_score = args.min_threat_score if not min_threat_score_env else int(min_threat_score_env)
+
+    # Build threat signals config if score is customized
+    threat_signals_config = None
+    if min_threat_score != 40:  # Non-default value
+        threat_signals_config = DEFAULT_THREAT_SIGNALS_CONFIG.copy()
+        threat_signals_config["min_threat_score"] = min_threat_score
+
     # Validate inputs
     if args.threshold < 1:
         parser.error("Threshold must be at least 1")
@@ -1679,6 +5062,15 @@ def _generate_report(
             f"Will be capped at rule 99."
         )
 
+    # Validate storage backend configuration
+    if storage_backend == "dynamodb" and not dynamodb_table:
+        parser.error("--dynamodb-table is required when using dynamodb storage backend")
+    if storage_backend == "s3" and not s3_state_bucket:
+        parser.error("--s3-state-bucket is required when using s3 storage backend")
+
+    # Handle IPv6 enable/disable flag
+    enable_ipv6 = not args.no_ipv6
+
     blocker = NaclAutoBlocker(
         lb_name_pattern=args.lb_name_pattern,
         region=args.region,
@@ -1694,5 +5086,36 @@ def _generate_report(
         slack_channel=slack_channel,
         ipinfo_token=ipinfo_token,
         registry_file=args.registry_file,
+        storage_backend=storage_backend,
+        dynamodb_table=dynamodb_table,
+        s3_state_bucket=s3_state_bucket,
+        s3_state_key=s3_state_key,
+        create_dynamodb_table=args.create_dynamodb_table,
+        # IPv6 support parameters
+        start_rule_ipv6=args.start_rule_ipv6,
+        limit_ipv6=args.limit_ipv6,
+        enable_ipv6=enable_ipv6,
+        # Incremental processing
+        force_reprocess=args.force_reprocess,
+        # AWS WAF IP Set integration
+        waf_ip_set_name=waf_ip_set_name,
+        waf_ip_set_scope=waf_ip_set_scope,
+        waf_ip_set_id=waf_ip_set_id,
+        create_waf_ip_set=create_waf_ip_set,
+        # Structured logging & CloudWatch metrics
+        json_logging=json_logging,
+        enable_cloudwatch_metrics=enable_cloudwatch_metrics,
+        cloudwatch_namespace=cloudwatch_namespace,
+        # Multi-signal threat detection
+        enable_multi_signal=enable_multi_signal,
+        threat_signals_config=threat_signals_config,
+        # Enhanced Slack notifications
+        enhanced_slack=args.enhanced_slack,
+        # Athena integration
+        athena_enabled=args.athena,
+        athena_database=args.athena_database,
+        athena_output_location=args.athena_output_location,
+        # Auto-download AWS IP ranges
+        auto_download_ip_ranges=not args.no_auto_download_ip_ranges,
     )
     blocker.run()
diff --git a/docs/CLI_GUIDE.md b/docs/CLI_GUIDE.md
new file mode 100644
index 0000000..a9e0a45
--- /dev/null
+++ b/docs/CLI_GUIDE.md
@@ -0,0 +1,832 @@
+# CLI Reference Guide
+
+## AWS Auto Block Attackers - Command Line Interface
+
+This guide provides comprehensive documentation for all command-line options with real-world examples.
+
+---
+
+## Table of Contents
+
+1. [Quick Start](#quick-start)
+2. [Basic Options](#basic-options)
+3. [Storage Backends](#storage-backends)
+4. [IPv6 Configuration](#ipv6-configuration)
+5. [AWS WAF Integration](#aws-waf-integration)
+6. [Observability Options](#observability-options)
+7. [Multi-Signal Detection](#multi-signal-detection)
+8. [Athena Integration](#athena-integration)
+9. [Slack Notifications](#slack-notifications)
+10. [Common Use Cases](#common-use-cases)
+11. [Environment Variables](#environment-variables)
+
+---
+
+## Quick Start
+
+### Minimal Dry-Run
+
+```bash
+python3 auto_block_attackers.py
+```
+
+This runs with all defaults:
+- Pattern: `alb-*`
+- Region: `ap-southeast-2`
+- Lookback: `60m`
+- Threshold: `50`
+- Dry-run mode (no actual changes)
+
+### Minimal Production Run
+
+```bash
+python3 auto_block_attackers.py \
+  --lb-name-pattern "prod-alb-*" \
+  --live-run
+```
+
+---
+
+## Basic Options
+
+### `--lb-name-pattern`
+
+**Description:** Glob pattern to match Application Load Balancer names.
+
+**Default:** `alb-*`
+
+**Examples:**
+
+```bash
+# Match all ALBs starting with "prod-"
+--lb-name-pattern "prod-*"
+
+# Match specific ALB
+--lb-name-pattern "prod-api-alb"
+
+# Match multiple patterns (run separately)
+--lb-name-pattern "prod-web-*"
+--lb-name-pattern "prod-api-*"
+
+# Match ALBs with specific suffix
+--lb-name-pattern "*-public-alb"
+```
+
+---
+
+### `--region`
+
+**Description:** AWS region where ALBs are located.
+
+**Default:** `ap-southeast-2`
+
+**Examples:**
+
+```bash
+--region us-east-1
+--region eu-west-1
+--region ap-northeast-1
+```
+
+---
+
+### `--lookback`
+
+**Description:** How far back to analyze logs. Supports minutes (m), hours (h), and days (d).
+
+**Default:** `60m`
+
+**Examples:**
+
+```bash
+# Last 30 minutes (quick scan)
+--lookback 30m
+
+# Last 2 hours (standard)
+--lookback 2h
+
+# Last 6 hours (extended)
+--lookback 6h
+
+# Last 1 day (full day analysis)
+--lookback 1d
+
+# Last 90 minutes (custom)
+--lookback 90m
+```
+
+**Recommendations:**
+
+| Use Case | Lookback | Rationale |
+|----------|----------|-----------|
+| Frequent runs (every 5 min) | `15m` | Minimize overlap |
+| Standard cron (every 15 min) | `30m-60m` | Catch missed runs |
+| Hourly runs | `90m` | Buffer for delays |
+| Daily analysis | `24h` | Full day coverage |
+
+---
+
+### `--threshold`
+
+**Description:** Minimum number of malicious requests required to trigger blocking.
+
+**Default:** `50`
+
+**Examples:**
+
+```bash
+# Aggressive (block quickly)
+--threshold 20
+
+# Standard
+--threshold 50
+
+# Conservative (reduce false positives)
+--threshold 100
+
+# Very conservative (only major attackers)
+--threshold 500
+```
+
+**Guidelines:**
+
+| Traffic Volume | Recommended Threshold |
+|----------------|----------------------|
+| Low (<1000 req/hr) | 20-30 |
+| Medium (1000-10000 req/hr) | 50-100 |
+| High (>10000 req/hr) | 100-200 |
+
+---
+
+### `--start-rule`
+
+**Description:** Starting NACL rule number for IPv4 DENY rules.
+
+**Default:** `80`
+
+**Range:** Rules 80-99 are managed by default.
+
+```bash
+# Default (rules 80-99)
+--start-rule 80
+
+# Higher range (rules 100-119)
+--start-rule 100 --limit 20
+
+# Lower range (rules 50-69)
+--start-rule 50 --limit 20
+```
+
+**Important:** Ensure the rule range doesn't conflict with existing NACL rules.
+
+---
+
+### `--limit`
+
+**Description:** Maximum number of IPv4 DENY rules to manage.
+
+**Default:** `20`
+
+**Examples:**
+
+```bash
+# Fewer rules (conservative)
+--limit 10
+
+# Standard
+--limit 20
+
+# More rules (if NACL space available)
+--limit 30 --start-rule 70
+```
+
+---
+
+### `--whitelist-file`
+
+**Description:** Path to file containing whitelisted IPs/CIDRs.
+
+**Default:** `whitelist.txt`
+
+**File Format:**
+
+```text
+# Office IP
+203.0.113.50
+
+# Partner network
+198.51.100.0/24
+
+# Monitoring service
+192.0.2.10
+
+# IPv6 addresses work too
+2001:db8::1
+2001:db8::/32
+```
+
+**Examples:**
+
+```bash
+--whitelist-file /etc/auto-block/whitelist.txt
+--whitelist-file ./config/trusted-ips.txt
+--whitelist-file ""  # Disable whitelist
+```
+
+---
+
+### `--aws-ip-ranges-file`
+
+**Description:** Path to AWS ip-ranges.json file for automatic AWS IP exclusion. By default, the file is automatically downloaded from AWS if missing or older than 7 days.
+
+**Default:** `ip-ranges.json` (or `/tmp/ip-ranges.json` in Lambda environments)
+
+**Auto-Download:** The script automatically downloads fresh IP ranges from AWS:
+- On first run if file doesn't exist
+- If file is older than 7 days (stale)
+- Falls back to stale cache if download fails
+
+**Manual Download (optional):**
+
+```bash
+curl -o ip-ranges.json https://ip-ranges.amazonaws.com/ip-ranges.json
+```
+
+**Examples:**
+
+```bash
+--aws-ip-ranges-file /var/cache/aws-ip-ranges.json
+--aws-ip-ranges-file ""  # Disable AWS IP exclusion (not recommended)
+```
+
+---
+
+### `--no-auto-download-ip-ranges`
+
+**Description:** Disable automatic downloading of AWS IP ranges. Use this if you want to manage the ip-ranges.json file manually or in air-gapped environments.
+
+**Default:** Auto-download enabled
+
+**Examples:**
+
+```bash
+# Disable auto-download (use existing file only)
+--no-auto-download-ip-ranges
+
+# Use manual download in cron
+curl -o ip-ranges.json https://ip-ranges.amazonaws.com/ip-ranges.json
+python3 auto_block_attackers.py --no-auto-download-ip-ranges --live-run
+```
+
+---
+
+### `--registry-file`
+
+**Description:** Path to block registry JSON file.
+
+**Default:** `./block_registry.json`
+
+```bash
+--registry-file /var/lib/auto-block/registry.json
+--registry-file ./data/blocks.json
+```
+
+---
+
+### `--live-run`
+
+**Description:** Actually create/modify NACL rules. Without this flag, runs in dry-run mode.
+
+**Default:** `False` (dry-run)
+
+```bash
+# Dry-run (see what would happen)
+python3 auto_block_attackers.py
+
+# Live run (make changes)
+python3 auto_block_attackers.py --live-run
+```
+
+---
+
+### `--debug`
+
+**Description:** Enable verbose debug logging.
+
+```bash
+python3 auto_block_attackers.py --debug 2>&1 | tee debug.log
+```
+
+---
+
+## Storage Backends
+
+### `--storage-backend`
+
+**Description:** Choose where to persist block registry state.
+
+**Options:** `local`, `dynamodb`, `s3`
+
+**Default:** `local`
+
+### Local File Storage (Default)
+
+```bash
+--storage-backend local
+--registry-file ./block_registry.json
+```
+
+### DynamoDB Storage
+
+```bash
+# Use existing table
+--storage-backend dynamodb
+--dynamodb-table my-block-registry
+
+# Auto-create table if missing
+--storage-backend dynamodb
+--dynamodb-table my-block-registry
+--create-dynamodb-table
+```
+
+**DynamoDB Benefits:**
+- Multi-AZ durability
+- Supports concurrent access from multiple instances
+- Automatic scaling with on-demand capacity
+
+### S3 Storage
+
+```bash
+--storage-backend s3
+--s3-state-bucket my-security-bucket
+--s3-state-key auto-block/registry.json
+```
+
+**S3 Benefits:**
+- 11 9's durability
+- Version history
+- Cross-region replication possible
+
+---
+
+## IPv6 Configuration
+
+### `--start-rule-ipv6`
+
+**Description:** Starting NACL rule number for IPv6 DENY rules.
+
+**Default:** `180`
+
+```bash
+--start-rule-ipv6 180  # Rules 180-199
+--start-rule-ipv6 200  # Rules 200-219
+```
+
+### `--limit-ipv6`
+
+**Description:** Maximum number of IPv6 DENY rules.
+
+**Default:** `20`
+
+```bash
+--limit-ipv6 20
+--limit-ipv6 10  # Fewer IPv6 rules
+```
+
+### `--disable-ipv6`
+
+**Description:** Disable IPv6 blocking entirely.
+
+```bash
+--disable-ipv6
+```
+
+### Full IPv6 Example
+
+```bash
+python3 auto_block_attackers.py \
+  --lb-name-pattern "prod-*" \
+  --start-rule 80 \
+  --limit 20 \
+  --start-rule-ipv6 180 \
+  --limit-ipv6 20 \
+  --live-run
+```
+
+---
+
+## AWS WAF Integration
+
+### `--waf-ip-set-name`
+
+**Description:** Name of WAF IP Set to synchronize.
+
+```bash
+--waf-ip-set-name "blocked-attackers"
+--waf-ip-set-name "auto-block-prod"
+```
+
+### `--waf-ip-set-scope`
+
+**Description:** WAF scope for IP Set.
+
+**Options:** `REGIONAL`, `CLOUDFRONT`
+
+**Default:** `REGIONAL`
+
+```bash
+--waf-ip-set-scope REGIONAL    # For regional WAF (ALB, API Gateway)
+--waf-ip-set-scope CLOUDFRONT  # For CloudFront distributions
+```
+
+### `--waf-ip-set-id`
+
+**Description:** Specific IP Set ID (optional, will find by name if not provided).
+
+```bash
+--waf-ip-set-id "a1b2c3d4-5678-90ab-cdef-EXAMPLE11111"
+```
+
+### `--create-waf-ip-set`
+
+**Description:** Create the WAF IP Set if it doesn't exist.
+
+```bash
+--waf-ip-set-name "blocked-attackers" \
+--create-waf-ip-set
+```
+
+### Full WAF Example
+
+```bash
+python3 auto_block_attackers.py \
+  --lb-name-pattern "prod-*" \
+  --waf-ip-set-name "auto-blocked-ips" \
+  --waf-ip-set-scope REGIONAL \
+  --create-waf-ip-set \
+  --live-run
+```
+
+---
+
+## Observability Options
+
+### `--json-logging`
+
+**Description:** Output logs in JSON format for CloudWatch Logs ingestion.
+
+```bash
+python3 auto_block_attackers.py --json-logging 2>&1 | tee /var/log/auto-block.json
+```
+
+**Sample Output:**
+
+```json
+{"timestamp": "2026-01-09T10:30:00Z", "level": "INFO", "message": "Processing 150 log files..."}
+{"timestamp": "2026-01-09T10:30:05Z", "level": "WARNING", "message": "Blocking IP 1.2.3.4 (1523 hits)"}
+```
+
+### `--enable-cloudwatch-metrics`
+
+**Description:** Publish metrics to CloudWatch.
+
+```bash
+--enable-cloudwatch-metrics
+```
+
+### `--cloudwatch-namespace`
+
+**Description:** CloudWatch namespace for metrics.
+
+**Default:** `AutoBlockAttackers`
+
+```bash
+--enable-cloudwatch-metrics \
+--cloudwatch-namespace "Security/AutoBlock"
+```
+
+### Full Observability Example
+
+```bash
+python3 auto_block_attackers.py \
+  --lb-name-pattern "prod-*" \
+  --json-logging \
+  --enable-cloudwatch-metrics \
+  --cloudwatch-namespace "Production/Security/AutoBlock" \
+  --live-run
+```
+
+---
+
+## Multi-Signal Detection
+
+### `--disable-multi-signal`
+
+**Description:** Disable multi-signal threat detection (use pattern matching only).
+
+```bash
+--disable-multi-signal
+```
+
+### `--min-threat-score`
+
+**Description:** Minimum threat score to confirm an IP as malicious.
+
+**Default:** `40`
+
+**Range:** `0-100`
+
+```bash
+# More aggressive (lower score = more blocks)
+--min-threat-score 30
+
+# Standard
+--min-threat-score 40
+
+# More conservative (higher score = fewer blocks)
+--min-threat-score 60
+```
+
+### Understanding Threat Scores
+
+| Score | Interpretation |
+|-------|----------------|
+| 0-20 | Low threat (likely false positive) |
+| 20-40 | Moderate threat (borderline) |
+| 40-60 | Confirmed threat (standard) |
+| 60-80 | High confidence threat |
+| 80-100 | Definite attacker |
+
+### Full Multi-Signal Example
+
+```bash
+python3 auto_block_attackers.py \
+  --lb-name-pattern "prod-*" \
+  --min-threat-score 45 \
+  --debug \
+  --live-run
+```
+
+---
+
+## Athena Integration
+
+### `--athena`
+
+**Description:** Enable Athena for large-scale log analysis.
+
+### `--athena-database`
+
+**Description:** Athena database name.
+
+**Default:** `alb_logs`
+
+```bash
+--athena-database security_logs
+--athena-database prod_alb_analysis
+```
+
+### `--athena-output-location`
+
+**Description:** S3 location for Athena query results. **Required when using Athena.**
+
+```bash
+--athena-output-location "s3://my-bucket/athena-results/"
+```
+
+### Full Athena Example
+
+```bash
+python3 auto_block_attackers.py \
+  --lb-name-pattern "prod-*" \
+  --athena \
+  --athena-database "security_logs" \
+  --athena-output-location "s3://my-bucket/athena-results/" \
+  --lookback 24h \
+  --live-run
+```
+
+**When to Use Athena:**
+- More than 1000 log files to process
+- Historical analysis (multiple days)
+- Complex filtering requirements
+
+---
+
+## Slack Notifications
+
+### `--slack-token`
+
+**Description:** Slack bot token for notifications.
+
+```bash
+--slack-token "xoxb-1234567890-abcdefghijk"
+```
+
+**Prefer environment variable:** `SLACK_BOT_TOKEN`
+
+### `--slack-channel`
+
+**Description:** Slack channel ID or name.
+
+```bash
+--slack-channel "C04ABCDEFG"
+--slack-channel "#security-alerts"
+```
+
+**Prefer environment variable:** `SLACK_CHANNEL`
+
+### `--enhanced-slack`
+
+**Description:** Enable enhanced Slack notifications with:
+- Severity-based color coding
+- Block Kit formatting
+- Incident threading
+- Structured fields
+
+```bash
+--enhanced-slack
+```
+
+### Slack Setup
+
+1. Create a Slack App at https://api.slack.com/apps
+2. Add Bot Token Scopes: `chat:write`, `files:write`
+3. Install to workspace
+4. Copy Bot User OAuth Token
+
+### Full Slack Example
+
+```bash
+export SLACK_BOT_TOKEN="xoxb-your-token"
+export SLACK_CHANNEL="C04SECURITY"
+
+python3 auto_block_attackers.py \
+  --lb-name-pattern "prod-*" \
+  --enhanced-slack \
+  --live-run
+```
+
+---
+
+## Common Use Cases
+
+### 1. Development/Testing
+
+```bash
+python3 auto_block_attackers.py \
+  --lb-name-pattern "dev-*" \
+  --lookback 30m \
+  --threshold 10 \
+  --debug
+```
+
+### 2. Production - Hourly Cron
+
+```bash
+# crontab entry
+0 * * * * /opt/auto-block/run.sh >> /var/log/auto-block.log 2>&1
+
+# run.sh
+#!/bin/bash
+cd /opt/auto-block
+python3 auto_block_attackers.py \
+  --lb-name-pattern "prod-*" \
+  --region us-east-1 \
+  --lookback 90m \
+  --threshold 75 \
+  --storage-backend dynamodb \
+  --dynamodb-table prod-block-registry \
+  --enable-cloudwatch-metrics \
+  --enhanced-slack \
+  --live-run
+```
+
+### 3. Multi-Region Deployment
+
+```bash
+# Region 1
+python3 auto_block_attackers.py \
+  --lb-name-pattern "prod-*" \
+  --region us-east-1 \
+  --dynamodb-table global-block-registry \
+  --live-run
+
+# Region 2
+python3 auto_block_attackers.py \
+  --lb-name-pattern "prod-*" \
+  --region eu-west-1 \
+  --dynamodb-table global-block-registry \
+  --live-run
+```
+
+### 4. High-Security Environment
+
+```bash
+python3 auto_block_attackers.py \
+  --lb-name-pattern "prod-*" \
+  --threshold 25 \
+  --min-threat-score 35 \
+  --waf-ip-set-name "blocked-ips" \
+  --create-waf-ip-set \
+  --storage-backend dynamodb \
+  --dynamodb-table secure-block-registry \
+  --json-logging \
+  --enable-cloudwatch-metrics \
+  --enhanced-slack \
+  --live-run
+```
+
+### 5. Large-Scale with Athena
+
+```bash
+python3 auto_block_attackers.py \
+  --lb-name-pattern "prod-*" \
+  --athena \
+  --athena-database "security_analysis" \
+  --athena-output-location "s3://analytics-bucket/athena/" \
+  --lookback 24h \
+  --threshold 100 \
+  --live-run
+```
+
+### 6. Conservative/Low False Positive
+
+```bash
+python3 auto_block_attackers.py \
+  --lb-name-pattern "prod-*" \
+  --threshold 200 \
+  --min-threat-score 60 \
+  --lookback 2h \
+  --live-run
+```
+
+---
+
+## Environment Variables
+
+All sensitive values can be provided via environment variables:
+
+| Variable | CLI Equivalent | Description |
+|----------|---------------|-------------|
+| `SLACK_BOT_TOKEN` | `--slack-token` | Slack bot token |
+| `SLACK_CHANNEL` | `--slack-channel` | Slack channel |
+| `IPINFO_TOKEN` | `--ipinfo-token` | IPInfo API token |
+| `STORAGE_BACKEND` | `--storage-backend` | Storage type |
+| `DYNAMODB_TABLE` | `--dynamodb-table` | DynamoDB table name |
+| `S3_STATE_BUCKET` | `--s3-state-bucket` | S3 bucket for state |
+| `S3_STATE_KEY` | `--s3-state-key` | S3 key for state |
+| `DISABLE_MULTI_SIGNAL` | `--disable-multi-signal` | Set to "true" to disable |
+| `MIN_THREAT_SCORE` | `--min-threat-score` | Threat score threshold |
+| `AWS_DEFAULT_REGION` | `--region` | AWS region |
+
+### Example .env File
+
+```bash
+# AWS (if not using IAM role)
+AWS_DEFAULT_REGION=us-east-1
+
+# Slack
+SLACK_BOT_TOKEN=xoxb-your-token-here
+SLACK_CHANNEL=C04SECURITY
+
+# IPInfo (optional)
+IPINFO_TOKEN=your-ipinfo-token
+
+# Storage
+STORAGE_BACKEND=dynamodb
+DYNAMODB_TABLE=auto-block-registry
+
+# Threat Detection
+MIN_THREAT_SCORE=40
+```
+
+### Loading Environment
+
+```bash
+# Load from file
+source .env && python3 auto_block_attackers.py --live-run
+
+# Or use direnv
+echo "dotenv" > .envrc
+direnv allow
+python3 auto_block_attackers.py --live-run
+```
+
+---
+
+## Exit Codes
+
+| Code | Meaning |
+|------|---------|
+| 0 | Success |
+| 1 | Runtime error |
+| 2 | Configuration error |
+
+---
+
+## Help
+
+```bash
+python3 auto_block_attackers.py --help
+```
diff --git a/docs/TECHNICAL_DESIGN.md b/docs/TECHNICAL_DESIGN.md
new file mode 100644
index 0000000..b2ac31d
--- /dev/null
+++ b/docs/TECHNICAL_DESIGN.md
@@ -0,0 +1,829 @@
+# Technical Design Document
+
+## AWS Auto Block Attackers v2.0
+
+### Document Version: 2.0
+### Last Updated: January 2026
+
+---
+
+## Table of Contents
+
+1. [Overview](#1-overview)
+2. [Architecture](#2-architecture)
+3. [Core Components](#3-core-components)
+4. [Storage Backends](#4-storage-backends)
+5. [IPv6 Support](#5-ipv6-support)
+6. [AWS WAF Integration](#6-aws-waf-integration)
+7. [Multi-Signal Threat Detection](#7-multi-signal-threat-detection)
+8. [Athena Integration](#8-athena-integration)
+9. [Observability](#9-observability)
+10. [Security Considerations](#10-security-considerations)
+
+---
+
+## 1. Overview
+
+### 1.1 Purpose
+
+AWS Auto Block Attackers is an automated security tool that analyzes Application Load Balancer (ALB) access logs to detect malicious traffic patterns and implement tiered, time-based IP blocking via AWS Network ACLs (NACLs) and optionally AWS WAF IP Sets.
+
+### 1.2 Key Capabilities
+
+| Capability | Description |
+|------------|-------------|
+| **Pattern Detection** | Regex-based detection of LFI, XSS, SQLi, command injection, path traversal |
+| **Tiered Blocking** | 5-tier system (Critical→Minimal) with proportional block durations |
+| **Multi-Signal Analysis** | Reduces false positives by correlating multiple threat indicators |
+| **Dual-Stack Support** | Full IPv4 and IPv6 blocking capabilities |
+| **Cloud-Native Storage** | DynamoDB, S3, or local file storage for state persistence |
+| **AWS WAF Integration** | Parallel blocking via WAF IP Sets for edge protection |
+| **Athena Integration** | SQL-based log analysis for large-scale deployments |
+| **Observable** | Structured JSON logging, CloudWatch metrics, enhanced Slack notifications |
+
+### 1.3 Design Principles
+
+1. **Fail-Safe**: Security tool must never crash; graceful degradation on errors
+2. **Idempotent**: Multiple executions with same input produce same result
+3. **Observable**: Comprehensive logging and metrics for operational visibility
+4. **Configurable**: Sensible defaults with extensive customization options
+5. **Backward Compatible**: New features don't break existing deployments
+
+---
+
+## 2. Architecture
+
+### 2.1 High-Level Architecture
+
+```
+┌─────────────────────────────────────────────────────────────────────────────┐
+│                              AWS Auto Block Attackers                        │
+├─────────────────────────────────────────────────────────────────────────────┤
+│                                                                              │
+│  ┌──────────────┐    ┌──────────────┐    ┌──────────────┐                   │
+│  │   S3 Logs    │    │   Athena     │    │  CloudWatch  │                   │
+│  │   (Input)    │    │  (Optional)  │    │   (Metrics)  │                   │
+│  └──────┬───────┘    └──────┬───────┘    └──────▲───────┘                   │
+│         │                   │                   │                            │
+│         ▼                   ▼                   │                            │
+│  ┌────────────────────────────────────────┐    │                            │
+│  │         Log Processing Engine          │    │                            │
+│  │  ┌─────────────┐  ┌─────────────┐      │    │                            │
+│  │  │   Direct    │  │   Athena    │      │    │                            │
+│  │  │  S3 Fetch   │  │   Query     │      │    │                            │
+│  │  └─────────────┘  └─────────────┘      │    │                            │
+│  └────────────────┬───────────────────────┘    │                            │
+│                   │                            │                            │
+│                   ▼                            │                            │
+│  ┌────────────────────────────────────────┐    │                            │
+│  │         Threat Detection Engine        │────┘                            │
+│  │  ┌─────────────┐  ┌─────────────┐      │                                 │
+│  │  │   Pattern   │  │Multi-Signal │      │                                 │
+│  │  │   Matching  │  │  Analysis   │      │                                 │
+│  │  └─────────────┘  └─────────────┘      │                                 │
+│  └────────────────┬───────────────────────┘                                 │
+│                   │                                                          │
+│                   ▼                                                          │
+│  ┌────────────────────────────────────────┐                                 │
+│  │         Blocking Decision Engine       │                                 │
+│  │  ┌─────────────┐  ┌─────────────┐      │                                 │
+│  │  │    Tier     │  │  Priority   │      │                                 │
+│  │  │Classification│ │  Ordering   │      │                                 │
+│  │  └─────────────┘  └─────────────┘      │                                 │
+│  └────────────────┬───────────────────────┘                                 │
+│                   │                                                          │
+│         ┌─────────┴─────────┐                                               │
+│         ▼                   ▼                                               │
+│  ┌─────────────┐     ┌─────────────┐     ┌─────────────┐                   │
+│  │    NACL     │     │   WAF IP    │     │   Storage   │                   │
+│  │   Manager   │     │    Sets     │     │   Backend   │                   │
+│  └──────┬──────┘     └──────┬──────┘     └──────┬──────┘                   │
+│         │                   │                   │                            │
+└─────────┼───────────────────┼───────────────────┼────────────────────────────┘
+          │                   │                   │
+          ▼                   ▼                   ▼
+   ┌─────────────┐     ┌─────────────┐     ┌─────────────┐
+   │  AWS EC2    │     │  AWS WAF    │     │ DynamoDB/S3 │
+   │   NACLs     │     │  IP Sets    │     │   /Local    │
+   └─────────────┘     └─────────────┘     └─────────────┘
+```
+
+### 2.2 Execution Flow
+
+```
+START
+  │
+  ▼
+┌─────────────────────────────────────┐
+│ 1. Initialize                        │
+│    - Load configuration              │
+│    - Initialize AWS clients          │
+│    - Load block registry             │
+│    - Load processed files cache      │
+└─────────────────────────────────────┘
+  │
+  ▼
+┌─────────────────────────────────────┐
+│ 2. Discover Load Balancers          │
+│    - Match LB name pattern          │
+│    - Extract S3 log locations       │
+│    - Find associated NACLs          │
+└─────────────────────────────────────┘
+  │
+  ▼
+┌─────────────────────────────────────┐
+│ 3. Process Logs                     │
+│    - List S3 objects in window      │
+│    - Skip already-processed files   │
+│    - Parse logs (parallel/Athena)   │
+│    - Extract malicious IPs          │
+└─────────────────────────────────────┘
+  │
+  ▼
+┌─────────────────────────────────────┐
+│ 4. Apply Filters                    │
+│    - Remove whitelisted IPs         │
+│    - Remove AWS IPs (v4 + v6)       │
+│    - Apply threshold filter         │
+│    - Multi-signal validation        │
+└─────────────────────────────────────┘
+  │
+  ▼
+┌─────────────────────────────────────┐
+│ 5. Update Block Registry            │
+│    - Classify tiers                  │
+│    - Handle tier upgrades           │
+│    - Calculate expiration times     │
+│    - Merge with existing blocks     │
+└─────────────────────────────────────┘
+  │
+  ▼
+┌─────────────────────────────────────┐
+│ 6. Apply Blocks                     │
+│    - Update NACL rules (v4 + v6)    │
+│    - Sync WAF IP Sets               │
+│    - Respect priority ordering      │
+│    - Handle slot exhaustion         │
+└─────────────────────────────────────┘
+  │
+  ▼
+┌─────────────────────────────────────┐
+│ 7. Finalize                         │
+│    - Save block registry            │
+│    - Save processed files cache     │
+│    - Emit CloudWatch metrics        │
+│    - Send Slack notification        │
+└─────────────────────────────────────┘
+  │
+  ▼
+END
+```
+
+---
+
+## 3. Core Components
+
+### 3.1 NaclAutoBlocker Class
+
+The main orchestrator class that coordinates all operations.
+
+```python
+class NaclAutoBlocker:
+    """
+    Main class for automated IP blocking based on ALB log analysis.
+
+    Attributes:
+        lb_name_pattern (str): Glob pattern to match load balancer names
+        region (str): AWS region
+        lookback_delta (timedelta): How far back to analyze logs
+        threshold (int): Minimum hits to trigger blocking
+        dry_run (bool): If True, don't make actual changes
+    """
+```
+
+**Key Methods:**
+
+| Method | Purpose |
+|--------|---------|
+| `run()` | Main entry point, orchestrates entire flow |
+| `_download_and_parse_log()` | Fetch and parse single log file |
+| `_process_logs_in_parallel()` | Parallel log processing with ThreadPoolExecutor |
+| `_filter_by_multi_signal()` | Apply multi-signal threat detection |
+| `_determine_tier()` | Classify IP into threat tier |
+| `_sync_nacl_rules()` | Update NACL deny rules |
+| `_sync_waf_ip_set()` | Update WAF IP Set |
+
+### 3.2 Attack Pattern Detection
+
+Comprehensive regex patterns for common attack vectors:
+
+```python
+ATTACK_PATTERNS = re.compile(
+    r"(?:"
+    r"(?:\.\./|\.\.\\)"           # Path traversal
+    r"|/etc/passwd"               # Unix file access
+    r"|/proc/self"                # Linux proc filesystem
+    r"|<script[^>]*>"             # XSS script tags
+    r"|javascript:"               # JavaScript protocol
+    r"|UNION\s+SELECT"            # SQL injection
+    r"|SELECT\s+.*\s+FROM"        # SQL queries
+    r"|eval\s*\("                 # Code injection
+    r"|wp-login\.php"             # WordPress targeting
+    r"|/\.env"                    # Environment file exposure
+    r"|/\.git"                    # Git repository exposure
+    r"|phpMyAdmin"                # Admin panel scanning
+    r")",
+    re.IGNORECASE
+)
+```
+
+### 3.3 Tier Classification System
+
+```python
+DEFAULT_TIERS = [
+    # (min_hits, tier_name, block_hours, priority)
+    (2000, "critical", 168, 4),  # 7 days
+    (1000, "high", 72, 3),       # 3 days
+    (500, "medium", 48, 2),      # 2 days
+    (100, "low", 24, 1),         # 1 day
+    (0, "minimal", 1, 0),        # 1 hour
+]
+```
+
+**Tier Selection Algorithm:**
+```python
+def _determine_tier(self, hit_count: int) -> Tuple[str, int, int]:
+    for min_hits, tier_name, block_hours, priority in self.tier_config:
+        if hit_count >= min_hits:
+            return tier_name, block_hours, priority
+    return "minimal", 1, 0
+```
+
+---
+
+## 4. Storage Backends
+
+### 4.1 Architecture
+
+```
+┌─────────────────────────────────────────────────────────────┐
+│                    StorageBackend (ABC)                      │
+│  ┌─────────────────────────────────────────────────────┐    │
+│  │  + get(key: str) -> Optional[Dict]                   │    │
+│  │  + put(key: str, data: Dict) -> bool                │    │
+│  │  + delete(key: str) -> bool                         │    │
+│  │  + exists(key: str) -> bool                         │    │
+│  │  + list_keys(prefix: str) -> List[str]              │    │
+│  └─────────────────────────────────────────────────────┘    │
+└─────────────────────────────────────────────────────────────┘
+         │                    │                    │
+         ▼                    ▼                    ▼
+┌─────────────┐      ┌─────────────┐      ┌─────────────┐
+│LocalFileBack│      │DynamoDBBack │      │  S3Backend  │
+│    end      │      │    end      │      │             │
+└─────────────┘      └─────────────┘      └─────────────┘
+```
+
+### 4.2 Backend Comparison
+
+| Feature | Local File | DynamoDB | S3 |
+|---------|------------|----------|-----|
+| **Latency** | ~1ms | ~10ms | ~50ms |
+| **Durability** | Single host | Multi-AZ | 11 9's |
+| **Concurrency** | Lock file | Conditional writes | Versioning |
+| **Cost** | Free | Pay per request | Pay per request |
+| **Use Case** | Dev/single instance | Multi-instance | Archival/large state |
+
+### 4.3 Configuration
+
+```bash
+# Local (default)
+--storage-backend local
+--registry-file ./block_registry.json
+
+# DynamoDB
+--storage-backend dynamodb
+--dynamodb-table auto-block-attackers-state
+--create-dynamodb-table  # Auto-create table
+
+# S3
+--storage-backend s3
+--s3-state-bucket my-state-bucket
+--s3-state-key security/block-registry.json
+```
+
+### 4.4 DynamoDB Table Schema
+
+```
+Table: auto-block-attackers-state
+├── Primary Key: pk (String) - Partition key
+├── Attributes:
+│   ├── data (Map) - JSON data
+│   ├── updated_at (String) - ISO8601 timestamp
+│   └── ttl (Number) - Unix timestamp for TTL
+└── GSI: None (single key access pattern)
+```
+
+---
+
+## 5. IPv6 Support
+
+### 5.1 Dual-Stack Architecture
+
+```
+                    ┌─────────────────────────────────┐
+                    │        Log Processing           │
+                    │   ┌─────────┐   ┌─────────┐    │
+                    │   │  IPv4   │   │  IPv6   │    │
+                    │   │ Parsing │   │ Parsing │    │
+                    │   └────┬────┘   └────┬────┘    │
+                    │        │             │         │
+                    │        ▼             ▼         │
+                    │   ┌─────────────────────┐      │
+                    │   │   IP Validation     │      │
+                    │   │  (Public only)      │      │
+                    │   └──────────┬──────────┘      │
+                    └──────────────┼──────────────────┘
+                                   │
+              ┌────────────────────┴────────────────────┐
+              │                                         │
+              ▼                                         ▼
+     ┌─────────────────┐                       ┌─────────────────┐
+     │   NACL IPv4     │                       │   NACL IPv6     │
+     │  Rules 80-99    │                       │  Rules 180-199  │
+     │  (CidrBlock)    │                       │ (Ipv6CidrBlock) │
+     └─────────────────┘                       └─────────────────┘
+```
+
+### 5.2 IPv6 Address Handling
+
+```python
+def is_valid_public_ip(ip_str: str) -> Tuple[bool, int]:
+    """
+    Validate if an IP address is a public (routable) address.
+
+    Returns:
+        Tuple[bool, int]: (is_valid, ip_version)
+        - ip_version: 4 for IPv4, 6 for IPv6
+    """
+    try:
+        ip = ipaddress.ip_address(ip_str)
+        if ip.is_global and not ip.is_private:
+            return True, ip.version
+        return False, ip.version
+    except ValueError:
+        return False, 0
+```
+
+### 5.3 NACL Rule Structure
+
+**IPv4 Rule:**
+```python
+ec2.create_network_acl_entry(
+    NetworkAclId=nacl_id,
+    RuleNumber=85,  # 80-99 range
+    Protocol="-1",
+    RuleAction="deny",
+    CidrBlock="1.2.3.4/32",  # IPv4 CIDR
+    Egress=False,
+)
+```
+
+**IPv6 Rule:**
+```python
+ec2.create_network_acl_entry(
+    NetworkAclId=nacl_id,
+    RuleNumber=185,  # 180-199 range
+    Protocol="-1",
+    RuleAction="deny",
+    Ipv6CidrBlock="2001:db8::1/128",  # IPv6 CIDR
+    Egress=False,
+)
+```
+
+---
+
+## 6. AWS WAF Integration
+
+### 6.1 Architecture
+
+```
+┌─────────────────────────────────────────────────────────────┐
+│                   WAF IP Set Manager                         │
+├─────────────────────────────────────────────────────────────┤
+│                                                              │
+│  ┌─────────────┐    ┌─────────────┐    ┌─────────────┐     │
+│  │ IP Set      │    │  LockToken  │    │  Batch      │     │
+│  │ Discovery   │───▶│  Management │───▶│  Updates    │     │
+│  └─────────────┘    └─────────────┘    └─────────────┘     │
+│                                                              │
+└─────────────────────────────────────────────────────────────┘
+                              │
+                              ▼
+                    ┌─────────────────┐
+                    │   AWS WAFv2     │
+                    │   IP Sets       │
+                    │                 │
+                    │  ┌───────────┐  │
+                    │  │ IPv4 Set  │  │
+                    │  │ /32 CIDRs │  │
+                    │  └───────────┘  │
+                    │  ┌───────────┐  │
+                    │  │ IPv6 Set  │  │
+                    │  │/128 CIDRs │  │
+                    │  └───────────┘  │
+                    └─────────────────┘
+```
+
+### 6.2 Optimistic Locking
+
+WAF IP Sets use optimistic locking via `LockToken`:
+
+```python
+def _update_waf_ip_set_addresses(
+    self, ip_set_id: str, addresses: Set[str], lock_token: str
+) -> bool:
+    """
+    Update WAF IP Set with new addresses using optimistic locking.
+
+    The LockToken prevents concurrent modifications:
+    1. Get current IP Set (includes LockToken)
+    2. Modify addresses
+    3. Update with LockToken
+    4. If LockToken mismatch, retry with new token
+    """
+    try:
+        self.waf.update_ip_set(
+            Name=self._waf_ip_set_name,
+            Scope=self._waf_ip_set_scope,
+            Id=ip_set_id,
+            Addresses=list(addresses),
+            LockToken=lock_token,
+        )
+        return True
+    except self.waf.exceptions.WAFOptimisticLockException:
+        # Retry with fresh LockToken
+        return self._retry_waf_update(ip_set_id, addresses)
+```
+
+### 6.3 Configuration
+
+```bash
+# Enable WAF IP Set synchronization
+--waf-ip-set-name "blocked-attackers"
+--waf-ip-set-scope "REGIONAL"  # or "CLOUDFRONT"
+--waf-ip-set-id "abc123-..."   # Optional, will find by name
+--create-waf-ip-set            # Create if doesn't exist
+```
+
+---
+
+## 7. Multi-Signal Threat Detection
+
+### 7.1 Purpose
+
+Reduce false positives by correlating multiple threat indicators beyond simple pattern matching.
+
+### 7.2 Threat Signals
+
+```python
+class ThreatSignals:
+    """Aggregates multiple threat indicators for an IP."""
+
+    attack_pattern_hits: int  # ATTACK_PATTERNS matches
+    scanner_ua_hits: int      # Known scanner user agents
+    error_responses: int      # 4xx/5xx responses
+    total_requests: int       # Total request count
+    unique_paths: Set[str]    # Path diversity
+```
+
+### 7.3 Scoring Algorithm
+
+```python
+def calculate_threat_score(self, config: Dict) -> Tuple[float, Dict[str, float]]:
+    """
+    Calculate weighted threat score.
+
+    Score = (attack_weight * attack_rate) +
+            (scanner_weight * scanner_rate) +
+            (error_weight * error_rate) +
+            (diversity_weight * path_diversity_score)
+    """
+    weights = config["signal_weights"]
+
+    # Attack pattern rate (0-100)
+    attack_rate = min(100, (self.attack_pattern_hits / max(1, self.total_requests)) * 100)
+
+    # Scanner user agent rate (0-100)
+    scanner_rate = min(100, (self.scanner_ua_hits / max(1, self.total_requests)) * 100)
+
+    # Error rate (0-100)
+    error_rate = min(100, (self.error_responses / max(1, self.total_requests)) * 100)
+
+    # Path diversity (many unique paths = scanner behavior)
+    diversity = min(100, len(self.unique_paths) * 2)
+
+    score = (
+        weights["attack_pattern"] * attack_rate +
+        weights["scanner_ua"] * scanner_rate +
+        weights["error_rate"] * error_rate +
+        weights["path_diversity"] * diversity
+    )
+
+    return score, breakdown
+```
+
+### 7.4 Default Configuration
+
+```python
+DEFAULT_THREAT_SIGNALS_CONFIG = {
+    "min_threat_score": 40,  # Minimum score to confirm as malicious
+    "signal_weights": {
+        "attack_pattern": 0.5,   # 50% weight
+        "scanner_ua": 0.2,       # 20% weight
+        "error_rate": 0.15,      # 15% weight
+        "path_diversity": 0.15,  # 15% weight
+    },
+}
+```
+
+---
+
+## 8. Athena Integration
+
+### 8.1 When to Use Athena
+
+| Scenario | Recommended Approach |
+|----------|---------------------|
+| < 100 log files | Direct S3 fetch |
+| 100-1000 log files | Direct S3 fetch (parallel) |
+| > 1000 log files | Athena query |
+| Historical analysis | Athena query |
+| Real-time blocking | Direct S3 fetch |
+
+### 8.2 Table Schema
+
+```sql
+CREATE EXTERNAL TABLE alb_logs (
+    type string,
+    time string,
+    elb string,
+    client_ip string,
+    client_port int,
+    target_ip string,
+    target_port int,
+    request_processing_time double,
+    target_processing_time double,
+    response_processing_time double,
+    elb_status_code int,
+    target_status_code string,
+    received_bytes bigint,
+    sent_bytes bigint,
+    request_verb string,
+    request_url string,
+    request_proto string,
+    user_agent string,
+    -- ... additional fields
+)
+ROW FORMAT SERDE 'org.apache.hadoop.hive.serde2.RegexSerDe'
+LOCATION 's3://your-bucket/alb-logs/'
+```
+
+### 8.3 Query Strategy
+
+```sql
+SELECT
+    client_ip,
+    COUNT(*) as hit_count
+FROM alb_logs
+WHERE
+    time >= '2026-01-08T00:00:00'
+    AND (
+        request_url LIKE '%../%'
+        OR request_url LIKE '%.env%'
+        OR request_url LIKE '%<script%'
+        -- Additional patterns
+    )
+GROUP BY client_ip
+HAVING COUNT(*) >= 50
+ORDER BY hit_count DESC
+LIMIT 10000
+```
+
+### 8.4 Configuration
+
+```bash
+--athena                           # Enable Athena mode
+--athena-database "security_logs"  # Athena database
+--athena-output-location "s3://my-bucket/athena-results/"
+```
+
+---
+
+## 9. Observability
+
+### 9.1 Structured Logging
+
+```python
+class JsonFormatter(logging.Formatter):
+    """JSON log formatter for CloudWatch Logs ingestion."""
+
+    def format(self, record: logging.LogRecord) -> str:
+        log_dict = {
+            "timestamp": datetime.now(timezone.utc).isoformat(),
+            "level": record.levelname,
+            "logger": record.name,
+            "message": record.getMessage(),
+            "module": record.module,
+            "function": record.funcName,
+            "line": record.lineno,
+        }
+
+        # Add exception info if present
+        if record.exc_info:
+            log_dict["exception"] = self.formatException(record.exc_info)
+
+        return json.dumps(log_dict)
+```
+
+**Enable with:** `--json-logging`
+
+### 9.2 CloudWatch Metrics
+
+```python
+class CloudWatchMetrics:
+    """Buffered CloudWatch metrics publisher."""
+
+    def put_metric(self, name: str, value: float, unit: str, dimensions: Dict):
+        self._buffer.append({
+            "MetricName": name,
+            "Value": value,
+            "Unit": unit,
+            "Dimensions": [
+                {"Name": k, "Value": v} for k, v in dimensions.items()
+            ],
+        })
+
+    def flush(self):
+        """Batch publish metrics (max 20 per API call)."""
+        for chunk in chunks(self._buffer, 20):
+            self.cloudwatch.put_metric_data(
+                Namespace=self.namespace,
+                MetricData=chunk,
+            )
+```
+
+**Metrics Emitted:**
+
+| Metric | Unit | Description |
+|--------|------|-------------|
+| `LogFilesProcessed` | Count | Number of log files analyzed |
+| `MaliciousIPsDetected` | Count | IPs matching attack patterns |
+| `IPsBlocked` | Count | IPs added to block list |
+| `IPsUnblocked` | Count | Expired blocks removed |
+| `ProcessingTimeMs` | Milliseconds | Total execution time |
+| `S3ProcessingErrors` | Count | S3 fetch failures |
+| `AverageThreatScore` | None | Mean threat score of candidates |
+
+### 9.3 Enhanced Slack Notifications
+
+```python
+class SlackSeverity(Enum):
+    INFO = "#36a64f"      # Green
+    WARNING = "#f2c744"   # Yellow
+    LOW = "#ff9933"       # Orange
+    MEDIUM = "#e07000"    # Dark orange
+    HIGH = "#cc0000"      # Red
+    CRITICAL = "#8b0000"  # Dark red
+```
+
+**Features:**
+- Severity-based color coding
+- Incident threading (related messages grouped)
+- Block Kit formatting with fields
+- Action buttons (informational)
+
+---
+
+## 10. Security Considerations
+
+### 10.1 IAM Permissions (Minimum Required)
+
+```json
+{
+  "Version": "2012-10-17",
+  "Statement": [
+    {
+      "Sid": "ELBAccess",
+      "Effect": "Allow",
+      "Action": [
+        "elasticloadbalancing:DescribeLoadBalancers",
+        "elasticloadbalancing:DescribeLoadBalancerAttributes"
+      ],
+      "Resource": "*"
+    },
+    {
+      "Sid": "EC2NACLAccess",
+      "Effect": "Allow",
+      "Action": [
+        "ec2:DescribeNetworkAcls",
+        "ec2:CreateNetworkAclEntry",
+        "ec2:DeleteNetworkAclEntry",
+        "ec2:ReplaceNetworkAclEntry"
+      ],
+      "Resource": "*"
+    },
+    {
+      "Sid": "S3LogAccess",
+      "Effect": "Allow",
+      "Action": [
+        "s3:GetObject",
+        "s3:ListBucket"
+      ],
+      "Resource": [
+        "arn:aws:s3:::your-log-bucket",
+        "arn:aws:s3:::your-log-bucket/*"
+      ]
+    },
+    {
+      "Sid": "STSIdentity",
+      "Effect": "Allow",
+      "Action": "sts:GetCallerIdentity",
+      "Resource": "*"
+    }
+  ]
+}
+```
+
+### 10.2 Additional Permissions (Optional Features)
+
+```json
+{
+  "Sid": "WAFAccess",
+  "Effect": "Allow",
+  "Action": [
+    "wafv2:GetIPSet",
+    "wafv2:UpdateIPSet",
+    "wafv2:CreateIPSet",
+    "wafv2:ListIPSets"
+  ],
+  "Resource": "*"
+},
+{
+  "Sid": "DynamoDBAccess",
+  "Effect": "Allow",
+  "Action": [
+    "dynamodb:GetItem",
+    "dynamodb:PutItem",
+    "dynamodb:DeleteItem",
+    "dynamodb:CreateTable",
+    "dynamodb:DescribeTable"
+  ],
+  "Resource": "arn:aws:dynamodb:*:*:table/auto-block-*"
+},
+{
+  "Sid": "CloudWatchMetrics",
+  "Effect": "Allow",
+  "Action": "cloudwatch:PutMetricData",
+  "Resource": "*"
+},
+{
+  "Sid": "AthenaAccess",
+  "Effect": "Allow",
+  "Action": [
+    "athena:StartQueryExecution",
+    "athena:GetQueryExecution",
+    "athena:GetQueryResults"
+  ],
+  "Resource": "*"
+}
+```
+
+### 10.3 Security Best Practices
+
+1. **Use IAM Roles**: Avoid access keys; use EC2 instance profiles or ECS task roles
+2. **Least Privilege**: Only grant permissions actually needed
+3. **Encrypt State**: Use S3 server-side encryption or DynamoDB encryption
+4. **Audit Trail**: Enable CloudTrail for NACL/WAF modifications
+5. **Separate Environments**: Use different AWS accounts for dev/staging/prod
+6. **Token Rotation**: Rotate Slack tokens and IPInfo tokens regularly
+7. **Whitelist Review**: Regularly audit whitelist entries
+
+---
+
+## Appendix A: Configuration Reference
+
+See [CLI_GUIDE.md](CLI_GUIDE.md) for complete command-line reference.
+
+## Appendix B: Troubleshooting
+
+See main [README.md](../README.md#troubleshooting) for common issues.
+
+## Appendix C: Migration Guide
+
+### From v1.x to v2.0
+
+1. **Storage Backend**: Default remains `local`; no migration needed
+2. **IPv6**: Enabled by default; use `--disable-ipv6` to disable
+3. **Multi-Signal**: Enabled by default; use `--disable-multi-signal` to disable
+4. **Registry Format**: Backward compatible; old registries load automatically
diff --git a/slack_client.py b/slack_client.py
index bbe3721..b63449e 100644
--- a/slack_client.py
+++ b/slack_client.py
@@ -4,9 +4,35 @@
 from slack_sdk.errors import SlackApiError
 import json
 import os
+from typing import Optional, Dict, List, Any
+from enum import Enum
+
+
+class SlackSeverity(Enum):
+    """Severity levels for Slack notifications with corresponding colors."""
+    INFO = "#36a64f"       # Green - informational
+    WARNING = "#f2c744"    # Yellow - warning
+    LOW = "#ff9933"        # Orange - low threat
+    MEDIUM = "#e07000"     # Dark orange - medium threat
+    HIGH = "#cc0000"       # Red - high threat
+    CRITICAL = "#8b0000"   # Dark red - critical threat
+    SUCCESS = "#2eb886"    # Teal - success
+    ERROR = "#ff0000"      # Bright red - error
+
+
+# Mapping from threat tier names to severity
+TIER_TO_SEVERITY = {
+    "minimal": SlackSeverity.LOW,
+    "low": SlackSeverity.LOW,
+    "medium": SlackSeverity.MEDIUM,
+    "high": SlackSeverity.HIGH,
+    "critical": SlackSeverity.CRITICAL,
+}
 
 
 class SlackBlock(object):
+    """Builder for Slack Block Kit messages."""
+
     def __init__(self):
         self.block = []
 
@@ -41,13 +67,79 @@ def add_image(self, image_url="", alt_text="", title="Example Image"):
 
         self.block.append(img)
 
+    def add_header(self, text: str):
+        """Add a header block."""
+        self.block.append({
+            "type": "header",
+            "text": {"type": "plain_text", "text": text, "emoji": True}
+        })
+
+    def add_context(self, elements: List[str]):
+        """Add a context block with multiple text elements."""
+        self.block.append({
+            "type": "context",
+            "elements": [
+                {"type": "mrkdwn", "text": elem} for elem in elements
+            ]
+        })
+
+    def add_fields(self, fields: List[tuple]):
+        """Add a section with multiple fields (key-value pairs)."""
+        field_elements = []
+        for label, value in fields:
+            field_elements.append({
+                "type": "mrkdwn",
+                "text": f"*{label}:*\n{value}"
+            })
+        self.block.append({
+            "type": "section",
+            "fields": field_elements
+        })
+
+    def add_actions(self, buttons: List[Dict[str, str]]):
+        """
+        Add an actions block with buttons.
+
+        Args:
+            buttons: List of button configs with keys:
+                - text: Button label
+                - action_id: Unique identifier for the action
+                - style: Optional "primary" or "danger"
+                - value: Optional value to pass with the action
+        """
+        elements = []
+        for btn in buttons:
+            button = {
+                "type": "button",
+                "text": {"type": "plain_text", "text": btn["text"], "emoji": True},
+                "action_id": btn["action_id"],
+            }
+            if btn.get("style"):
+                button["style"] = btn["style"]
+            if btn.get("value"):
+                button["value"] = btn["value"]
+            if btn.get("url"):
+                button["url"] = btn["url"]
+            elements.append(button)
+
+        self.block.append({
+            "type": "actions",
+            "elements": elements
+        })
+
     def get_json(self):
         return json.dumps(self.block)
 
 
 class SlackClient(object):
+    """
+    Enhanced Slack client with support for:
+    - Rich formatted messages with Block Kit
+    - Severity-based color coding via attachments
+    - Message threading for incident grouping
+    - Interactive action buttons
+    """
     logger = logging.getLogger(__name__)
-    # logger.setLevel(logging.DEBUG)
 
     def __init__(self, token="", webhook_url="", channel=""):
         self.token = token if token else None
@@ -55,17 +147,39 @@ def __init__(self, token="", webhook_url="", channel=""):
         self.channel = channel
         self.client = self.get_client() if self.token else None
         self.response = None
+        # Thread tracking for incident threading
+        self._active_threads: Dict[str, str] = {}  # incident_id -> thread_ts
 
     def get_client(self):
         return WebClient(token=self.token)
 
-    def post_message(self, message="", channel=""):
+    def get_thread_ts(self, incident_id: str) -> Optional[str]:
+        """Get the thread timestamp for an incident if it exists."""
+        return self._active_threads.get(incident_id)
+
+    def set_thread_ts(self, incident_id: str, thread_ts: str):
+        """Store the thread timestamp for an incident."""
+        self._active_threads[incident_id] = thread_ts
+
+    def clear_thread(self, incident_id: str):
+        """Clear the thread for an incident."""
+        self._active_threads.pop(incident_id, None)
+
+    def post_message(
+        self,
+        message: str = "",
+        channel: str = "",
+        thread_ts: Optional[str] = None,
+        reply_broadcast: bool = False,
+    ) -> bool:
         """
         Posts a text message to a Slack channel.
 
         Args:
             message: The text message to post
             channel: Optional channel override (uses self.channel if not provided)
+            thread_ts: Optional thread timestamp to reply to
+            reply_broadcast: If True and in a thread, also post to channel
 
         Returns:
             bool: True if successful, False otherwise
@@ -88,9 +202,16 @@ def post_message(self, message="", channel=""):
                 "Notifying slack channel [%s] with message: %s"
                 % (target_channel, message)
             )
-            self.response = self.client.chat_postMessage(
-                channel=target_channel, text=message
-            )
+
+            kwargs = {
+                "channel": target_channel,
+                "text": message,
+            }
+            if thread_ts:
+                kwargs["thread_ts"] = thread_ts
+                kwargs["reply_broadcast"] = reply_broadcast
+
+            self.response = self.client.chat_postMessage(**kwargs)
             self.logger.info("Message posted successfully: %s" % self.response)
             return True
         except SlackApiError as err:
@@ -102,6 +223,185 @@ def post_message(self, message="", channel=""):
             self.logger.warning("Whoops... could not post to slack: %s", err)
             return False
 
+    def post_rich_message(
+        self,
+        text: str,
+        blocks: Optional[List[Dict]] = None,
+        attachments: Optional[List[Dict]] = None,
+        severity: Optional[SlackSeverity] = None,
+        channel: str = "",
+        thread_ts: Optional[str] = None,
+        reply_broadcast: bool = False,
+    ) -> Optional[str]:
+        """
+        Posts a rich message with blocks, attachments, and optional color coding.
+
+        Args:
+            text: Fallback text for notifications
+            blocks: Optional list of Block Kit blocks
+            attachments: Optional list of attachments
+            severity: Optional severity level for color coding
+            channel: Optional channel override
+            thread_ts: Optional thread to reply to
+            reply_broadcast: If True and in a thread, also post to channel
+
+        Returns:
+            str: Thread timestamp if successful, None otherwise
+        """
+        if not self.client:
+            self.logger.error("Slack client not initialized.")
+            return None
+
+        if self.token == "test":
+            self.logger.info("Using test token. Wont post anything to slack")
+            return "test_thread_ts"
+
+        try:
+            target_channel = channel if channel else self.channel
+            if not target_channel:
+                self.logger.error("No channel specified")
+                return None
+
+            kwargs: Dict[str, Any] = {
+                "channel": target_channel,
+                "text": text,
+            }
+
+            if blocks:
+                kwargs["blocks"] = blocks
+
+            # Create attachment with severity color if specified
+            if severity:
+                color_attachment = {
+                    "color": severity.value,
+                    "blocks": blocks or [],
+                }
+                kwargs["attachments"] = [color_attachment]
+                # Remove blocks from top level when using attachments
+                kwargs.pop("blocks", None)
+            elif attachments:
+                kwargs["attachments"] = attachments
+
+            if thread_ts:
+                kwargs["thread_ts"] = thread_ts
+                kwargs["reply_broadcast"] = reply_broadcast
+
+            self.response = self.client.chat_postMessage(**kwargs)
+
+            # Return the thread_ts for threading
+            if self.response and self.response.get("ok"):
+                return self.response.get("ts")
+            return None
+
+        except SlackApiError as err:
+            self.logger.warning(
+                "Slack API error: %s", err.response["error"]
+            )
+            return None
+        except Exception as err:
+            self.logger.warning("Error posting rich message: %s", err)
+            return None
+
+    def post_incident_notification(
+        self,
+        title: str,
+        description: str,
+        fields: List[tuple],
+        severity: SlackSeverity = SlackSeverity.INFO,
+        incident_id: Optional[str] = None,
+        action_buttons: Optional[List[Dict[str, str]]] = None,
+        channel: str = "",
+    ) -> Optional[str]:
+        """
+        Posts a formatted incident notification with threading support.
+
+        Args:
+            title: Incident title (header)
+            description: Incident description
+            fields: List of (label, value) tuples for fields
+            severity: Severity level for color coding
+            incident_id: Optional incident ID for threading
+            action_buttons: Optional list of action button configs
+            channel: Optional channel override
+
+        Returns:
+            str: Thread timestamp if successful, None otherwise
+        """
+        # Build blocks
+        blocks = []
+
+        # Header
+        blocks.append({
+            "type": "header",
+            "text": {"type": "plain_text", "text": title, "emoji": True}
+        })
+
+        # Description
+        if description:
+            blocks.append({
+                "type": "section",
+                "text": {"type": "mrkdwn", "text": description}
+            })
+
+        # Fields (in pairs)
+        if fields:
+            field_elements = []
+            for label, value in fields:
+                field_elements.append({
+                    "type": "mrkdwn",
+                    "text": f"*{label}:*\n{value}"
+                })
+            # Slack allows max 10 fields per section
+            for i in range(0, len(field_elements), 10):
+                blocks.append({
+                    "type": "section",
+                    "fields": field_elements[i:i+10]
+                })
+
+        # Divider before actions
+        if action_buttons:
+            blocks.append({"type": "divider"})
+            elements = []
+            for btn in action_buttons:
+                button = {
+                    "type": "button",
+                    "text": {"type": "plain_text", "text": btn["text"], "emoji": True},
+                    "action_id": btn.get("action_id", btn["text"].lower().replace(" ", "_")),
+                }
+                if btn.get("style"):
+                    button["style"] = btn["style"]
+                if btn.get("value"):
+                    button["value"] = btn["value"]
+                if btn.get("url"):
+                    button["url"] = btn["url"]
+                elements.append(button)
+
+            blocks.append({
+                "type": "actions",
+                "elements": elements
+            })
+
+        # Get existing thread if this is a follow-up
+        thread_ts = None
+        if incident_id:
+            thread_ts = self.get_thread_ts(incident_id)
+
+        # Post the message
+        result_ts = self.post_rich_message(
+            text=f"{title}: {description}",
+            blocks=blocks,
+            severity=severity,
+            channel=channel,
+            thread_ts=thread_ts,
+            reply_broadcast=thread_ts is not None,  # Broadcast follow-ups
+        )
+
+        # Store thread_ts for future messages in this incident
+        if result_ts and incident_id and not thread_ts:
+            self.set_thread_ts(incident_id, result_ts)
+
+        return result_ts
+
     def post_blocks(self, blocks=[], channel=""):
         """
         Posts formatted blocks to a Slack channel.
diff --git a/storage_backends.py b/storage_backends.py
new file mode 100644
index 0000000..986a3fd
--- /dev/null
+++ b/storage_backends.py
@@ -0,0 +1,866 @@
+"""
+Storage Backend Abstraction Layer for AWS Auto Block Attackers
+
+This module provides pluggable storage backends for the block registry,
+enabling deployment in containerized environments (ECS Fargate, Lambda)
+where local filesystem persistence is not reliable.
+
+Supported Backends:
+    - LocalFileBackend: Original JSON file storage (backward compatible)
+    - DynamoDBBackend: Distributed storage with TTL and optimistic locking
+    - S3Backend: Lightweight cloud storage with versioning support
+
+Architecture:
+    All backends implement the StorageBackend abstract base class, ensuring
+    consistent behavior across storage implementations. The factory function
+    create_storage_backend() handles instantiation based on configuration.
+
+Usage:
+    # Via factory (recommended)
+    backend = create_storage_backend(
+        backend_type='dynamodb',
+        dynamodb_table='block-registry',
+        region='us-east-1'
+    )
+
+    # Direct instantiation
+    backend = DynamoDBBackend(table_name='block-registry', region='us-east-1')
+
+    # Operations
+    data = backend.load()
+    backend.save(data)
+    entry = backend.get('1.2.3.4')
+    backend.put('1.2.3.4', {'tier': 'high', ...})
+    backend.delete('1.2.3.4')
+    expired = backend.get_expired(datetime.now(timezone.utc))
+"""
+
+import json
+import logging
+import os
+import time
+from abc import ABC, abstractmethod
+from datetime import datetime, timezone
+from pathlib import Path
+from typing import Dict, Optional, Set, Any
+
+import boto3
+from botocore.config import Config
+from botocore.exceptions import ClientError
+
+logger = logging.getLogger(__name__)
+
+
+class StorageBackend(ABC):
+    """
+    Abstract base class for block registry storage backends.
+
+    All storage backends must implement these methods to ensure consistent
+    behavior across different storage implementations.
+
+    Thread Safety:
+        Implementations should be thread-safe for concurrent read operations.
+        Write operations may require external synchronization depending on
+        the specific backend implementation.
+    """
+
+    @abstractmethod
+    def load(self) -> Dict[str, Dict]:
+        """
+        Load the entire block registry.
+
+        Returns:
+            Dict[str, Dict]: Dictionary mapping IP addresses to their block data.
+                            Returns empty dict if no data exists.
+
+        Raises:
+            StorageError: If the storage is inaccessible or corrupted.
+        """
+        pass
+
+    @abstractmethod
+    def save(self, data: Dict[str, Dict]) -> None:
+        """
+        Save the entire block registry.
+
+        Args:
+            data: Dictionary mapping IP addresses to their block data.
+
+        Raises:
+            StorageError: If the save operation fails.
+        """
+        pass
+
+    @abstractmethod
+    def get(self, ip: str) -> Optional[Dict]:
+        """
+        Get block data for a specific IP address.
+
+        Args:
+            ip: The IP address to look up.
+
+        Returns:
+            Optional[Dict]: Block data if found, None otherwise.
+        """
+        pass
+
+    @abstractmethod
+    def put(self, ip: str, data: Dict) -> None:
+        """
+        Store or update block data for a specific IP address.
+
+        Args:
+            ip: The IP address to store.
+            data: Block data dictionary containing tier, priority, block_until, etc.
+
+        Raises:
+            StorageError: If the put operation fails.
+            ConflictError: If optimistic locking detects a concurrent modification.
+        """
+        pass
+
+    @abstractmethod
+    def delete(self, ip: str) -> None:
+        """
+        Delete block data for a specific IP address.
+
+        Args:
+            ip: The IP address to delete.
+
+        Note:
+            Should not raise an error if the IP doesn't exist.
+        """
+        pass
+
+    @abstractmethod
+    def get_expired(self, now: datetime) -> Set[str]:
+        """
+        Get all IP addresses whose blocks have expired.
+
+        Args:
+            now: Current UTC datetime for expiration comparison.
+
+        Returns:
+            Set[str]: Set of IP addresses with expired blocks.
+        """
+        pass
+
+    def cleanup_old_entries(self, now: datetime, days_old: int = 30) -> int:
+        """
+        Remove entries that expired more than `days_old` days ago.
+
+        Args:
+            now: Current UTC datetime.
+            days_old: Remove entries expired more than this many days ago.
+
+        Returns:
+            int: Number of entries removed.
+        """
+        # Default implementation - subclasses can override for efficiency
+        from datetime import timedelta
+
+        cutoff = now - timedelta(days=days_old)
+        data = self.load()
+        to_remove = []
+
+        for ip, entry in data.items():
+            try:
+                block_until_str = entry.get("block_until")
+                if block_until_str:
+                    block_until = datetime.fromisoformat(block_until_str)
+                    if block_until.tzinfo is None:
+                        block_until = block_until.replace(tzinfo=timezone.utc)
+                    if block_until < cutoff:
+                        to_remove.append(ip)
+            except (ValueError, TypeError) as e:
+                logger.warning(f"Error parsing block_until for {ip}: {e}")
+
+        for ip in to_remove:
+            self.delete(ip)
+
+        if to_remove:
+            logger.info(f"Cleaned up {len(to_remove)} old registry entries")
+
+        return len(to_remove)
+
+
+class StorageError(Exception):
+    """Raised when a storage operation fails."""
+
+    pass
+
+
+class ConflictError(StorageError):
+    """Raised when optimistic locking detects a concurrent modification."""
+
+    pass
+
+
+class LocalFileBackend(StorageBackend):
+    """
+    Local JSON file storage backend.
+
+    This is the original storage mechanism, maintained for backward compatibility
+    and local development. Uses atomic file writes to prevent corruption.
+
+    Attributes:
+        file_path: Path to the JSON registry file.
+
+    Thread Safety:
+        Uses atomic rename for write operations to prevent corruption from
+        concurrent writes, but does not provide true concurrent access safety.
+    """
+
+    def __init__(self, file_path: str = "./block_registry.json"):
+        """
+        Initialize the local file backend.
+
+        Args:
+            file_path: Path to the JSON registry file. Parent directories
+                      will be created if they don't exist.
+        """
+        self.file_path = file_path
+        self._ensure_directory()
+
+    def _ensure_directory(self) -> None:
+        """Ensure the parent directory exists."""
+        parent = Path(self.file_path).parent
+        if parent and str(parent) != ".":
+            parent.mkdir(parents=True, exist_ok=True)
+
+    def load(self) -> Dict[str, Dict]:
+        """Load registry from JSON file."""
+        try:
+            if os.path.exists(self.file_path):
+                with open(self.file_path, "r") as f:
+                    data = json.load(f)
+                    if isinstance(data, dict):
+                        logger.info(f"Loaded block registry with {len(data)} IPs from {self.file_path}")
+                        return data
+                    else:
+                        logger.warning("Block registry has invalid structure. Starting fresh.")
+                        return {}
+            else:
+                logger.info("Block registry file not found. Starting with empty registry.")
+                return {}
+        except json.JSONDecodeError as e:
+            logger.warning(f"Block registry JSON is corrupted: {e}. Starting fresh.")
+            return {}
+        except Exception as e:
+            logger.warning(f"Error loading block registry: {e}. Starting fresh.")
+            return {}
+
+    def save(self, data: Dict[str, Dict]) -> None:
+        """Save registry to JSON file atomically."""
+        try:
+            self._ensure_directory()
+
+            # Write to temp file first, then atomic rename
+            temp_file = f"{self.file_path}.tmp"
+            with open(temp_file, "w") as f:
+                json.dump(data, f, indent=2, default=str)
+            os.rename(temp_file, self.file_path)
+            logger.info(f"Saved block registry with {len(data)} IPs to {self.file_path}")
+        except Exception as e:
+            logger.error(f"Failed to save block registry: {e}")
+            raise StorageError(f"Failed to save registry: {e}") from e
+
+    def get(self, ip: str) -> Optional[Dict]:
+        """Get block data for a specific IP."""
+        data = self.load()
+        return data.get(ip)
+
+    def put(self, ip: str, entry: Dict) -> None:
+        """Store block data for a specific IP."""
+        data = self.load()
+        data[ip] = entry
+        self.save(data)
+
+    def delete(self, ip: str) -> None:
+        """Delete block data for a specific IP."""
+        data = self.load()
+        if ip in data:
+            del data[ip]
+            self.save(data)
+
+    def get_expired(self, now: datetime) -> Set[str]:
+        """Get all IPs with expired blocks."""
+        expired = set()
+        data = self.load()
+
+        for ip, entry in data.items():
+            try:
+                block_until_str = entry.get("block_until")
+                if block_until_str:
+                    block_until = datetime.fromisoformat(block_until_str)
+                    if block_until.tzinfo is None:
+                        block_until = block_until.replace(tzinfo=timezone.utc)
+                    if now >= block_until:
+                        expired.add(ip)
+            except (ValueError, TypeError) as e:
+                logger.warning(f"Error checking expiry for {ip}: {e}")
+
+        return expired
+
+
+class DynamoDBBackend(StorageBackend):
+    """
+    DynamoDB storage backend with TTL and optimistic locking.
+
+    Provides distributed, highly-available storage suitable for containerized
+    deployments. Uses DynamoDB TTL for automatic expiration cleanup and
+    conditional expressions for optimistic locking.
+
+    Table Schema:
+        - ip (String, Partition Key): The blocked IP address
+        - tier (String): Block tier (critical, high, medium, low, minimal)
+        - priority (Number): Numeric priority for slot management
+        - block_until (Number): Unix timestamp, TTL attribute for auto-expiration
+        - block_until_iso (String): ISO format timestamp for human readability
+        - first_seen (String): ISO timestamp of first detection
+        - last_seen (String): ISO timestamp of most recent detection
+        - total_hits (Number): Total malicious request count
+        - block_duration_hours (Number): Duration of the block in hours
+        - version (Number): Optimistic locking version counter
+
+    Required IAM Permissions:
+        - dynamodb:GetItem
+        - dynamodb:PutItem
+        - dynamodb:DeleteItem
+        - dynamodb:Scan
+        - dynamodb:Query
+        - dynamodb:DescribeTable
+        - dynamodb:CreateTable (optional, for auto-creation)
+
+    TTL Configuration:
+        The table should have TTL enabled on the `block_until` attribute
+        for automatic cleanup of expired entries.
+    """
+
+    def __init__(
+        self,
+        table_name: str,
+        region: str = "us-east-1",
+        create_table: bool = False,
+        endpoint_url: Optional[str] = None,
+    ):
+        """
+        Initialize the DynamoDB backend.
+
+        Args:
+            table_name: Name of the DynamoDB table.
+            region: AWS region for the table.
+            create_table: If True, create the table if it doesn't exist.
+            endpoint_url: Optional endpoint URL (for local DynamoDB testing).
+        """
+        self.table_name = table_name
+        self.region = region
+
+        boto_config = Config(
+            connect_timeout=10,
+            read_timeout=30,
+            retries={"max_attempts": 5, "mode": "adaptive"},
+        )
+
+        client_kwargs = {"region_name": region, "config": boto_config}
+        if endpoint_url:
+            client_kwargs["endpoint_url"] = endpoint_url
+
+        self.dynamodb = boto3.client("dynamodb", **client_kwargs)
+        self.table = boto3.resource("dynamodb", **client_kwargs).Table(table_name)
+
+        if create_table:
+            self._ensure_table_exists()
+
+    def _ensure_table_exists(self) -> None:
+        """Create the table if it doesn't exist."""
+        try:
+            self.dynamodb.describe_table(TableName=self.table_name)
+            logger.info(f"DynamoDB table {self.table_name} exists")
+        except ClientError as e:
+            if e.response["Error"]["Code"] == "ResourceNotFoundException":
+                logger.info(f"Creating DynamoDB table {self.table_name}")
+                self._create_table()
+            else:
+                raise StorageError(f"Error checking table: {e}") from e
+
+    def _create_table(self) -> None:
+        """Create the DynamoDB table with appropriate schema."""
+        try:
+            self.dynamodb.create_table(
+                TableName=self.table_name,
+                KeySchema=[{"AttributeName": "ip", "KeyType": "HASH"}],
+                AttributeDefinitions=[{"AttributeName": "ip", "AttributeType": "S"}],
+                BillingMode="PAY_PER_REQUEST",
+            )
+
+            # Wait for table to be active
+            waiter = self.dynamodb.get_waiter("table_exists")
+            waiter.wait(TableName=self.table_name)
+
+            # Enable TTL on block_until attribute
+            self.dynamodb.update_time_to_live(
+                TableName=self.table_name,
+                TimeToLiveSpecification={
+                    "Enabled": True,
+                    "AttributeName": "block_until",
+                },
+            )
+
+            logger.info(f"Created DynamoDB table {self.table_name} with TTL enabled")
+        except ClientError as e:
+            raise StorageError(f"Failed to create table: {e}") from e
+
+    def _serialize_entry(self, ip: str, entry: Dict) -> Dict[str, Any]:
+        """Convert registry entry to DynamoDB item format."""
+        # Convert block_until to Unix timestamp for TTL
+        block_until_ts = None
+        block_until_iso = entry.get("block_until")
+        if block_until_iso:
+            try:
+                dt = datetime.fromisoformat(block_until_iso)
+                if dt.tzinfo is None:
+                    dt = dt.replace(tzinfo=timezone.utc)
+                block_until_ts = int(dt.timestamp())
+            except (ValueError, TypeError):
+                pass
+
+        item = {
+            "ip": ip,
+            "tier": entry.get("tier", "unknown"),
+            "priority": entry.get("priority", 0),
+            "first_seen": entry.get("first_seen", ""),
+            "last_seen": entry.get("last_seen", ""),
+            "total_hits": entry.get("total_hits", 0),
+            "block_duration_hours": entry.get("block_duration_hours", 0),
+            "block_until_iso": block_until_iso or "",
+            "version": entry.get("version", 1),
+        }
+
+        if block_until_ts:
+            item["block_until"] = block_until_ts
+
+        # Preserve any additional fields
+        for key, value in entry.items():
+            if key not in item and key != "block_until":
+                item[key] = value
+
+        return item
+
+    def _deserialize_item(self, item: Dict[str, Any]) -> Dict:
+        """Convert DynamoDB item to registry entry format."""
+        entry = {
+            "tier": item.get("tier", "unknown"),
+            "priority": int(item.get("priority", 0)),
+            "first_seen": item.get("first_seen", ""),
+            "last_seen": item.get("last_seen", ""),
+            "total_hits": int(item.get("total_hits", 0)),
+            "block_duration_hours": float(item.get("block_duration_hours", 0)),
+            "block_until": item.get("block_until_iso", ""),
+            "version": int(item.get("version", 1)),
+        }
+
+        # Include any additional fields
+        for key, value in item.items():
+            if key not in ["ip", "block_until", "block_until_iso", "version"] and key not in entry:
+                entry[key] = value
+
+        return entry
+
+    def load(self) -> Dict[str, Dict]:
+        """Load all entries from DynamoDB."""
+        try:
+            data = {}
+            paginator = self.dynamodb.get_paginator("scan")
+
+            for page in paginator.paginate(TableName=self.table_name):
+                for item in page.get("Items", []):
+                    # Convert DynamoDB format to Python dict
+                    ip = item.get("ip", {}).get("S", "")
+                    if ip:
+                        python_item = self._dynamodb_to_python(item)
+                        data[ip] = self._deserialize_item(python_item)
+
+            logger.info(f"Loaded {len(data)} entries from DynamoDB table {self.table_name}")
+            return data
+        except ClientError as e:
+            logger.error(f"Failed to load from DynamoDB: {e}")
+            raise StorageError(f"Failed to load from DynamoDB: {e}") from e
+
+    def _dynamodb_to_python(self, item: Dict) -> Dict:
+        """Convert DynamoDB typed format to Python dict."""
+        result = {}
+        for key, value in item.items():
+            if "S" in value:
+                result[key] = value["S"]
+            elif "N" in value:
+                result[key] = value["N"]
+            elif "BOOL" in value:
+                result[key] = value["BOOL"]
+            elif "NULL" in value:
+                result[key] = None
+            else:
+                result[key] = value
+        return result
+
+    def save(self, data: Dict[str, Dict]) -> None:
+        """
+        Save all entries to DynamoDB.
+
+        Note: This performs a full replace operation. For large datasets,
+        consider using individual put() calls for better efficiency.
+        """
+        try:
+            # Get existing IPs to handle deletions
+            existing = set(self.load().keys())
+            new_ips = set(data.keys())
+
+            # Delete removed entries
+            for ip in existing - new_ips:
+                self.delete(ip)
+
+            # Put new/updated entries
+            for ip, entry in data.items():
+                self.put(ip, entry)
+
+            logger.info(f"Saved {len(data)} entries to DynamoDB table {self.table_name}")
+        except ClientError as e:
+            logger.error(f"Failed to save to DynamoDB: {e}")
+            raise StorageError(f"Failed to save to DynamoDB: {e}") from e
+
+    def get(self, ip: str) -> Optional[Dict]:
+        """Get block data for a specific IP."""
+        try:
+            response = self.table.get_item(Key={"ip": ip})
+            item = response.get("Item")
+            if item:
+                return self._deserialize_item(item)
+            return None
+        except ClientError as e:
+            logger.error(f"Failed to get {ip} from DynamoDB: {e}")
+            raise StorageError(f"Failed to get from DynamoDB: {e}") from e
+
+    def put(self, ip: str, entry: Dict) -> None:
+        """
+        Store block data with optimistic locking.
+
+        Uses conditional expression to prevent concurrent overwrites.
+        """
+        try:
+            item = self._serialize_entry(ip, entry)
+
+            # Increment version for optimistic locking
+            old_version = entry.get("version", 0)
+            item["version"] = old_version + 1
+
+            # Use conditional expression for optimistic locking
+            if old_version > 0:
+                try:
+                    self.table.put_item(
+                        Item=item,
+                        ConditionExpression="attribute_not_exists(ip) OR version = :v",
+                        ExpressionAttributeValues={":v": old_version},
+                    )
+                except ClientError as e:
+                    if e.response["Error"]["Code"] == "ConditionalCheckFailedException":
+                        # Concurrent modification - retry with fresh data
+                        logger.warning(f"Concurrent modification detected for {ip}, retrying")
+                        existing = self.get(ip)
+                        if existing:
+                            # Merge updates and retry
+                            merged = {**existing, **entry}
+                            merged["version"] = existing.get("version", 0)
+                            self.put(ip, merged)
+                            return
+                        else:
+                            # Entry was deleted, proceed with new entry
+                            item["version"] = 1
+                            self.table.put_item(Item=item)
+                    else:
+                        raise
+            else:
+                self.table.put_item(Item=item)
+
+            logger.debug(f"Stored {ip} in DynamoDB (version {item['version']})")
+        except ClientError as e:
+            if e.response["Error"]["Code"] == "ConditionalCheckFailedException":
+                raise ConflictError(f"Concurrent modification for {ip}") from e
+            logger.error(f"Failed to put {ip} to DynamoDB: {e}")
+            raise StorageError(f"Failed to put to DynamoDB: {e}") from e
+
+    def delete(self, ip: str) -> None:
+        """Delete block data for a specific IP."""
+        try:
+            self.table.delete_item(Key={"ip": ip})
+            logger.debug(f"Deleted {ip} from DynamoDB")
+        except ClientError as e:
+            # Ignore if item doesn't exist
+            if e.response["Error"]["Code"] != "ResourceNotFoundException":
+                logger.error(f"Failed to delete {ip} from DynamoDB: {e}")
+                raise StorageError(f"Failed to delete from DynamoDB: {e}") from e
+
+    def get_expired(self, now: datetime) -> Set[str]:
+        """Get all IPs with expired blocks."""
+        expired = set()
+        now_ts = int(now.timestamp())
+
+        try:
+            # Scan for items where block_until < now
+            # Note: In production, consider using a GSI for more efficient queries
+            paginator = self.dynamodb.get_paginator("scan")
+
+            for page in paginator.paginate(
+                TableName=self.table_name,
+                FilterExpression="block_until < :now",
+                ExpressionAttributeValues={":now": {"N": str(now_ts)}},
+            ):
+                for item in page.get("Items", []):
+                    ip = item.get("ip", {}).get("S", "")
+                    if ip:
+                        expired.add(ip)
+
+            return expired
+        except ClientError as e:
+            logger.error(f"Failed to get expired entries from DynamoDB: {e}")
+            raise StorageError(f"Failed to get expired: {e}") from e
+
+    def cleanup_old_entries(self, now: datetime, days_old: int = 30) -> int:
+        """
+        DynamoDB TTL handles this automatically.
+
+        Returns 0 as entries are auto-deleted by DynamoDB when TTL expires.
+        """
+        # DynamoDB TTL handles automatic deletion
+        logger.info("DynamoDB TTL handles automatic cleanup of expired entries")
+        return 0
+
+
+class S3Backend(StorageBackend):
+    """
+    S3 storage backend with versioning support.
+
+    Provides a lightweight cloud storage option using S3. Uses ETags for
+    conflict detection and supports S3 versioning for data protection.
+
+    Storage Format:
+        The registry is stored as a single JSON file in the specified bucket.
+        S3 versioning is recommended for recovery from accidental deletions.
+
+    Required IAM Permissions:
+        - s3:GetObject
+        - s3:PutObject
+        - s3:DeleteObject
+        - s3:ListBucket
+        - s3:GetObjectVersion (if versioning enabled)
+
+    ETag-Based Conflict Detection:
+        Uses S3 ETags to detect concurrent modifications. If a conflict is
+        detected, the operation will retry with the latest data.
+    """
+
+    def __init__(
+        self,
+        bucket: str,
+        key: str = "block_registry.json",
+        region: str = "us-east-1",
+        endpoint_url: Optional[str] = None,
+    ):
+        """
+        Initialize the S3 backend.
+
+        Args:
+            bucket: S3 bucket name.
+            key: S3 object key for the registry file.
+            region: AWS region for the bucket.
+            endpoint_url: Optional endpoint URL (for S3-compatible storage).
+        """
+        self.bucket = bucket
+        self.key = key
+        self.region = region
+        self._etag: Optional[str] = None
+
+        boto_config = Config(
+            connect_timeout=10,
+            read_timeout=30,
+            retries={"max_attempts": 5, "mode": "adaptive"},
+        )
+
+        client_kwargs = {"region_name": region, "config": boto_config}
+        if endpoint_url:
+            client_kwargs["endpoint_url"] = endpoint_url
+
+        self.s3 = boto3.client("s3", **client_kwargs)
+
+    def load(self) -> Dict[str, Dict]:
+        """Load registry from S3."""
+        try:
+            response = self.s3.get_object(Bucket=self.bucket, Key=self.key)
+            self._etag = response.get("ETag", "").strip('"')
+            data = json.loads(response["Body"].read().decode("utf-8"))
+
+            if isinstance(data, dict):
+                logger.info(f"Loaded {len(data)} entries from s3://{self.bucket}/{self.key}")
+                return data
+            else:
+                logger.warning("S3 registry has invalid structure. Starting fresh.")
+                return {}
+        except ClientError as e:
+            if e.response["Error"]["Code"] == "NoSuchKey":
+                logger.info("S3 registry not found. Starting with empty registry.")
+                self._etag = None
+                return {}
+            logger.error(f"Failed to load from S3: {e}")
+            raise StorageError(f"Failed to load from S3: {e}") from e
+        except json.JSONDecodeError as e:
+            logger.warning(f"S3 registry JSON is corrupted: {e}. Starting fresh.")
+            self._etag = None
+            return {}
+
+    def save(self, data: Dict[str, Dict]) -> None:
+        """
+        Save registry to S3 with ETag-based conflict detection.
+
+        Uses conditional put to prevent overwriting concurrent changes.
+        """
+        try:
+            body = json.dumps(data, indent=2, default=str)
+
+            put_kwargs = {
+                "Bucket": self.bucket,
+                "Key": self.key,
+                "Body": body.encode("utf-8"),
+                "ContentType": "application/json",
+            }
+
+            # Use ETag for optimistic locking if we have one
+            if self._etag:
+                put_kwargs["Metadata"] = {"previous-etag": self._etag}
+
+            response = self.s3.put_object(**put_kwargs)
+            self._etag = response.get("ETag", "").strip('"')
+
+            logger.info(f"Saved {len(data)} entries to s3://{self.bucket}/{self.key}")
+        except ClientError as e:
+            logger.error(f"Failed to save to S3: {e}")
+            raise StorageError(f"Failed to save to S3: {e}") from e
+
+    def get(self, ip: str) -> Optional[Dict]:
+        """Get block data for a specific IP."""
+        data = self.load()
+        return data.get(ip)
+
+    def put(self, ip: str, entry: Dict) -> None:
+        """Store block data for a specific IP."""
+        max_retries = 3
+        for attempt in range(max_retries):
+            try:
+                data = self.load()
+                data[ip] = entry
+                self.save(data)
+                return
+            except StorageError as e:
+                if attempt < max_retries - 1:
+                    logger.warning(f"Retry {attempt + 1}/{max_retries} for put({ip})")
+                    time.sleep(0.5 * (attempt + 1))
+                else:
+                    raise
+
+    def delete(self, ip: str) -> None:
+        """Delete block data for a specific IP."""
+        try:
+            data = self.load()
+            if ip in data:
+                del data[ip]
+                self.save(data)
+        except StorageError:
+            pass  # Ignore errors when deleting non-existent entries
+
+    def get_expired(self, now: datetime) -> Set[str]:
+        """Get all IPs with expired blocks."""
+        expired = set()
+        data = self.load()
+
+        for ip, entry in data.items():
+            try:
+                block_until_str = entry.get("block_until")
+                if block_until_str:
+                    block_until = datetime.fromisoformat(block_until_str)
+                    if block_until.tzinfo is None:
+                        block_until = block_until.replace(tzinfo=timezone.utc)
+                    if now >= block_until:
+                        expired.add(ip)
+            except (ValueError, TypeError) as e:
+                logger.warning(f"Error checking expiry for {ip}: {e}")
+
+        return expired
+
+
+def create_storage_backend(
+    backend_type: str = "local",
+    local_file: str = "./block_registry.json",
+    dynamodb_table: Optional[str] = None,
+    s3_bucket: Optional[str] = None,
+    s3_key: str = "block_registry.json",
+    region: str = "us-east-1",
+    create_dynamodb_table: bool = False,
+) -> StorageBackend:
+    """
+    Factory function to create the appropriate storage backend.
+
+    Args:
+        backend_type: One of 'local', 'dynamodb', or 's3'.
+        local_file: Path for local file backend.
+        dynamodb_table: Table name for DynamoDB backend.
+        s3_bucket: Bucket name for S3 backend.
+        s3_key: Object key for S3 backend.
+        region: AWS region for cloud backends.
+        create_dynamodb_table: Whether to create DynamoDB table if missing.
+
+    Returns:
+        StorageBackend: Configured storage backend instance.
+
+    Raises:
+        ValueError: If required parameters are missing for the selected backend.
+
+    Example:
+        # Local backend (default)
+        backend = create_storage_backend()
+
+        # DynamoDB backend
+        backend = create_storage_backend(
+            backend_type='dynamodb',
+            dynamodb_table='block-registry',
+            region='us-east-1'
+        )
+
+        # S3 backend
+        backend = create_storage_backend(
+            backend_type='s3',
+            s3_bucket='my-security-bucket',
+            s3_key='config/block_registry.json'
+        )
+    """
+    backend_type = backend_type.lower()
+
+    if backend_type == "local":
+        logger.info(f"Using local file storage backend: {local_file}")
+        return LocalFileBackend(file_path=local_file)
+
+    elif backend_type == "dynamodb":
+        if not dynamodb_table:
+            raise ValueError("dynamodb_table is required for DynamoDB backend")
+        logger.info(f"Using DynamoDB storage backend: {dynamodb_table}")
+        return DynamoDBBackend(
+            table_name=dynamodb_table,
+            region=region,
+            create_table=create_dynamodb_table,
+        )
+
+    elif backend_type == "s3":
+        if not s3_bucket:
+            raise ValueError("s3_bucket is required for S3 backend")
+        logger.info(f"Using S3 storage backend: s3://{s3_bucket}/{s3_key}")
+        return S3Backend(bucket=s3_bucket, key=s3_key, region=region)
+
+    else:
+        raise ValueError(f"Unknown backend type: {backend_type}. Use 'local', 'dynamodb', or 's3'")
diff --git a/tests/test_auto_block_attackers.py b/tests/test_auto_block_attackers.py
index fa5b7ed..0444e55 100644
--- a/tests/test_auto_block_attackers.py
+++ b/tests/test_auto_block_attackers.py
@@ -10,10 +10,11 @@
 from collections import Counter
 import sys
 import os
+import logging
 
 # Add parent directory to path to import the module
 sys.path.insert(0, os.path.dirname(os.path.abspath(__file__)))
-from auto_block_attackers import NaclAutoBlocker, is_valid_public_ipv4, ATTACK_PATTERNS
+from auto_block_attackers import NaclAutoBlocker, is_valid_public_ipv4, is_valid_public_ip, ATTACK_PATTERNS
 
 
 class TestHelperFunctions(unittest.TestCase):
@@ -38,6 +39,60 @@ def test_is_valid_public_ipv4_invalid(self):
         self.assertFalse(is_valid_public_ipv4("256.1.1.1"))
         self.assertFalse(is_valid_public_ipv4("2001:db8::1"))  # IPv6
 
+    def test_is_valid_public_ip_ipv4(self):
+        """Test is_valid_public_ip with valid IPv4 addresses"""
+        is_valid, version = is_valid_public_ip("8.8.8.8")
+        self.assertTrue(is_valid)
+        self.assertEqual(version, 4)
+
+        is_valid, version = is_valid_public_ip("1.1.1.1")
+        self.assertTrue(is_valid)
+        self.assertEqual(version, 4)
+
+    def test_is_valid_public_ip_ipv6(self):
+        """Test is_valid_public_ip with valid IPv6 addresses"""
+        # Google's public IPv6 DNS
+        is_valid, version = is_valid_public_ip("2001:4860:4860::8888")
+        self.assertTrue(is_valid)
+        self.assertEqual(version, 6)
+
+    def test_is_valid_public_ip_private_ipv4(self):
+        """Test is_valid_public_ip rejects private IPv4"""
+        is_valid, version = is_valid_public_ip("192.168.1.1")
+        self.assertFalse(is_valid)
+        self.assertEqual(version, 4)
+
+        is_valid, version = is_valid_public_ip("10.0.0.1")
+        self.assertFalse(is_valid)
+        self.assertEqual(version, 4)
+
+    def test_is_valid_public_ip_private_ipv6(self):
+        """Test is_valid_public_ip rejects private/local IPv6"""
+        # Link-local address
+        is_valid, version = is_valid_public_ip("fe80::1")
+        self.assertFalse(is_valid)
+        self.assertEqual(version, 6)
+
+        # Loopback
+        is_valid, version = is_valid_public_ip("::1")
+        self.assertFalse(is_valid)
+        self.assertEqual(version, 6)
+
+        # Unique local (fc00::/7)
+        is_valid, version = is_valid_public_ip("fd00::1")
+        self.assertFalse(is_valid)
+        self.assertEqual(version, 6)
+
+    def test_is_valid_public_ip_invalid(self):
+        """Test is_valid_public_ip with invalid addresses"""
+        is_valid, version = is_valid_public_ip("not_an_ip")
+        self.assertFalse(is_valid)
+        self.assertEqual(version, 0)
+
+        is_valid, version = is_valid_public_ip("256.1.1.1")
+        self.assertFalse(is_valid)
+        self.assertEqual(version, 0)
+
     def test_attack_patterns_detection(self):
         """Test that attack patterns detect malicious requests"""
         malicious_samples = [
@@ -424,8 +479,863 @@ def test_download_and_parse_log(self, mock_boto_client):
 
         result = blocker._download_and_parse_log("test-bucket", "test-key")
 
-        # Should extract the IP address
-        self.assertEqual(result, ["1.2.3.4"])
+        # Should extract the IP address with version (now returns tuples)
+        self.assertEqual(result, [("1.2.3.4", 4)])
+
+
+class TestWAFIntegration(unittest.TestCase):
+    """Test AWS WAF IP Set integration"""
+
+    @patch("boto3.client")
+    def test_waf_disabled_by_default(self, mock_boto_client):
+        """Test that WAF is disabled when no IP set name/ID is provided"""
+        mock_ec2 = MagicMock()
+        mock_elbv2 = MagicMock()
+        mock_s3 = MagicMock()
+        mock_sts = MagicMock()
+
+        def client_factory(service, **kwargs):
+            clients = {
+                "ec2": mock_ec2,
+                "elbv2": mock_elbv2,
+                "s3": mock_s3,
+                "sts": mock_sts,
+            }
+            return clients.get(service, MagicMock())
+
+        mock_boto_client.side_effect = client_factory
+
+        blocker = NaclAutoBlocker(
+            lb_name_pattern="test",
+            region="us-east-1",
+            lookback_str="1h",
+            threshold=10,
+            start_rule=80,
+            limit=20,
+            whitelist_file=None,
+            aws_ip_ranges_file=None,
+            dry_run=True,
+            debug=False
+        )
+
+        self.assertFalse(blocker._waf_enabled)
+        self.assertIsNone(blocker.wafv2)
+
+    @patch("boto3.client")
+    def test_waf_enabled_with_ip_set_name(self, mock_boto_client):
+        """Test that WAF is enabled when IP set name is provided"""
+        mock_ec2 = MagicMock()
+        mock_elbv2 = MagicMock()
+        mock_s3 = MagicMock()
+        mock_sts = MagicMock()
+        mock_wafv2 = MagicMock()
+
+        # Mock WAF IP set search (not found, and not creating)
+        mock_wafv2.get_paginator.return_value.paginate.return_value = [{"IPSets": []}]
+
+        def client_factory(service, **kwargs):
+            clients = {
+                "ec2": mock_ec2,
+                "elbv2": mock_elbv2,
+                "s3": mock_s3,
+                "sts": mock_sts,
+                "wafv2": mock_wafv2,
+            }
+            return clients.get(service, MagicMock())
+
+        mock_boto_client.side_effect = client_factory
+
+        blocker = NaclAutoBlocker(
+            lb_name_pattern="test",
+            region="us-east-1",
+            lookback_str="1h",
+            threshold=10,
+            start_rule=80,
+            limit=20,
+            whitelist_file=None,
+            aws_ip_ranges_file=None,
+            dry_run=True,
+            debug=False,
+            waf_ip_set_name="test-blocklist",
+        )
+
+        # WAF will be disabled because the IP set wasn't found and create_waf_ip_set=False
+        self.assertFalse(blocker._waf_enabled)
+
+    @patch("boto3.client")
+    def test_waf_find_existing_ip_set(self, mock_boto_client):
+        """Test finding an existing WAF IP set by name"""
+        mock_ec2 = MagicMock()
+        mock_elbv2 = MagicMock()
+        mock_s3 = MagicMock()
+        mock_sts = MagicMock()
+        mock_wafv2 = MagicMock()
+
+        # Mock WAF IP set search (found)
+        mock_wafv2.get_paginator.return_value.paginate.return_value = [
+            {"IPSets": [{"Name": "test-blocklist", "Id": "abc-123"}]}
+        ]
+        mock_wafv2.get_ip_set.return_value = {
+            "IPSet": {"Name": "test-blocklist", "Addresses": []},
+            "LockToken": "lock-token-123"
+        }
+
+        def client_factory(service, **kwargs):
+            clients = {
+                "ec2": mock_ec2,
+                "elbv2": mock_elbv2,
+                "s3": mock_s3,
+                "sts": mock_sts,
+                "wafv2": mock_wafv2,
+            }
+            return clients.get(service, MagicMock())
+
+        mock_boto_client.side_effect = client_factory
+
+        blocker = NaclAutoBlocker(
+            lb_name_pattern="test",
+            region="us-east-1",
+            lookback_str="1h",
+            threshold=10,
+            start_rule=80,
+            limit=20,
+            whitelist_file=None,
+            aws_ip_ranges_file=None,
+            dry_run=True,
+            debug=False,
+            waf_ip_set_name="test-blocklist",
+        )
+
+        self.assertTrue(blocker._waf_enabled)
+        self.assertEqual(blocker._waf_ip_set_id, "abc-123")
+
+    @patch("boto3.client")
+    def test_waf_get_statistics(self, mock_boto_client):
+        """Test WAF statistics when disabled"""
+        mock_ec2 = MagicMock()
+        mock_elbv2 = MagicMock()
+        mock_s3 = MagicMock()
+        mock_sts = MagicMock()
+
+        def client_factory(service, **kwargs):
+            clients = {
+                "ec2": mock_ec2,
+                "elbv2": mock_elbv2,
+                "s3": mock_s3,
+                "sts": mock_sts,
+            }
+            return clients.get(service, MagicMock())
+
+        mock_boto_client.side_effect = client_factory
+
+        blocker = NaclAutoBlocker(
+            lb_name_pattern="test",
+            region="us-east-1",
+            lookback_str="1h",
+            threshold=10,
+            start_rule=80,
+            limit=20,
+            whitelist_file=None,
+            aws_ip_ranges_file=None,
+            dry_run=True,
+            debug=False
+        )
+
+        stats = blocker._get_waf_statistics()
+        self.assertFalse(stats["enabled"])
+
+    @patch("boto3.client")
+    def test_waf_cloudfront_uses_us_east_1(self, mock_boto_client):
+        """Test that CloudFront scope WAF uses us-east-1 region"""
+        mock_ec2 = MagicMock()
+        mock_elbv2 = MagicMock()
+        mock_s3 = MagicMock()
+        mock_sts = MagicMock()
+        mock_wafv2 = MagicMock()
+
+        # Mock WAF IP set search (not found)
+        mock_wafv2.get_paginator.return_value.paginate.return_value = [{"IPSets": []}]
+
+        regions_used = []
+
+        def client_factory(service, **kwargs):
+            if service == "wafv2":
+                regions_used.append(kwargs.get("region_name"))
+            clients = {
+                "ec2": mock_ec2,
+                "elbv2": mock_elbv2,
+                "s3": mock_s3,
+                "sts": mock_sts,
+                "wafv2": mock_wafv2,
+            }
+            return clients.get(service, MagicMock())
+
+        mock_boto_client.side_effect = client_factory
+
+        blocker = NaclAutoBlocker(
+            lb_name_pattern="test",
+            region="ap-southeast-2",  # Non-US region
+            lookback_str="1h",
+            threshold=10,
+            start_rule=80,
+            limit=20,
+            whitelist_file=None,
+            aws_ip_ranges_file=None,
+            dry_run=True,
+            debug=False,
+            waf_ip_set_name="test-blocklist",
+            waf_ip_set_scope="CLOUDFRONT",
+        )
+
+        # WAF client should have been created with us-east-1 for CloudFront
+        self.assertIn("us-east-1", regions_used)
+
+
+class TestLoggingAndMetrics(unittest.TestCase):
+    """Test structured logging and CloudWatch metrics"""
+
+    def test_json_formatter(self):
+        """Test JsonFormatter produces valid JSON"""
+        from auto_block_attackers import JsonFormatter
+        import json as json_mod
+
+        formatter = JsonFormatter()
+
+        # Create a mock log record
+        record = logging.LogRecord(
+            name="test",
+            level=logging.INFO,
+            pathname="test.py",
+            lineno=10,
+            msg="Test message",
+            args=(),
+            exc_info=None,
+        )
+
+        output = formatter.format(record)
+
+        # Should be valid JSON
+        parsed = json_mod.loads(output)
+        self.assertEqual(parsed["level"], "INFO")
+        self.assertEqual(parsed["message"], "Test message")
+        self.assertIn("timestamp", parsed)
+
+    def test_cloudwatch_metrics_disabled_by_default(self):
+        """Test CloudWatch metrics are disabled when not requested"""
+        from auto_block_attackers import CloudWatchMetrics
+
+        metrics = CloudWatchMetrics(enabled=False)
+        self.assertFalse(metrics.enabled)
+
+        # Should not raise when putting metrics while disabled
+        metrics.put_count("TestMetric", 1)
+        metrics.put_timing("TestTiming", 1.0)
+        metrics.flush()  # Should be a no-op
+
+    def test_cloudwatch_metrics_dry_run(self):
+        """Test CloudWatch metrics in dry run mode"""
+        from auto_block_attackers import CloudWatchMetrics
+
+        metrics = CloudWatchMetrics(enabled=True, dry_run=True)
+
+        # Put some metrics
+        metrics.put_count("TestMetric", 5, {"Region": "us-east-1"})
+        metrics.put_timing("TestTiming", 1.5)
+
+        # Flush should not raise in dry run mode
+        metrics.flush()
+
+        # Buffer should be cleared after flush
+        self.assertEqual(len(metrics._metric_buffer), 0)
+
+    @patch("boto3.client")
+    def test_nacl_blocker_with_json_logging(self, mock_boto_client):
+        """Test NaclAutoBlocker initializes with JSON logging"""
+        mock_ec2 = MagicMock()
+        mock_elbv2 = MagicMock()
+        mock_s3 = MagicMock()
+        mock_sts = MagicMock()
+
+        def client_factory(service, **kwargs):
+            clients = {
+                "ec2": mock_ec2,
+                "elbv2": mock_elbv2,
+                "s3": mock_s3,
+                "sts": mock_sts,
+            }
+            return clients.get(service, MagicMock())
+
+        mock_boto_client.side_effect = client_factory
+
+        blocker = NaclAutoBlocker(
+            lb_name_pattern="test",
+            region="us-east-1",
+            lookback_str="1h",
+            threshold=10,
+            start_rule=80,
+            limit=20,
+            whitelist_file=None,
+            aws_ip_ranges_file=None,
+            dry_run=True,
+            debug=False,
+            json_logging=True,
+        )
+
+        # Verify metrics object is created
+        self.assertIsNotNone(blocker._metrics)
+        self.assertFalse(blocker._metrics.enabled)  # Not enabled by default
+
+    @patch("boto3.client")
+    def test_nacl_blocker_with_metrics_enabled(self, mock_boto_client):
+        """Test NaclAutoBlocker initializes with CloudWatch metrics enabled"""
+        mock_ec2 = MagicMock()
+        mock_elbv2 = MagicMock()
+        mock_s3 = MagicMock()
+        mock_sts = MagicMock()
+        mock_cloudwatch = MagicMock()
+
+        def client_factory(service, **kwargs):
+            clients = {
+                "ec2": mock_ec2,
+                "elbv2": mock_elbv2,
+                "s3": mock_s3,
+                "sts": mock_sts,
+                "cloudwatch": mock_cloudwatch,
+            }
+            return clients.get(service, MagicMock())
+
+        mock_boto_client.side_effect = client_factory
+
+        blocker = NaclAutoBlocker(
+            lb_name_pattern="test",
+            region="us-east-1",
+            lookback_str="1h",
+            threshold=10,
+            start_rule=80,
+            limit=20,
+            whitelist_file=None,
+            aws_ip_ranges_file=None,
+            dry_run=True,
+            debug=False,
+            enable_cloudwatch_metrics=True,
+            cloudwatch_namespace="TestNamespace",
+        )
+
+        # Verify metrics object is created and enabled (though in dry_run)
+        self.assertIsNotNone(blocker._metrics)
+
+
+class TestMultiSignalDetection(unittest.TestCase):
+    """Test multi-signal threat detection"""
+
+    def test_threat_signals_initialization(self):
+        """Test ThreatSignals class initialization"""
+        from auto_block_attackers import ThreatSignals
+
+        signals = ThreatSignals()
+        self.assertEqual(signals.attack_pattern_hits, 0)
+        self.assertEqual(signals.scanner_ua_hits, 0)
+        self.assertEqual(signals.error_responses, 0)
+        self.assertEqual(signals.total_requests, 0)
+        self.assertEqual(len(signals.unique_paths), 0)
+
+    def test_threat_signals_add_request(self):
+        """Test adding requests to ThreatSignals"""
+        from auto_block_attackers import ThreatSignals
+
+        signals = ThreatSignals()
+        signals.add_request(
+            has_attack_pattern=True,
+            has_scanner_ua=True,
+            status_code=404,
+            path="/admin.php",
+        )
+
+        self.assertEqual(signals.attack_pattern_hits, 1)
+        self.assertEqual(signals.scanner_ua_hits, 1)
+        self.assertEqual(signals.error_responses, 1)
+        self.assertEqual(signals.total_requests, 1)
+        self.assertIn("/admin.php", signals.unique_paths)
+
+    def test_threat_signals_score_calculation(self):
+        """Test threat score calculation"""
+        from auto_block_attackers import ThreatSignals, DEFAULT_THREAT_SIGNALS_CONFIG
+
+        signals = ThreatSignals()
+
+        # Add 10 requests, all with attack patterns and from scanner
+        for i in range(10):
+            signals.add_request(
+                has_attack_pattern=True,
+                has_scanner_ua=True,
+                status_code=404,
+                path=f"/path{i}",
+            )
+
+        score, breakdown = signals.calculate_threat_score(DEFAULT_THREAT_SIGNALS_CONFIG)
+
+        # Should have high score
+        self.assertGreater(score, 60)
+        self.assertIn("attack_pattern", breakdown)
+        self.assertIn("scanner_ua", breakdown)
+
+    def test_threat_signals_benign_traffic(self):
+        """Test that benign traffic gets low threat score"""
+        from auto_block_attackers import ThreatSignals, DEFAULT_THREAT_SIGNALS_CONFIG
+
+        signals = ThreatSignals()
+
+        # Add 100 normal requests (no attack patterns, no scanner UA)
+        for i in range(100):
+            signals.add_request(
+                has_attack_pattern=False,
+                has_scanner_ua=False,
+                status_code=200,
+                path="/",
+            )
+
+        is_malicious, score, _ = signals.is_malicious(DEFAULT_THREAT_SIGNALS_CONFIG)
+
+        # Should NOT be considered malicious
+        self.assertFalse(is_malicious)
+        self.assertLess(score, DEFAULT_THREAT_SIGNALS_CONFIG["min_threat_score"])
+
+    def test_scanner_user_agent_pattern(self):
+        """Test SCANNER_USER_AGENTS pattern matching"""
+        from auto_block_attackers import SCANNER_USER_AGENTS
+
+        # Known scanner user agents
+        scanner_agents = [
+            "Mozilla/5.0 zgrab/0.x",
+            "Nmap Scripting Engine",
+            "sqlmap/1.5",
+            "python-requests/2.25",
+            "Go-http-client/1.1",
+            "Nikto/2.1.6",
+            "curl/7.68.0",
+            "wget/1.20.3",
+        ]
+
+        for ua in scanner_agents:
+            self.assertTrue(
+                bool(SCANNER_USER_AGENTS.search(ua)),
+                f"Should detect scanner UA: {ua}",
+            )
+
+        # Normal user agents
+        normal_agents = [
+            "Mozilla/5.0 (Windows NT 10.0; Win64; x64) Chrome/91.0",
+            "Mozilla/5.0 (iPhone; CPU iPhone OS 14_6 like Mac OS X)",
+            "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) Safari/537.36",
+        ]
+
+        for ua in normal_agents:
+            self.assertFalse(
+                bool(SCANNER_USER_AGENTS.search(ua)),
+                f"Should not flag normal UA: {ua}",
+            )
+
+    @patch("boto3.client")
+    def test_blocker_with_multi_signal_disabled(self, mock_boto_client):
+        """Test NaclAutoBlocker with multi-signal detection disabled"""
+        mock_ec2 = MagicMock()
+        mock_elbv2 = MagicMock()
+        mock_s3 = MagicMock()
+        mock_sts = MagicMock()
+
+        def client_factory(service, **kwargs):
+            clients = {
+                "ec2": mock_ec2,
+                "elbv2": mock_elbv2,
+                "s3": mock_s3,
+                "sts": mock_sts,
+            }
+            return clients.get(service, MagicMock())
+
+        mock_boto_client.side_effect = client_factory
+
+        blocker = NaclAutoBlocker(
+            lb_name_pattern="test",
+            region="us-east-1",
+            lookback_str="1h",
+            threshold=10,
+            start_rule=80,
+            limit=20,
+            whitelist_file=None,
+            aws_ip_ranges_file=None,
+            dry_run=True,
+            debug=False,
+            enable_multi_signal=False,
+        )
+
+        self.assertFalse(blocker._enable_multi_signal)
+
+
+class TestEnhancedSlackNotifications(unittest.TestCase):
+    """Test enhanced Slack notification functionality"""
+
+    @patch('auto_block_attackers.boto3.client')
+    def test_enhanced_slack_disabled_by_default(self, mock_boto_client):
+        """Test that enhanced Slack is disabled by default"""
+        blocker = NaclAutoBlocker(
+            lb_name_pattern="test-*",
+            region="us-east-1",
+            lookback_str="1h",
+            threshold=10,
+            start_rule=80,
+            limit=20,
+            whitelist_file=None,
+            aws_ip_ranges_file=None,
+            dry_run=True,
+            debug=False,
+        )
+
+        self.assertFalse(blocker._enhanced_slack)
+
+    @patch('auto_block_attackers.boto3.client')
+    def test_enhanced_slack_enabled(self, mock_boto_client):
+        """Test that enhanced Slack can be enabled"""
+        blocker = NaclAutoBlocker(
+            lb_name_pattern="test-*",
+            region="us-east-1",
+            lookback_str="1h",
+            threshold=10,
+            start_rule=80,
+            limit=20,
+            whitelist_file=None,
+            aws_ip_ranges_file=None,
+            dry_run=True,
+            debug=False,
+            enhanced_slack=True,
+        )
+
+        self.assertTrue(blocker._enhanced_slack)
+
+    @patch('auto_block_attackers.boto3.client')
+    def test_tier_emoji_mapping(self, mock_boto_client):
+        """Test tier to emoji mapping"""
+        blocker = NaclAutoBlocker(
+            lb_name_pattern="test-*",
+            region="us-east-1",
+            lookback_str="1h",
+            threshold=10,
+            start_rule=80,
+            limit=20,
+            whitelist_file=None,
+            aws_ip_ranges_file=None,
+            dry_run=True,
+            debug=False,
+        )
+
+        self.assertEqual(blocker._get_tier_emoji("critical"), ":rotating_light:")
+        self.assertEqual(blocker._get_tier_emoji("high"), ":red_circle:")
+        self.assertEqual(blocker._get_tier_emoji("medium"), ":large_orange_circle:")
+        self.assertEqual(blocker._get_tier_emoji("low"), ":large_yellow_circle:")
+        self.assertEqual(blocker._get_tier_emoji("minimal"), ":white_circle:")
+        self.assertEqual(blocker._get_tier_emoji("unknown"), ":question:")
+
+    @patch('auto_block_attackers.boto3.client')
+    def test_format_duration(self, mock_boto_client):
+        """Test duration formatting"""
+        blocker = NaclAutoBlocker(
+            lb_name_pattern="test-*",
+            region="us-east-1",
+            lookback_str="1h",
+            threshold=10,
+            start_rule=80,
+            limit=20,
+            whitelist_file=None,
+            aws_ip_ranges_file=None,
+            dry_run=True,
+            debug=False,
+        )
+
+        self.assertEqual(blocker._format_duration(72), "3d")
+        self.assertEqual(blocker._format_duration(24), "1d")
+        self.assertEqual(blocker._format_duration(12), "12h")
+        self.assertEqual(blocker._format_duration(1), "1h")
+        self.assertEqual(blocker._format_duration(0.5), "30m")
+
+    @patch('auto_block_attackers.boto3.client')
+    def test_enhanced_notification_skips_dry_run(self, mock_boto_client):
+        """Test that enhanced notification skips in dry run mode"""
+        blocker = NaclAutoBlocker(
+            lb_name_pattern="test-*",
+            region="us-east-1",
+            lookback_str="1h",
+            threshold=10,
+            start_rule=80,
+            limit=20,
+            whitelist_file=None,
+            aws_ip_ranges_file=None,
+            dry_run=True,
+            debug=False,
+            enhanced_slack=True,
+            slack_token="test-token",
+            slack_channel="test-channel",
+        )
+
+        # Should not raise any errors
+        blocker._send_enhanced_slack_notification(
+            new_offenders={"1.2.3.4"},
+            final_blocked_ips={"1.2.3.4"},
+            ip_counts=Counter({"1.2.3.4": 100}),
+            initially_blocked_ips=set(),
+            active_blocks={"1.2.3.4": {"tier": "high", "block_duration_hours": 72}},
+        )
+
+    @patch('auto_block_attackers.boto3.client')
+    def test_enhanced_notification_skips_no_changes(self, mock_boto_client):
+        """Test that enhanced notification skips when no changes"""
+        blocker = NaclAutoBlocker(
+            lb_name_pattern="test-*",
+            region="us-east-1",
+            lookback_str="1h",
+            threshold=10,
+            start_rule=80,
+            limit=20,
+            whitelist_file=None,
+            aws_ip_ranges_file=None,
+            dry_run=False,
+            debug=False,
+            enhanced_slack=True,
+            slack_token="test-token",
+            slack_channel="test-channel",
+        )
+
+        # Mock the Slack client
+        blocker.slack_client = MagicMock()
+        blocker.slack_client.post_incident_notification = MagicMock(return_value="test_ts")
+
+        # Call with no changes (same blocked IPs)
+        blocker._send_enhanced_slack_notification(
+            new_offenders=set(),
+            final_blocked_ips={"1.2.3.4"},
+            ip_counts=Counter({"1.2.3.4": 100}),
+            initially_blocked_ips={"1.2.3.4"},  # Same as final
+            active_blocks={"1.2.3.4": {"tier": "high", "block_duration_hours": 72}},
+        )
+
+        # Should not have called post_incident_notification
+        blocker.slack_client.post_incident_notification.assert_not_called()
+
+
+class TestAthenaIntegration(unittest.TestCase):
+    """Test Athena integration for large-scale log analysis"""
+
+    @patch('auto_block_attackers.boto3.client')
+    def test_athena_disabled_by_default(self, mock_boto_client):
+        """Test that Athena is disabled by default"""
+        blocker = NaclAutoBlocker(
+            lb_name_pattern="test-*",
+            region="us-east-1",
+            lookback_str="1h",
+            threshold=10,
+            start_rule=80,
+            limit=20,
+            whitelist_file=None,
+            aws_ip_ranges_file=None,
+            dry_run=True,
+            debug=False,
+        )
+
+        self.assertFalse(blocker._athena_enabled)
+
+    @patch('auto_block_attackers.boto3.client')
+    def test_athena_enabled_without_output_location(self, mock_boto_client):
+        """Test that Athena is disabled if no output location provided"""
+        blocker = NaclAutoBlocker(
+            lb_name_pattern="test-*",
+            region="us-east-1",
+            lookback_str="1h",
+            threshold=10,
+            start_rule=80,
+            limit=20,
+            whitelist_file=None,
+            aws_ip_ranges_file=None,
+            dry_run=True,
+            debug=False,
+            athena_enabled=True,
+            athena_output_location=None,  # Missing!
+        )
+
+        # Should be disabled due to missing output location
+        self.assertFalse(blocker._athena_enabled)
+
+    @patch('auto_block_attackers.boto3.client')
+    def test_athena_enabled_with_output_location(self, mock_boto_client):
+        """Test that Athena is enabled when output location provided"""
+        blocker = NaclAutoBlocker(
+            lb_name_pattern="test-*",
+            region="us-east-1",
+            lookback_str="1h",
+            threshold=10,
+            start_rule=80,
+            limit=20,
+            whitelist_file=None,
+            aws_ip_ranges_file=None,
+            dry_run=True,
+            debug=False,
+            athena_enabled=True,
+            athena_output_location="s3://my-bucket/athena-results/",
+        )
+
+        self.assertTrue(blocker._athena_enabled)
+        self.assertEqual(blocker._athena_database, "alb_logs")
+        self.assertEqual(blocker._athena_output_location, "s3://my-bucket/athena-results/")
+
+    @patch('auto_block_attackers.boto3.client')
+    def test_athena_custom_database(self, mock_boto_client):
+        """Test custom Athena database name"""
+        blocker = NaclAutoBlocker(
+            lb_name_pattern="test-*",
+            region="us-east-1",
+            lookback_str="1h",
+            threshold=10,
+            start_rule=80,
+            limit=20,
+            whitelist_file=None,
+            aws_ip_ranges_file=None,
+            dry_run=True,
+            debug=False,
+            athena_enabled=True,
+            athena_database="custom_logs_db",
+            athena_output_location="s3://my-bucket/athena-results/",
+        )
+
+        self.assertEqual(blocker._athena_database, "custom_logs_db")
+
+    @patch('auto_block_attackers.boto3.client')
+    def test_athena_init_lazy(self, mock_boto_client):
+        """Test that Athena client is lazily initialized"""
+        blocker = NaclAutoBlocker(
+            lb_name_pattern="test-*",
+            region="us-east-1",
+            lookback_str="1h",
+            threshold=10,
+            start_rule=80,
+            limit=20,
+            whitelist_file=None,
+            aws_ip_ranges_file=None,
+            dry_run=True,
+            debug=False,
+            athena_enabled=True,
+            athena_output_location="s3://my-bucket/athena-results/",
+        )
+
+        # Athena client should not be initialized yet
+        self.assertIsNone(blocker._athena)
+
+        # Initialize it
+        blocker._init_athena()
+
+        # Should now be initialized (the mock)
+        mock_boto_client.assert_any_call("athena", region_name="us-east-1")
+
+    @patch('auto_block_attackers.boto3.client')
+    def test_process_logs_via_athena_disabled(self, mock_boto_client):
+        """Test that _process_logs_via_athena returns None when disabled"""
+        blocker = NaclAutoBlocker(
+            lb_name_pattern="test-*",
+            region="us-east-1",
+            lookback_str="1h",
+            threshold=10,
+            start_rule=80,
+            limit=20,
+            whitelist_file=None,
+            aws_ip_ranges_file=None,
+            dry_run=True,
+            debug=False,
+            athena_enabled=False,
+        )
+
+        result = blocker._process_logs_via_athena(
+            "s3://bucket/logs/",
+            lookback_hours=1.0,
+        )
+
+        self.assertIsNone(result)
+
+
+class TestSlackClientEnhanced(unittest.TestCase):
+    """Test enhanced SlackClient functionality"""
+
+    def test_slack_severity_colors(self):
+        """Test SlackSeverity enum has correct colors"""
+        from slack_client import SlackSeverity
+
+        self.assertEqual(SlackSeverity.INFO.value, "#36a64f")
+        self.assertEqual(SlackSeverity.WARNING.value, "#f2c744")
+        self.assertEqual(SlackSeverity.LOW.value, "#ff9933")
+        self.assertEqual(SlackSeverity.MEDIUM.value, "#e07000")
+        self.assertEqual(SlackSeverity.HIGH.value, "#cc0000")
+        self.assertEqual(SlackSeverity.CRITICAL.value, "#8b0000")
+
+    def test_tier_to_severity_mapping(self):
+        """Test TIER_TO_SEVERITY mapping"""
+        from slack_client import TIER_TO_SEVERITY, SlackSeverity
+
+        self.assertEqual(TIER_TO_SEVERITY["minimal"], SlackSeverity.LOW)
+        self.assertEqual(TIER_TO_SEVERITY["low"], SlackSeverity.LOW)
+        self.assertEqual(TIER_TO_SEVERITY["medium"], SlackSeverity.MEDIUM)
+        self.assertEqual(TIER_TO_SEVERITY["high"], SlackSeverity.HIGH)
+        self.assertEqual(TIER_TO_SEVERITY["critical"], SlackSeverity.CRITICAL)
+
+    def test_slack_block_add_header(self):
+        """Test SlackBlock add_header method"""
+        from slack_client import SlackBlock
+
+        block = SlackBlock()
+        block.add_header("Test Header")
+
+        blocks = block.block
+        self.assertEqual(len(blocks), 1)
+        self.assertEqual(blocks[0]["type"], "header")
+        self.assertEqual(blocks[0]["text"]["text"], "Test Header")
+
+    def test_slack_block_add_fields(self):
+        """Test SlackBlock add_fields method"""
+        from slack_client import SlackBlock
+
+        block = SlackBlock()
+        block.add_fields([("Label1", "Value1"), ("Label2", "Value2")])
+
+        blocks = block.block
+        self.assertEqual(len(blocks), 1)
+        self.assertEqual(blocks[0]["type"], "section")
+        self.assertEqual(len(blocks[0]["fields"]), 2)
+
+    def test_slack_block_add_actions(self):
+        """Test SlackBlock add_actions method"""
+        from slack_client import SlackBlock
+
+        block = SlackBlock()
+        block.add_actions([
+            {"text": "Button 1", "action_id": "action1"},
+            {"text": "Button 2", "action_id": "action2", "style": "danger"},
+        ])
+
+        blocks = block.block
+        self.assertEqual(len(blocks), 1)
+        self.assertEqual(blocks[0]["type"], "actions")
+        self.assertEqual(len(blocks[0]["elements"]), 2)
+
+    def test_slack_client_thread_tracking(self):
+        """Test SlackClient thread tracking"""
+        from slack_client import SlackClient
+
+        client = SlackClient(token="test", channel="test-channel")
+
+        # Initially no threads
+        self.assertIsNone(client.get_thread_ts("incident_1"))
+
+        # Set a thread
+        client.set_thread_ts("incident_1", "1234567890.123456")
+        self.assertEqual(client.get_thread_ts("incident_1"), "1234567890.123456")
+
+        # Clear the thread
+        client.clear_thread("incident_1")
+        self.assertIsNone(client.get_thread_ts("incident_1"))
 
 
 def run_tests():
@@ -439,6 +1349,12 @@ def run_tests():
     suite.addTests(loader.loadTestsFromTestCase(TestNACLFilterFix))
     suite.addTests(loader.loadTestsFromTestCase(TestSlackIntegration))
     suite.addTests(loader.loadTestsFromTestCase(TestLogParsing))
+    suite.addTests(loader.loadTestsFromTestCase(TestWAFIntegration))
+    suite.addTests(loader.loadTestsFromTestCase(TestLoggingAndMetrics))
+    suite.addTests(loader.loadTestsFromTestCase(TestMultiSignalDetection))
+    suite.addTests(loader.loadTestsFromTestCase(TestEnhancedSlackNotifications))
+    suite.addTests(loader.loadTestsFromTestCase(TestAthenaIntegration))
+    suite.addTests(loader.loadTestsFromTestCase(TestSlackClientEnhanced))
 
     # Run tests
     runner = unittest.TextTestRunner(verbosity=2)
diff --git a/tests/test_final_validation.py b/tests/test_final_validation.py
index fb85c4e..5a9c3d8 100644
--- a/tests/test_final_validation.py
+++ b/tests/test_final_validation.py
@@ -26,13 +26,15 @@ class TestAWSIPFiltering(unittest.TestCase):
 
     def test_load_aws_ip_ranges_none(self):
         """Test with no file path"""
-        result = load_aws_ip_ranges(None)
-        self.assertEqual(result, set())
+        ipv4_result, ipv6_result = load_aws_ip_ranges(None)
+        self.assertEqual(ipv4_result, set())
+        self.assertEqual(ipv6_result, set())
 
     def test_load_aws_ip_ranges_missing_file(self):
         """Test with non-existent file"""
-        result = load_aws_ip_ranges("/nonexistent/file.json")
-        self.assertEqual(result, set())
+        ipv4_result, ipv6_result = load_aws_ip_ranges("/nonexistent/file.json")
+        self.assertEqual(ipv4_result, set())
+        self.assertEqual(ipv6_result, set())
 
     def test_load_aws_ip_ranges_valid(self):
         """Test loading valid AWS IP ranges"""
@@ -54,9 +56,11 @@ def test_load_aws_ip_ranges_valid(self):
             temp_file = f.name
 
         try:
-            result = load_aws_ip_ranges(temp_file)
-            self.assertEqual(len(result), 3)
-            self.assertIsInstance(list(result)[0], ipaddress.IPv4Network)
+            ipv4_result, ipv6_result = load_aws_ip_ranges(temp_file)
+            self.assertEqual(len(ipv4_result), 3)
+            self.assertIsInstance(list(ipv4_result)[0], ipaddress.IPv4Network)
+            # No IPv6 prefixes in test data
+            self.assertEqual(len(ipv6_result), 0)
         finally:
             os.unlink(temp_file)
 
diff --git a/tests/test_integration.py b/tests/test_integration.py
index 6fa352b..2b219f9 100644
--- a/tests/test_integration.py
+++ b/tests/test_integration.py
@@ -43,6 +43,7 @@ def get_client(service, **kwargs):
             start_rule=80,
             limit=20,
             whitelist_file=None,
+            aws_ip_ranges_file=None,
             dry_run=True,
             debug=False
         )
@@ -91,6 +92,7 @@ def get_client(service, **kwargs):
             start_rule=80,
             limit=20,
             whitelist_file=None,
+            aws_ip_ranges_file=None,
             dry_run=True,
             debug=False
         )
@@ -150,6 +152,7 @@ def get_client(service, **kwargs):
             start_rule=80,
             limit=20,
             whitelist_file=None,
+            aws_ip_ranges_file=None,
             dry_run=True,
             debug=False
         )
@@ -179,6 +182,7 @@ def test_scenario_all_ips_whitelisted(self, mock_boto_client):
                 start_rule=80,
                 limit=20,
                 whitelist_file=whitelist_path,
+                aws_ip_ranges_file=None,
                 dry_run=True,
                 debug=False
             )
@@ -206,6 +210,7 @@ def test_rule_range_boundary_conditions(self, mock_boto_client):
             start_rule=80,
             limit=20,
             whitelist_file=None,
+            aws_ip_ranges_file=None,
             dry_run=True,
             debug=False
         )
@@ -220,6 +225,7 @@ def test_rule_range_boundary_conditions(self, mock_boto_client):
             start_rule=99,
             limit=10,  # Should cap at 100
             whitelist_file=None,
+            aws_ip_ranges_file=None,
             dry_run=True,
             debug=False
         )
@@ -234,6 +240,7 @@ def test_rule_range_boundary_conditions(self, mock_boto_client):
             start_rule=85,
             limit=50,  # Would go to 135, but capped
             whitelist_file=None,
+            aws_ip_ranges_file=None,
             dry_run=True,
             debug=False
         )
@@ -261,6 +268,7 @@ def test_lookback_period_edge_cases(self, mock_boto_client):
                 start_rule=80,
                 limit=20,
                 whitelist_file=None,
+            aws_ip_ranges_file=None,
                 dry_run=True,
                 debug=False
             )
@@ -283,6 +291,7 @@ def test_manage_rule_limit_empty_slots(self, mock_boto_client):
             start_rule=80,
             limit=20,
             whitelist_file=None,
+            aws_ip_ranges_file=None,
             dry_run=True,
             debug=False
         )
diff --git a/tests/test_observability_features.py b/tests/test_observability_features.py
new file mode 100644
index 0000000..3ca917b
--- /dev/null
+++ b/tests/test_observability_features.py
@@ -0,0 +1,703 @@
+"""
+Tests for observability and UX improvements.
+
+Tests cover:
+1. Auto-download AWS IP ranges
+2. O(log N) IP range lookups with AWSIPRangeIndex
+3. Enhanced threat score logging
+4. Secure legitimate service verification
+5. Accurate dry-run summary table
+"""
+
+import pytest
+import json
+import tempfile
+import os
+from unittest.mock import patch, MagicMock
+from pathlib import Path
+from datetime import datetime, timedelta
+
+import sys
+sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
+
+from auto_block_attackers import (
+    AWSIPRangeIndex,
+    download_aws_ip_ranges,
+    load_aws_ip_ranges_with_index,
+    get_ip_ranges_path,
+    is_aws_ip_fast,
+    verify_legitimate_service,
+    _clean_path,
+    _path_matches,
+    KNOWN_LEGITIMATE_SERVICES,
+    AWS_SERVICE_ROUTE53_HEALTHCHECKS,
+    AWS_SERVICE_ELB,
+    AWS_SERVICE_CLOUDFRONT,
+)
+
+
+# Sample AWS IP ranges data for testing
+SAMPLE_AWS_IP_RANGES = {
+    "syncToken": "1234567890",
+    "createDate": "2026-01-09-00-00-00",
+    "prefixes": [
+        {"ip_prefix": "52.93.178.234/32", "region": "us-east-1", "service": "AMAZON"},
+        {"ip_prefix": "52.94.76.0/22", "region": "us-east-1", "service": "EC2"},
+        {"ip_prefix": "54.239.0.0/17", "region": "us-west-2", "service": "EC2"},
+        {"ip_prefix": "15.177.0.0/18", "region": "us-east-1", "service": "ROUTE53_HEALTHCHECKS"},
+        {"ip_prefix": "15.177.64.0/18", "region": "us-west-2", "service": "ROUTE53_HEALTHCHECKS"},
+        {"ip_prefix": "13.32.0.0/15", "region": "GLOBAL", "service": "CLOUDFRONT"},
+        {"ip_prefix": "176.32.103.0/24", "region": "eu-west-1", "service": "ELB"},
+    ],
+    "ipv6_prefixes": [
+        {"ipv6_prefix": "2600:1f00::/24", "region": "us-east-1", "service": "EC2"},
+        {"ipv6_prefix": "2600:9000::/28", "region": "GLOBAL", "service": "CLOUDFRONT"},
+    ]
+}
+
+
+class TestAWSIPRangeIndex:
+    """Tests for the AWSIPRangeIndex class."""
+
+    def test_build_index_from_json(self):
+        """Test building index from JSON data."""
+        index = AWSIPRangeIndex.from_json_data(SAMPLE_AWS_IP_RANGES)
+
+        assert index.total_ipv4 == 7
+        assert index.total_ipv6 == 2
+        assert "AMAZON" in index.services
+        assert "EC2" in index.services
+        assert "ROUTE53_HEALTHCHECKS" in index.services
+        assert "CLOUDFRONT" in index.services
+        assert "ELB" in index.services
+
+    def test_is_aws_ip_match(self):
+        """Test O(log N) IP lookup - matching IP."""
+        index = AWSIPRangeIndex.from_json_data(SAMPLE_AWS_IP_RANGES)
+
+        # Test exact match
+        assert index.is_aws_ip("52.93.178.234") is True
+
+        # Test IP within a range
+        assert index.is_aws_ip("52.94.76.1") is True
+        assert index.is_aws_ip("52.94.79.255") is True  # Last IP in /22
+
+    def test_is_aws_ip_no_match(self):
+        """Test O(log N) IP lookup - non-matching IP."""
+        index = AWSIPRangeIndex.from_json_data(SAMPLE_AWS_IP_RANGES)
+
+        # Test IP not in any range
+        assert index.is_aws_ip("1.2.3.4") is False
+        assert index.is_aws_ip("203.0.113.1") is False
+
+    def test_is_aws_ip_ipv6(self):
+        """Test IPv6 IP lookup."""
+        index = AWSIPRangeIndex.from_json_data(SAMPLE_AWS_IP_RANGES)
+
+        # Test IPv6 in range
+        assert index.is_aws_ip("2600:1f00:0:0:0:0:0:1") is True
+
+        # Test IPv6 not in range
+        assert index.is_aws_ip("2001:db8::1") is False
+
+    def test_is_aws_ip_invalid(self):
+        """Test handling of invalid IP addresses."""
+        index = AWSIPRangeIndex.from_json_data(SAMPLE_AWS_IP_RANGES)
+
+        assert index.is_aws_ip("not_an_ip") is False
+        assert index.is_aws_ip("") is False
+        assert index.is_aws_ip("256.256.256.256") is False
+
+    def test_is_from_service(self):
+        """Test service-specific IP verification."""
+        index = AWSIPRangeIndex.from_json_data(SAMPLE_AWS_IP_RANGES)
+
+        # Route53 Health Check IP
+        assert index.is_from_service("15.177.0.1", "ROUTE53_HEALTHCHECKS") is True
+        assert index.is_from_service("15.177.0.1", "EC2") is False
+
+        # CloudFront IP
+        assert index.is_from_service("13.32.0.1", "CLOUDFRONT") is True
+        assert index.is_from_service("13.32.0.1", "ROUTE53_HEALTHCHECKS") is False
+
+        # ELB IP
+        assert index.is_from_service("176.32.103.1", "ELB") is True
+
+        # IP not in any service
+        assert index.is_from_service("1.2.3.4", "EC2") is False
+
+    def test_get_service_for_ip(self):
+        """Test getting service name for an IP."""
+        index = AWSIPRangeIndex.from_json_data(SAMPLE_AWS_IP_RANGES)
+
+        assert index.get_service_for_ip("15.177.0.1") == "ROUTE53_HEALTHCHECKS"
+        assert index.get_service_for_ip("13.32.0.1") == "CLOUDFRONT"
+        assert index.get_service_for_ip("1.2.3.4") is None
+
+    def test_lookup_stats(self):
+        """Test lookup statistics tracking."""
+        index = AWSIPRangeIndex.from_json_data(SAMPLE_AWS_IP_RANGES)
+
+        # Perform some lookups
+        index.is_aws_ip("15.177.0.1")  # Hit
+        index.is_aws_ip("1.2.3.4")     # Miss
+        index.is_aws_ip("13.32.0.1")   # Hit
+
+        hits, misses, rate = index.get_lookup_stats()
+        assert hits == 2
+        assert misses == 1
+        assert rate == pytest.approx(66.67, rel=0.1)
+
+    def test_empty_index(self):
+        """Test handling of empty IP ranges data."""
+        empty_data = {"prefixes": [], "ipv6_prefixes": []}
+        index = AWSIPRangeIndex.from_json_data(empty_data)
+
+        assert index.total_ipv4 == 0
+        assert index.total_ipv6 == 0
+        assert index.is_aws_ip("1.2.3.4") is False
+
+    def test_overlapping_ranges(self):
+        """Test handling of overlapping IP ranges (e.g., /16 with /26 subnets).
+
+        AWS IP ranges contain overlapping CIDRs where a /16 may be followed
+        by smaller /26 subnets. The bisect lookup must check backwards to find
+        the containing /16 when a /26 doesn't contain the target IP.
+        """
+        # Simulate AWS ranges with overlapping /16 and /26
+        overlapping_data = {
+            "syncToken": "test",
+            "createDate": "2026-01-09",
+            "prefixes": [
+                # A /16 that should contain 54.252.193.112
+                {"ip_prefix": "54.252.0.0/16", "region": "ap-southeast-2", "service": "AMAZON"},
+                # A /26 subnet within the /16 (doesn't contain 54.252.193.112)
+                {"ip_prefix": "54.252.79.128/26", "region": "ap-southeast-2", "service": "EC2"},
+                # Another /26 subnet
+                {"ip_prefix": "54.252.254.192/26", "region": "ap-southeast-2", "service": "EC2"},
+            ],
+            "ipv6_prefixes": []
+        }
+
+        index = AWSIPRangeIndex.from_json_data(overlapping_data)
+
+        # IP in the /16 but NOT in any /26 - should still be found
+        assert index.is_aws_ip("54.252.193.112") is True, \
+            "IP in /16 but not in /26 should be found via backward search"
+
+        # IP directly in the /26 should be found
+        assert index.is_aws_ip("54.252.79.140") is True, \
+            "IP in /26 should be found directly"
+
+        # IP outside all ranges
+        assert index.is_aws_ip("1.2.3.4") is False
+
+    def test_overlapping_ranges_service_lookup(self):
+        """Test service lookup with overlapping ranges."""
+        overlapping_data = {
+            "syncToken": "test",
+            "createDate": "2026-01-09",
+            "prefixes": [
+                {"ip_prefix": "54.252.0.0/16", "region": "ap-southeast-2", "service": "AMAZON"},
+                {"ip_prefix": "54.252.79.128/26", "region": "ap-southeast-2", "service": "EC2"},
+            ],
+            "ipv6_prefixes": []
+        }
+
+        index = AWSIPRangeIndex.from_json_data(overlapping_data)
+
+        # IP in /16 but not /26 should return AMAZON service
+        service = index.get_service_for_ip("54.252.193.112")
+        assert service == "AMAZON", f"Expected AMAZON, got {service}"
+
+        # IP in both /16 and /26 - returns first matching service found
+        # (AMAZON comes before EC2 in dict iteration order)
+        service = index.get_service_for_ip("54.252.79.140")
+        assert service in ("AMAZON", "EC2"), f"Expected AMAZON or EC2, got {service}"
+
+
+class TestAutoDownload:
+    """Tests for auto-download functionality."""
+
+    def test_get_ip_ranges_path_default(self):
+        """Test default path for non-Lambda environments."""
+        with patch.dict(os.environ, {}, clear=True):
+            path = get_ip_ranges_path()
+            assert path == "./ip-ranges.json"
+
+    def test_get_ip_ranges_path_lambda(self):
+        """Test path for Lambda environments."""
+        with patch.dict(os.environ, {"AWS_LAMBDA_FUNCTION_NAME": "test-function"}):
+            path = get_ip_ranges_path()
+            assert path == "/tmp/ip-ranges.json"
+
+    def test_download_aws_ip_ranges_success(self):
+        """Test successful download of IP ranges."""
+        with tempfile.TemporaryDirectory() as tmpdir:
+            file_path = os.path.join(tmpdir, "ip-ranges.json")
+
+            mock_response = MagicMock()
+            mock_response.json.return_value = SAMPLE_AWS_IP_RANGES
+            mock_response.content = json.dumps(SAMPLE_AWS_IP_RANGES).encode()
+
+            with patch('requests.get', return_value=mock_response):
+                result = download_aws_ip_ranges(file_path)
+
+            assert result is not None
+            assert "prefixes" in result
+            assert os.path.exists(file_path)
+
+    def test_download_aws_ip_ranges_cached(self):
+        """Test loading from fresh cache."""
+        with tempfile.TemporaryDirectory() as tmpdir:
+            file_path = os.path.join(tmpdir, "ip-ranges.json")
+
+            # Create a fresh cached file
+            with open(file_path, 'w') as f:
+                json.dump(SAMPLE_AWS_IP_RANGES, f)
+
+            # Should load from cache without downloading
+            with patch('requests.get') as mock_get:
+                result = download_aws_ip_ranges(file_path, max_age_days=7)
+
+            # requests.get should not be called if cache is fresh
+            assert result is not None
+            assert "prefixes" in result
+
+    def test_download_aws_ip_ranges_timeout(self):
+        """Test handling of download timeout."""
+        import requests
+        with tempfile.TemporaryDirectory() as tmpdir:
+            file_path = os.path.join(tmpdir, "ip-ranges.json")
+
+            with patch('requests.get', side_effect=requests.exceptions.Timeout):
+                result = download_aws_ip_ranges(file_path)
+
+            assert result is None
+
+    def test_download_aws_ip_ranges_fallback(self):
+        """Test fallback to stale cache on download failure."""
+        import requests
+        with tempfile.TemporaryDirectory() as tmpdir:
+            file_path = os.path.join(tmpdir, "ip-ranges.json")
+
+            # Create stale cached file (touch with old timestamp)
+            with open(file_path, 'w') as f:
+                json.dump(SAMPLE_AWS_IP_RANGES, f)
+            old_time = datetime.now() - timedelta(days=30)
+            os.utime(file_path, (old_time.timestamp(), old_time.timestamp()))
+
+            # Simulate download failure
+            with patch('requests.get', side_effect=requests.exceptions.RequestException("Network error")):
+                result = download_aws_ip_ranges(file_path, max_age_days=7)
+
+            # Should fall back to stale cache
+            assert result is not None
+            assert "prefixes" in result
+
+
+class TestLoadWithIndex:
+    """Tests for load_aws_ip_ranges_with_index."""
+
+    def test_load_with_auto_download_disabled(self):
+        """Test loading with auto-download disabled."""
+        with tempfile.TemporaryDirectory() as tmpdir:
+            file_path = os.path.join(tmpdir, "ip-ranges.json")
+
+            # Create file
+            with open(file_path, 'w') as f:
+                json.dump(SAMPLE_AWS_IP_RANGES, f)
+
+            index, ipv4, ipv6 = load_aws_ip_ranges_with_index(
+                file_path=file_path,
+                auto_download=False
+            )
+
+            assert index is not None
+            assert len(ipv4) == 7
+            assert len(ipv6) == 2
+
+    def test_load_with_missing_file_no_download(self):
+        """Test loading missing file with auto-download disabled."""
+        with tempfile.TemporaryDirectory() as tmpdir:
+            file_path = os.path.join(tmpdir, "nonexistent.json")
+
+            index, ipv4, ipv6 = load_aws_ip_ranges_with_index(
+                file_path=file_path,
+                auto_download=False
+            )
+
+            assert index is None
+            assert len(ipv4) == 0
+            assert len(ipv6) == 0
+
+
+class TestPathCleaning:
+    """Tests for path cleaning and matching."""
+
+    def test_clean_path_basic(self):
+        """Test basic path cleaning."""
+        assert _clean_path("/health") == "/health"
+        assert _clean_path("/health/") == "/health"
+        assert _clean_path("health") == "/health"
+
+    def test_clean_path_query_params(self):
+        """Test stripping query parameters."""
+        assert _clean_path("/health?foo=bar") == "/health"
+        assert _clean_path("/login?redirect=/health") == "/login"
+
+    def test_clean_path_fragments(self):
+        """Test stripping URL fragments."""
+        assert _clean_path("/health#section") == "/health"
+
+    def test_clean_path_full_url(self):
+        """Test cleaning full URLs."""
+        assert _clean_path("https://example.com/health?token=xyz") == "/health"
+        assert _clean_path("http://example.com/api/v1/status") == "/api/v1/status"
+
+    def test_path_matches_exact(self):
+        """Test exact path matching."""
+        assert _path_matches("/health", "/health") is True
+        assert _path_matches("/health/", "/health") is True
+        assert _path_matches("/status", "/health") is False
+
+    def test_path_matches_prefix(self):
+        """Test prefix path matching."""
+        assert _path_matches("/health/check", "/health") is True
+        assert _path_matches("/health/deep/nested", "/health") is True
+        assert _path_matches("/healthz", "/health") is False  # No slash after prefix
+
+    def test_path_matches_query_bypass_prevention(self):
+        """Test that query params don't bypass path matching."""
+        # This is the key security test
+        assert _path_matches("/login?redirect=/health", "/health") is False
+        assert _path_matches("/api?path=/health", "/health") is False
+
+
+class TestLegitimateServiceVerification:
+    """Tests for legitimate service verification."""
+
+    def test_route53_health_check_verified(self):
+        """Test Route53 Health Check verification with matching IP."""
+        index = AWSIPRangeIndex.from_json_data(SAMPLE_AWS_IP_RANGES)
+
+        adjustment, service, method = verify_legitimate_service(
+            ip="15.177.0.1",  # In ROUTE53_HEALTHCHECKS range
+            ua="Amazon-Route53-Health-Check-Service (ref: abc123)",
+            request_paths=["/health"],
+            aws_index=index
+        )
+
+        assert adjustment == -25
+        assert service == "Route53-Health-Check"
+        assert method == "aws_service"
+
+    def test_route53_health_check_spoofed(self):
+        """Test Route53 Health Check rejection when IP doesn't match."""
+        index = AWSIPRangeIndex.from_json_data(SAMPLE_AWS_IP_RANGES)
+
+        # IP not in ROUTE53_HEALTHCHECKS range
+        adjustment, service, method = verify_legitimate_service(
+            ip="1.2.3.4",
+            ua="Amazon-Route53-Health-Check-Service (ref: abc123)",
+            request_paths=["/health"],
+            aws_index=index
+        )
+
+        assert adjustment == 0  # No negative adjustment for spoofed UA
+        assert service is None
+
+    def test_datadog_verified(self):
+        """Test Datadog verification with matching path."""
+        adjustment, service, method = verify_legitimate_service(
+            ip="1.2.3.4",
+            ua="Datadog Agent/7.0.0",
+            request_paths=["/health", "/api/v1/metrics"],
+            aws_index=None
+        )
+
+        assert adjustment == -15
+        assert service == "Datadog"
+        assert method == "path_match"
+
+    def test_datadog_wrong_path(self):
+        """Test Datadog rejection when paths don't match."""
+        adjustment, service, method = verify_legitimate_service(
+            ip="1.2.3.4",
+            ua="Datadog Agent/7.0.0",
+            request_paths=["/admin", "/wp-login.php"],
+            aws_index=None
+        )
+
+        assert adjustment == 0
+        assert service is None
+
+    def test_no_aws_index_warning(self):
+        """Test warning when AWS index unavailable for AWS service."""
+        # Without AWS index, can't verify AWS services
+        adjustment, service, method = verify_legitimate_service(
+            ip="15.177.0.1",
+            ua="Amazon-Route53-Health-Check-Service",
+            request_paths=["/health"],
+            aws_index=None  # No index available
+        )
+
+        # Should not give negative score without verification
+        assert adjustment == 0
+
+    def test_ua_injection_prevention(self):
+        """Test that UA injection doesn't match anchored patterns."""
+        index = AWSIPRangeIndex.from_json_data(SAMPLE_AWS_IP_RANGES)
+
+        # Evil UA trying to inject legitimate service name
+        adjustment, service, method = verify_legitimate_service(
+            ip="1.2.3.4",
+            ua="Evil-Attacker/1.0 (includes Amazon-Route53-Health-Check-Service)",
+            request_paths=["/admin"],
+            aws_index=index
+        )
+
+        # Anchored regex should not match
+        assert adjustment == 0
+
+    def test_cloudfront_verification(self):
+        """Test CloudFront service verification."""
+        index = AWSIPRangeIndex.from_json_data(SAMPLE_AWS_IP_RANGES)
+
+        adjustment, service, method = verify_legitimate_service(
+            ip="13.32.0.1",  # In CLOUDFRONT range
+            ua="Amazon CloudFront",
+            request_paths=["/"],
+            aws_index=index
+        )
+
+        assert adjustment == -25
+        assert service == "CloudFront"
+        assert method == "aws_service"
+
+
+class TestIsAwsIpFast:
+    """Tests for the fast AWS IP check function."""
+
+    def test_is_aws_ip_fast_with_index(self):
+        """Test fast IP check with index."""
+        index = AWSIPRangeIndex.from_json_data(SAMPLE_AWS_IP_RANGES)
+
+        assert is_aws_ip_fast("15.177.0.1", index) is True
+        assert is_aws_ip_fast("1.2.3.4", index) is False
+
+    def test_is_aws_ip_fast_explicit_none(self):
+        """Test fast IP check with explicitly passed None index."""
+        # Create a fresh empty index to test explicit None behavior
+        empty_index = AWSIPRangeIndex.from_json_data({"prefixes": [], "ipv6_prefixes": []})
+
+        # With empty index, IP should not be found
+        assert is_aws_ip_fast("15.177.0.1", empty_index) is False
+        assert is_aws_ip_fast("1.2.3.4", empty_index) is False
+
+
+class TestDryRunSummary:
+    """Tests for accurate dry-run summary table generation."""
+
+    def test_generate_report_dry_run_mode(self):
+        """Test report generation in dry-run mode shows expected state changes."""
+        from unittest.mock import MagicMock
+        from collections import Counter
+        from auto_block_attackers import NaclAutoBlocker
+
+        with tempfile.TemporaryDirectory() as tmpdir:
+            # Create minimal blocker instance
+            with patch('boto3.client') as mock_boto:
+                mock_client = MagicMock()
+                mock_boto.return_value = mock_client
+
+                # Mock STS get_caller_identity
+                mock_client.get_caller_identity.return_value = {"Account": "123456789012"}
+
+                blocker = NaclAutoBlocker(
+                    lb_name_pattern="test-*",
+                    region="us-east-1",
+                    lookback_str="60m",
+                    threshold=50,
+                    start_rule=80,
+                    limit=20,
+                    whitelist_file=None,
+                    aws_ip_ranges_file=None,
+                    dry_run=True,
+                    debug=False,
+                    auto_download_ip_ranges=False,
+                )
+
+        # Test data
+        ip_counts = Counter({
+            "192.168.1.1": 100,  # Will be blocked
+            "192.168.1.2": 30,   # Below threshold
+        })
+
+        offenders = {"192.168.1.1"}
+        final_blocked_ips = {"192.168.1.3"}  # Currently blocked
+        ips_to_add = {"192.168.1.1"}
+        ips_to_remove = {"192.168.1.4"}  # Expired
+
+        # Test _get_dry_run_status directly
+        status = blocker._get_dry_run_status(
+            ip="192.168.1.1",
+            ips_to_add=ips_to_add,
+            ips_to_remove=ips_to_remove,
+            final_blocked_ips=final_blocked_ips,
+            skipped_ip_details={},
+            hits=100,
+        )
+        assert "WILL BE BLOCKED" in status
+
+        status = blocker._get_dry_run_status(
+            ip="192.168.1.4",
+            ips_to_add=ips_to_add,
+            ips_to_remove=ips_to_remove,
+            final_blocked_ips=final_blocked_ips,
+            skipped_ip_details={},
+            hits=0,
+        )
+        assert "WILL BE UNBLOCKED" in status
+
+        status = blocker._get_dry_run_status(
+            ip="192.168.1.3",
+            ips_to_add=ips_to_add,
+            ips_to_remove=ips_to_remove,
+            final_blocked_ips=final_blocked_ips,
+            skipped_ip_details={},
+            hits=0,
+        )
+        assert "NO CHANGE" in status
+
+        # Test skipped IP status (without service name)
+        status = blocker._get_dry_run_status(
+            ip="192.168.1.5",
+            ips_to_add=ips_to_add,
+            ips_to_remove=ips_to_remove,
+            final_blocked_ips=final_blocked_ips,
+            skipped_ip_details={"192.168.1.5": (35.0, {})},
+            hits=75,
+        )
+        assert "SKIPPED" in status
+        assert "35" in status
+
+        # Test skipped IP status with service name
+        status = blocker._get_dry_run_status(
+            ip="192.168.1.6",
+            ips_to_add=ips_to_add,
+            ips_to_remove=ips_to_remove,
+            final_blocked_ips=final_blocked_ips,
+            skipped_ip_details={"192.168.1.6": (33.0, {"service_name": "Route53-Health-Check"})},
+            hits=300,
+        )
+        assert "SKIPPED" in status
+        assert "33" in status
+        assert "Route53-Health-Check" in status
+
+
+class TestThreatScoreLogging:
+    """Tests for enhanced threat score logging."""
+
+    def test_log_threat_score_details_blocked(self, capsys):
+        """Test logging for blocked IPs."""
+        from unittest.mock import MagicMock
+        from auto_block_attackers import NaclAutoBlocker
+        import logging
+
+        with patch('boto3.client') as mock_boto:
+            mock_client = MagicMock()
+            mock_boto.return_value = mock_client
+            mock_client.get_caller_identity.return_value = {"Account": "123456789012"}
+
+            blocker = NaclAutoBlocker(
+                lb_name_pattern="test-*",
+                region="us-east-1",
+                lookback_str="60m",
+                threshold=50,
+                start_rule=80,
+                limit=20,
+                whitelist_file=None,
+                aws_ip_ranges_file=None,
+                dry_run=True,
+                debug=True,  # Enable debug for detailed logging
+                auto_download_ip_ranges=False,
+            )
+
+        details = {
+            'base_score': 75.0,
+            'breakdown': {
+                'attack_pattern': 40.0,
+                'scanner_ua': 25.0,
+                'error_rate': 10.0,
+                'path_diversity': 0.0,
+                'rate': 0.0,
+            },
+            'hit_count': 150,
+            'reasons': ['attack_patterns (45 hits)', 'scanner_ua (30 hits)'],
+            'attack_pattern_hits': 45,
+            'scanner_ua_hits': 30,
+            'error_responses': 120,
+        }
+
+        blocker._log_threat_score_details("192.168.1.1", 75.0, details, blocked=True)
+
+        # Check stderr (where logging output goes)
+        captured = capsys.readouterr()
+        assert "BLOCKED" in captured.err
+        assert "192.168.1.1" in captured.err
+        assert "75" in captured.err
+
+    def test_log_threat_score_details_high_hit_warning(self, capsys):
+        """Test warning for high-hit IPs that were skipped."""
+        from unittest.mock import MagicMock
+        from auto_block_attackers import NaclAutoBlocker
+        import logging
+
+        with patch('boto3.client') as mock_boto:
+            mock_client = MagicMock()
+            mock_boto.return_value = mock_client
+            mock_client.get_caller_identity.return_value = {"Account": "123456789012"}
+
+            blocker = NaclAutoBlocker(
+                lb_name_pattern="test-*",
+                region="us-east-1",
+                lookback_str="60m",
+                threshold=50,
+                start_rule=80,
+                limit=20,
+                whitelist_file=None,
+                aws_ip_ranges_file=None,
+                dry_run=True,
+                debug=False,
+                auto_download_ip_ranges=False,
+            )
+
+        details = {
+            'base_score': 35.0,
+            'breakdown': {
+                'attack_pattern': 20.0,
+                'scanner_ua': 0.0,
+                'error_rate': 15.0,
+                'path_diversity': 0.0,
+                'rate': 0.0,
+            },
+            'hit_count': 500,  # High hits but low score
+            'reasons': ['attack_patterns (10 hits)'],
+            'attack_pattern_hits': 10,
+            'scanner_ua_hits': 0,
+            'error_responses': 100,
+        }
+
+        blocker._log_threat_score_details("192.168.1.1", 35.0, details, blocked=False)
+
+        # Check stderr for warning
+        captured = capsys.readouterr()
+        assert "High-traffic IP" in captured.err
+        assert "500 hits" in captured.err
+        assert "NOT blocked" in captured.err
+        assert "⚠️" in captured.err  # Emoji indicator for warning
+
+
+if __name__ == "__main__":
+    pytest.main([__file__, "-v"])
diff --git a/tests/test_storage_backends.py b/tests/test_storage_backends.py
new file mode 100644
index 0000000..2e468f3
--- /dev/null
+++ b/tests/test_storage_backends.py
@@ -0,0 +1,478 @@
+#!/usr/bin/env python3
+"""
+Test suite for storage_backends.py
+
+Tests all storage backend implementations:
+- LocalFileBackend
+- DynamoDBBackend (mocked)
+- S3Backend (mocked)
+- Factory function
+"""
+
+import json
+import os
+import sys
+import tempfile
+import unittest
+from datetime import datetime, timedelta, timezone
+from unittest.mock import MagicMock, patch, PropertyMock
+
+# Add parent directory to path
+sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
+
+from storage_backends import (
+    StorageBackend,
+    LocalFileBackend,
+    DynamoDBBackend,
+    S3Backend,
+    create_storage_backend,
+    StorageError,
+    ConflictError,
+)
+
+
+class TestLocalFileBackend(unittest.TestCase):
+    """Test LocalFileBackend implementation."""
+
+    def setUp(self):
+        """Create a temporary file for each test."""
+        self.temp_file = tempfile.NamedTemporaryFile(
+            mode='w', suffix='.json', delete=False
+        )
+        self.temp_file.close()
+        self.backend = LocalFileBackend(file_path=self.temp_file.name)
+
+    def tearDown(self):
+        """Clean up temporary file."""
+        if os.path.exists(self.temp_file.name):
+            os.unlink(self.temp_file.name)
+        # Clean up any .tmp files
+        tmp_file = f"{self.temp_file.name}.tmp"
+        if os.path.exists(tmp_file):
+            os.unlink(tmp_file)
+
+    def test_load_empty_file(self):
+        """Test loading from non-existent file returns empty dict."""
+        os.unlink(self.temp_file.name)
+        result = self.backend.load()
+        self.assertEqual(result, {})
+
+    def test_load_valid_data(self):
+        """Test loading valid JSON data."""
+        test_data = {
+            "1.2.3.4": {
+                "tier": "high",
+                "priority": 3,
+                "block_until": "2025-01-20T10:00:00+00:00",
+            }
+        }
+        with open(self.temp_file.name, 'w') as f:
+            json.dump(test_data, f)
+
+        result = self.backend.load()
+        self.assertEqual(result, test_data)
+
+    def test_load_corrupted_json(self):
+        """Test loading corrupted JSON returns empty dict."""
+        with open(self.temp_file.name, 'w') as f:
+            f.write("{invalid json")
+
+        result = self.backend.load()
+        self.assertEqual(result, {})
+
+    def test_load_invalid_structure(self):
+        """Test loading non-dict JSON returns empty dict."""
+        with open(self.temp_file.name, 'w') as f:
+            json.dump(["not", "a", "dict"], f)
+
+        result = self.backend.load()
+        self.assertEqual(result, {})
+
+    def test_save_creates_file(self):
+        """Test save creates file if it doesn't exist."""
+        os.unlink(self.temp_file.name)
+        test_data = {"1.2.3.4": {"tier": "low"}}
+
+        self.backend.save(test_data)
+
+        self.assertTrue(os.path.exists(self.temp_file.name))
+        with open(self.temp_file.name, 'r') as f:
+            saved_data = json.load(f)
+        self.assertEqual(saved_data, test_data)
+
+    def test_save_overwrites_existing(self):
+        """Test save overwrites existing data."""
+        with open(self.temp_file.name, 'w') as f:
+            json.dump({"old": "data"}, f)
+
+        new_data = {"new": "data"}
+        self.backend.save(new_data)
+
+        with open(self.temp_file.name, 'r') as f:
+            saved_data = json.load(f)
+        self.assertEqual(saved_data, new_data)
+
+    def test_get_existing_ip(self):
+        """Test getting an existing IP."""
+        test_data = {
+            "1.2.3.4": {"tier": "high"},
+            "5.6.7.8": {"tier": "low"},
+        }
+        with open(self.temp_file.name, 'w') as f:
+            json.dump(test_data, f)
+
+        result = self.backend.get("1.2.3.4")
+        self.assertEqual(result, {"tier": "high"})
+
+    def test_get_non_existing_ip(self):
+        """Test getting a non-existing IP returns None."""
+        with open(self.temp_file.name, 'w') as f:
+            json.dump({}, f)
+
+        result = self.backend.get("1.2.3.4")
+        self.assertIsNone(result)
+
+    def test_put_new_ip(self):
+        """Test putting a new IP."""
+        with open(self.temp_file.name, 'w') as f:
+            json.dump({}, f)
+
+        self.backend.put("1.2.3.4", {"tier": "high"})
+
+        with open(self.temp_file.name, 'r') as f:
+            saved_data = json.load(f)
+        self.assertEqual(saved_data, {"1.2.3.4": {"tier": "high"}})
+
+    def test_put_updates_existing(self):
+        """Test putting updates existing IP."""
+        with open(self.temp_file.name, 'w') as f:
+            json.dump({"1.2.3.4": {"tier": "low"}}, f)
+
+        self.backend.put("1.2.3.4", {"tier": "high"})
+
+        with open(self.temp_file.name, 'r') as f:
+            saved_data = json.load(f)
+        self.assertEqual(saved_data, {"1.2.3.4": {"tier": "high"}})
+
+    def test_delete_existing_ip(self):
+        """Test deleting an existing IP."""
+        with open(self.temp_file.name, 'w') as f:
+            json.dump({"1.2.3.4": {"tier": "high"}}, f)
+
+        self.backend.delete("1.2.3.4")
+
+        with open(self.temp_file.name, 'r') as f:
+            saved_data = json.load(f)
+        self.assertEqual(saved_data, {})
+
+    def test_delete_non_existing_ip(self):
+        """Test deleting non-existing IP doesn't raise error."""
+        with open(self.temp_file.name, 'w') as f:
+            json.dump({}, f)
+
+        # Should not raise
+        self.backend.delete("1.2.3.4")
+
+    def test_get_expired(self):
+        """Test getting expired IPs."""
+        now = datetime.now(timezone.utc)
+        test_data = {
+            "1.2.3.4": {"block_until": (now - timedelta(hours=1)).isoformat()},  # Expired
+            "5.6.7.8": {"block_until": (now + timedelta(hours=1)).isoformat()},  # Active
+            "9.10.11.12": {"block_until": (now - timedelta(days=1)).isoformat()},  # Expired
+        }
+        with open(self.temp_file.name, 'w') as f:
+            json.dump(test_data, f)
+
+        expired = self.backend.get_expired(now)
+        self.assertEqual(expired, {"1.2.3.4", "9.10.11.12"})
+
+    def test_get_expired_handles_invalid_dates(self):
+        """Test get_expired handles invalid date formats gracefully."""
+        now = datetime.now(timezone.utc)
+        test_data = {
+            "1.2.3.4": {"block_until": "invalid-date"},
+            "5.6.7.8": {"block_until": (now - timedelta(hours=1)).isoformat()},
+        }
+        with open(self.temp_file.name, 'w') as f:
+            json.dump(test_data, f)
+
+        expired = self.backend.get_expired(now)
+        self.assertEqual(expired, {"5.6.7.8"})
+
+    def test_cleanup_old_entries(self):
+        """Test cleaning up old entries."""
+        now = datetime.now(timezone.utc)
+        test_data = {
+            "1.2.3.4": {"block_until": (now - timedelta(days=40)).isoformat()},  # Very old
+            "5.6.7.8": {"block_until": (now - timedelta(days=10)).isoformat()},  # Recently expired
+            "9.10.11.12": {"block_until": (now + timedelta(days=5)).isoformat()},  # Active
+        }
+        with open(self.temp_file.name, 'w') as f:
+            json.dump(test_data, f)
+
+        removed = self.backend.cleanup_old_entries(now, days_old=30)
+        self.assertEqual(removed, 1)
+
+        with open(self.temp_file.name, 'r') as f:
+            remaining = json.load(f)
+        self.assertNotIn("1.2.3.4", remaining)
+        self.assertIn("5.6.7.8", remaining)
+        self.assertIn("9.10.11.12", remaining)
+
+
+class TestDynamoDBBackend(unittest.TestCase):
+    """Test DynamoDBBackend implementation with mocked AWS calls."""
+
+    @patch('storage_backends.boto3.client')
+    @patch('storage_backends.boto3.resource')
+    def setUp(self, mock_resource, mock_client):
+        """Set up mocked DynamoDB backend."""
+        self.mock_dynamodb = MagicMock()
+        self.mock_table = MagicMock()
+        mock_client.return_value = self.mock_dynamodb
+        mock_resource.return_value.Table.return_value = self.mock_table
+
+        self.backend = DynamoDBBackend(
+            table_name="test-table",
+            region="us-east-1",
+        )
+
+    def test_get_existing_item(self):
+        """Test getting an existing item from DynamoDB."""
+        self.mock_table.get_item.return_value = {
+            "Item": {
+                "ip": "1.2.3.4",
+                "tier": "high",
+                "priority": 3,
+                "block_until_iso": "2025-01-20T10:00:00+00:00",
+                "first_seen": "2025-01-15T10:00:00+00:00",
+                "last_seen": "2025-01-15T10:00:00+00:00",
+                "total_hits": 1000,
+                "block_duration_hours": 72,
+                "version": 1,
+            }
+        }
+
+        result = self.backend.get("1.2.3.4")
+        self.assertEqual(result["tier"], "high")
+        self.assertEqual(result["priority"], 3)
+
+    def test_get_non_existing_item(self):
+        """Test getting a non-existing item returns None."""
+        self.mock_table.get_item.return_value = {}
+
+        result = self.backend.get("1.2.3.4")
+        self.assertIsNone(result)
+
+    def test_put_new_item(self):
+        """Test putting a new item to DynamoDB."""
+        entry = {
+            "tier": "high",
+            "priority": 3,
+            "block_until": "2025-01-20T10:00:00+00:00",
+            "first_seen": "2025-01-15T10:00:00+00:00",
+            "last_seen": "2025-01-15T10:00:00+00:00",
+            "total_hits": 1000,
+            "block_duration_hours": 72,
+        }
+
+        self.backend.put("1.2.3.4", entry)
+
+        self.mock_table.put_item.assert_called_once()
+        call_args = self.mock_table.put_item.call_args
+        item = call_args[1]["Item"]
+        self.assertEqual(item["ip"], "1.2.3.4")
+        self.assertEqual(item["tier"], "high")
+
+    def test_delete_item(self):
+        """Test deleting an item from DynamoDB."""
+        self.backend.delete("1.2.3.4")
+
+        self.mock_table.delete_item.assert_called_once_with(Key={"ip": "1.2.3.4"})
+
+
+class TestS3Backend(unittest.TestCase):
+    """Test S3Backend implementation with mocked AWS calls."""
+
+    @patch('storage_backends.boto3.client')
+    def setUp(self, mock_client):
+        """Set up mocked S3 backend."""
+        self.mock_s3 = MagicMock()
+        mock_client.return_value = self.mock_s3
+
+        self.backend = S3Backend(
+            bucket="test-bucket",
+            key="block_registry.json",
+            region="us-east-1",
+        )
+
+    def test_load_existing_data(self):
+        """Test loading existing data from S3."""
+        test_data = {"1.2.3.4": {"tier": "high"}}
+        self.mock_s3.get_object.return_value = {
+            "Body": MagicMock(read=MagicMock(return_value=json.dumps(test_data).encode())),
+            "ETag": '"abc123"',
+        }
+
+        result = self.backend.load()
+        self.assertEqual(result, test_data)
+        self.assertEqual(self.backend._etag, "abc123")
+
+    def test_load_non_existing_key(self):
+        """Test loading from non-existing key returns empty dict."""
+        from botocore.exceptions import ClientError
+
+        self.mock_s3.get_object.side_effect = ClientError(
+            {"Error": {"Code": "NoSuchKey"}}, "GetObject"
+        )
+
+        result = self.backend.load()
+        self.assertEqual(result, {})
+
+    def test_save_data(self):
+        """Test saving data to S3."""
+        test_data = {"1.2.3.4": {"tier": "high"}}
+        self.mock_s3.put_object.return_value = {"ETag": '"def456"'}
+
+        self.backend.save(test_data)
+
+        self.mock_s3.put_object.assert_called_once()
+        call_args = self.mock_s3.put_object.call_args
+        self.assertEqual(call_args[1]["Bucket"], "test-bucket")
+        self.assertEqual(call_args[1]["Key"], "block_registry.json")
+
+    def test_get_existing_ip(self):
+        """Test getting an existing IP from S3."""
+        test_data = {"1.2.3.4": {"tier": "high"}, "5.6.7.8": {"tier": "low"}}
+        self.mock_s3.get_object.return_value = {
+            "Body": MagicMock(read=MagicMock(return_value=json.dumps(test_data).encode())),
+            "ETag": '"abc123"',
+        }
+
+        result = self.backend.get("1.2.3.4")
+        self.assertEqual(result, {"tier": "high"})
+
+    def test_delete_ip(self):
+        """Test deleting an IP from S3."""
+        test_data = {"1.2.3.4": {"tier": "high"}, "5.6.7.8": {"tier": "low"}}
+        self.mock_s3.get_object.return_value = {
+            "Body": MagicMock(read=MagicMock(return_value=json.dumps(test_data).encode())),
+            "ETag": '"abc123"',
+        }
+        self.mock_s3.put_object.return_value = {"ETag": '"def456"'}
+
+        self.backend.delete("1.2.3.4")
+
+        # Verify put_object was called with data excluding deleted IP
+        call_args = self.mock_s3.put_object.call_args
+        saved_body = call_args[1]["Body"].decode()
+        saved_data = json.loads(saved_body)
+        self.assertNotIn("1.2.3.4", saved_data)
+        self.assertIn("5.6.7.8", saved_data)
+
+
+class TestCreateStorageBackend(unittest.TestCase):
+    """Test the factory function."""
+
+    def test_create_local_backend(self):
+        """Test creating local file backend."""
+        backend = create_storage_backend(
+            backend_type="local",
+            local_file="/tmp/test_registry.json",
+        )
+        self.assertIsInstance(backend, LocalFileBackend)
+
+    @patch('storage_backends.boto3.client')
+    @patch('storage_backends.boto3.resource')
+    def test_create_dynamodb_backend(self, mock_resource, mock_client):
+        """Test creating DynamoDB backend."""
+        mock_client.return_value = MagicMock()
+        mock_resource.return_value.Table.return_value = MagicMock()
+
+        backend = create_storage_backend(
+            backend_type="dynamodb",
+            dynamodb_table="test-table",
+            region="us-east-1",
+        )
+        self.assertIsInstance(backend, DynamoDBBackend)
+
+    @patch('storage_backends.boto3.client')
+    def test_create_s3_backend(self, mock_client):
+        """Test creating S3 backend."""
+        mock_client.return_value = MagicMock()
+
+        backend = create_storage_backend(
+            backend_type="s3",
+            s3_bucket="test-bucket",
+            s3_key="registry.json",
+            region="us-east-1",
+        )
+        self.assertIsInstance(backend, S3Backend)
+
+    def test_create_invalid_backend_type(self):
+        """Test creating backend with invalid type raises ValueError."""
+        with self.assertRaises(ValueError) as context:
+            create_storage_backend(backend_type="invalid")
+        self.assertIn("Unknown backend type", str(context.exception))
+
+    def test_create_dynamodb_without_table(self):
+        """Test creating DynamoDB backend without table raises ValueError."""
+        with self.assertRaises(ValueError) as context:
+            create_storage_backend(backend_type="dynamodb")
+        self.assertIn("dynamodb_table is required", str(context.exception))
+
+    def test_create_s3_without_bucket(self):
+        """Test creating S3 backend without bucket raises ValueError."""
+        with self.assertRaises(ValueError) as context:
+            create_storage_backend(backend_type="s3")
+        self.assertIn("s3_bucket is required", str(context.exception))
+
+
+class TestStorageBackendInterface(unittest.TestCase):
+    """Test that all backends properly implement the interface."""
+
+    def test_local_backend_is_storage_backend(self):
+        """Test LocalFileBackend is a StorageBackend."""
+        backend = LocalFileBackend(file_path="/tmp/test.json")
+        self.assertIsInstance(backend, StorageBackend)
+
+    @patch('storage_backends.boto3.client')
+    @patch('storage_backends.boto3.resource')
+    def test_dynamodb_backend_is_storage_backend(self, mock_resource, mock_client):
+        """Test DynamoDBBackend is a StorageBackend."""
+        mock_client.return_value = MagicMock()
+        mock_resource.return_value.Table.return_value = MagicMock()
+
+        backend = DynamoDBBackend(table_name="test", region="us-east-1")
+        self.assertIsInstance(backend, StorageBackend)
+
+    @patch('storage_backends.boto3.client')
+    def test_s3_backend_is_storage_backend(self, mock_client):
+        """Test S3Backend is a StorageBackend."""
+        mock_client.return_value = MagicMock()
+
+        backend = S3Backend(bucket="test", region="us-east-1")
+        self.assertIsInstance(backend, StorageBackend)
+
+
+def run_tests():
+    """Run all tests and return results."""
+    loader = unittest.TestLoader()
+    suite = unittest.TestSuite()
+
+    suite.addTests(loader.loadTestsFromTestCase(TestLocalFileBackend))
+    suite.addTests(loader.loadTestsFromTestCase(TestDynamoDBBackend))
+    suite.addTests(loader.loadTestsFromTestCase(TestS3Backend))
+    suite.addTests(loader.loadTestsFromTestCase(TestCreateStorageBackend))
+    suite.addTests(loader.loadTestsFromTestCase(TestStorageBackendInterface))
+
+    runner = unittest.TextTestRunner(verbosity=2)
+    result = runner.run(suite)
+
+    return result.wasSuccessful()
+
+
+if __name__ == "__main__":
+    success = run_tests()
+    sys.exit(0 if success else 1)
diff --git a/tests/test_timestamp_fix.py b/tests/test_timestamp_fix.py
index e866a33..f96a873 100644
--- a/tests/test_timestamp_fix.py
+++ b/tests/test_timestamp_fix.py
@@ -19,13 +19,19 @@ class TestTimestampFiltering(unittest.TestCase):
     """Test that requests are filtered by their actual timestamp"""
 
     @patch('auto_block_attackers.boto3.client')
-    def test_filters_old_requests_from_log_file(self, mock_boto_client):
-        """Test that old requests within a recent file are skipped"""
+    def test_log_file_entries_are_all_processed(self, mock_boto_client):
+        """Test that all entries in a log file are processed.
+
+        Note: The lookback window filtering happens at the S3 file level
+        (via ListObjectsV2), not at the individual log entry level. All
+        entries within a fetched log file are processed regardless of
+        their individual timestamps.
+        """
 
         # Create a log with requests from different times
         now = datetime.now(timezone.utc)
-        old_time = now - timedelta(hours=2)  # 2 hours ago (outside 1h window)
-        recent_time = now - timedelta(minutes=30)  # 30 mins ago (inside 1h window)
+        old_time = now - timedelta(hours=2)  # 2 hours ago
+        recent_time = now - timedelta(minutes=30)  # 30 mins ago
 
         log_content = f"""http {old_time.strftime('%Y-%m-%dT%H:%M:%S.%fZ')} app/test-lb/abc123 1.2.3.4:12345 10.0.0.1:80 0.001 0.002 0.003 200 200 100 200 "GET http://example.com:80/../../etc/passwd HTTP/1.1" "Mozilla/5.0" - - arn:aws:elasticloadbalancing:us-east-1:123:targetgroup/test/xyz "Root=1-abc-123" "-" "-" 0 {old_time.strftime('%Y-%m-%dT%H:%M:%S.%fZ')} "forward" "-" "-" "-" "-" "-" "-" "-"
 http {recent_time.strftime('%Y-%m-%dT%H:%M:%S.%fZ')} app/test-lb/abc123 5.6.7.8:12345 10.0.0.1:80 0.001 0.002 0.003 200 200 100 200 "GET http://example.com:80/../../etc/passwd HTTP/1.1" "Mozilla/5.0" - - arn:aws:elasticloadbalancing:us-east-1:123:targetgroup/test/xyz "Root=1-abc-123" "-" "-" 0 {recent_time.strftime('%Y-%m-%dT%H:%M:%S.%fZ')} "forward" "-" "-" "-" "-" "-" "-" "-"
@@ -43,11 +49,12 @@ def test_filters_old_requests_from_log_file(self, mock_boto_client):
         blocker = NaclAutoBlocker(
             lb_name_pattern="test",
             region="us-east-1",
-            lookback_str="1h",  # Only process last 1 hour
+            lookback_str="1h",
             threshold=10,
             start_rule=80,
             limit=20,
             whitelist_file=None,
+            aws_ip_ranges_file=None,
             dry_run=True,
             debug=False
         )
@@ -55,11 +62,13 @@ def test_filters_old_requests_from_log_file(self, mock_boto_client):
 
         result = blocker._download_and_parse_log("test-bucket", "test-key")
 
-        # Should only return the recent IP (5.6.7.8), not the old one (1.2.3.4)
-        self.assertEqual(result, ["5.6.7.8"],
-                        f"Expected only recent IP, got: {result}")
-        self.assertNotIn("1.2.3.4", result,
-                        "Old request (2h ago) should be filtered out")
+        # Extract just the IPs from the tuples (ip, ip_version)
+        result_ips = [ip for ip, _ in result]
+
+        # Both IPs should be processed (filtering happens at file level, not entry level)
+        self.assertEqual(len(result_ips), 2, f"Expected 2 IPs, got: {result_ips}")
+        self.assertIn("1.2.3.4", result_ips)
+        self.assertIn("5.6.7.8", result_ips)
 
     @patch('auto_block_attackers.boto3.client')
     def test_processes_all_requests_if_within_window(self, mock_boto_client):
@@ -91,6 +100,7 @@ def test_processes_all_requests_if_within_window(self, mock_boto_client):
             start_rule=80,
             limit=20,
             whitelist_file=None,
+            aws_ip_ranges_file=None,
             dry_run=True,
             debug=False
         )
@@ -98,11 +108,14 @@ def test_processes_all_requests_if_within_window(self, mock_boto_client):
 
         result = blocker._download_and_parse_log("test-bucket", "test-key")
 
+        # Extract just the IPs from the tuples (ip, ip_version)
+        result_ips = [ip for ip, _ in result]
+
         # All three should be included
-        self.assertEqual(len(result), 3, f"Expected 3 IPs, got {len(result)}: {result}")
-        self.assertIn("1.1.1.1", result)
-        self.assertIn("2.2.2.2", result)
-        self.assertIn("3.3.3.3", result)
+        self.assertEqual(len(result_ips), 3, f"Expected 3 IPs, got {len(result_ips)}: {result_ips}")
+        self.assertIn("1.1.1.1", result_ips)
+        self.assertIn("2.2.2.2", result_ips)
+        self.assertIn("3.3.3.3", result_ips)
 
     @patch('auto_block_attackers.boto3.client')
     def test_handles_malformed_timestamps_gracefully(self, mock_boto_client):
@@ -130,6 +143,7 @@ def test_handles_malformed_timestamps_gracefully(self, mock_boto_client):
             start_rule=80,
             limit=20,
             whitelist_file=None,
+            aws_ip_ranges_file=None,
             dry_run=True,
             debug=False
         )
@@ -138,8 +152,10 @@ def test_handles_malformed_timestamps_gracefully(self, mock_boto_client):
         # Should not crash, should process the line anyway
         try:
             result = blocker._download_and_parse_log("test-bucket", "test-key")
+            # Extract just the IPs from the tuples (ip, ip_version)
+            result_ips = [ip for ip, _ in result]
             # Should still detect the malicious pattern
-            self.assertIn("1.2.3.4", result,
+            self.assertIn("1.2.3.4", result_ips,
                          "Should process lines with malformed timestamps")
         except Exception as e:
             self.fail(f"Should handle malformed timestamps gracefully: {e}")