From 8639e2d9fc2e01e8936e46795099b43eebe33a08 Mon Sep 17 00:00:00 2001 From: Nitin Ahuja Date: Fri, 9 Jan 2026 14:28:21 -0800 Subject: [PATCH 1/5] Add DocumentDB functional testing framework - Implement complete test framework with pytest - 36 tests covering find, aggregate, and insert operations - Multi-engine support with custom connection strings - Automatic test isolation and cleanup - Tag-based test organization and filtering - Parallel execution support with pytest-xdist - Add smart result analyzer - Automatic marker detection using heuristics - Filters test names, file names, and engine names - Categorizes failures: PASS/FAIL/UNSUPPORTED/INFRA_ERROR - CLI tool: docdb-analyze with text and JSON output - Configure development tools - Black for code formatting - isort for import sorting - flake8 for linting - mypy for type checking - pytest-cov for coverage reporting - Add comprehensive documentation - README with usage examples and best practices - CONTRIBUTING guide for writing tests - result_analyzer/README explaining analyzer behavior - All code formatted and linted - Add Docker support - Dockerfile for containerized testing - .dockerignore for clean builds Test Results: All 36 tests passed (100%) against DocumentDB --- .dockerignore | 53 ++++ .flake8 | 12 + .gitignore | 3 + CONTRIBUTING.md | 291 +++++++++++++++++++ Dockerfile | 42 +++ README.md | 374 ++++++++++++++++++++++++- conftest.py | 159 +++++++++++ pyproject.toml | 36 +++ pytest.ini | 51 ++++ requirements-dev.txt | 11 + requirements.txt | 14 + result_analyzer/README.md | 88 ++++++ result_analyzer/__init__.py | 11 + result_analyzer/analyzer.py | 251 +++++++++++++++++ result_analyzer/cli.py | 124 ++++++++ result_analyzer/report_generator.py | 134 +++++++++ setup.py | 39 +++ tests/__init__.py | 5 + tests/aggregate/__init__.py | 1 + tests/aggregate/test_group_stage.py | 128 +++++++++ tests/aggregate/test_match_stage.py | 87 ++++++ tests/common/__init__.py | 1 + tests/common/assertions.py | 103 +++++++ tests/find/__init__.py | 1 + tests/find/test_basic_queries.py | 136 +++++++++ tests/find/test_projections.py | 117 ++++++++ tests/find/test_query_operators.py | 158 +++++++++++ tests/insert/__init__.py | 1 + tests/insert/test_insert_operations.py | 145 ++++++++++ 29 files changed, 2574 insertions(+), 2 deletions(-) create mode 100644 .dockerignore create mode 100644 .flake8 create mode 100644 CONTRIBUTING.md create mode 100644 Dockerfile create mode 100644 conftest.py create mode 100644 pyproject.toml create mode 100644 pytest.ini create mode 100644 requirements-dev.txt create mode 100644 requirements.txt create mode 100644 result_analyzer/README.md create mode 100644 result_analyzer/__init__.py create mode 100644 result_analyzer/analyzer.py create mode 100644 result_analyzer/cli.py create mode 100644 result_analyzer/report_generator.py create mode 100644 setup.py create mode 100644 tests/__init__.py create mode 100644 tests/aggregate/__init__.py create mode 100644 tests/aggregate/test_group_stage.py create mode 100644 tests/aggregate/test_match_stage.py create mode 100644 tests/common/__init__.py create mode 100644 tests/common/assertions.py create mode 100644 tests/find/__init__.py create mode 100644 tests/find/test_basic_queries.py create mode 100644 tests/find/test_projections.py create mode 100644 tests/find/test_query_operators.py create mode 100644 tests/insert/__init__.py create mode 100644 tests/insert/test_insert_operations.py diff --git a/.dockerignore b/.dockerignore new file mode 100644 index 0000000..ca0dc97 --- 
/dev/null +++ b/.dockerignore @@ -0,0 +1,53 @@ +# Python +__pycache__/ +*.py[cod] +*$py.class +*.so +.Python +*.egg-info/ +dist/ +build/ +.pytest_cache/ +.coverage +htmlcov/ + +# Virtual environments +venv/ +env/ +ENV/ + +# IDE +.vscode/ +.idea/ +*.swp +*.swo +*~ + +# Git +.git/ +.gitignore +.gitattributes + +# Documentation +docs/ +*.md +!README.md + +# Test results +.test-results/ +test-results/ +*.log + +# Development files +requirements-dev.txt +.flake8 +.mypy.ini + +# CI/CD +.github/ +.gitlab-ci.yml +.circleci/ + +# OS +.DS_Store +Thumbs.db diff --git a/.flake8 b/.flake8 new file mode 100644 index 0000000..95b9a60 --- /dev/null +++ b/.flake8 @@ -0,0 +1,12 @@ +[flake8] +max-line-length = 100 +extend-ignore = E203, W503 +exclude = + .git, + __pycache__, + .venv, + venv, + build, + dist, + .eggs, + *.egg-info diff --git a/.gitignore b/.gitignore index b7faf40..f2a869e 100644 --- a/.gitignore +++ b/.gitignore @@ -205,3 +205,6 @@ cython_debug/ marimo/_static/ marimo/_lsp/ __marimo__/ + +# Test results directory +.test-results/ diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md new file mode 100644 index 0000000..d8e5637 --- /dev/null +++ b/CONTRIBUTING.md @@ -0,0 +1,291 @@ +# Contributing to DocumentDB Functional Tests + +Thank you for your interest in contributing to the DocumentDB Functional Tests! This document provides guidelines for contributing to the project. + +## Getting Started + +### Prerequisites + +- Python 3.9 or higher +- Git +- Access to a DocumentDB or MongoDB instance for testing + +### Development Setup + +1. Fork the repository on GitHub +2. Clone your fork locally: + ```bash + git clone https://github.com/YOUR_USERNAME/functional-tests.git + cd functional-tests + ``` + +3. Install development dependencies: + ```bash + pip install -r requirements-dev.txt + ``` + +4. Create a branch for your changes: + ```bash + git checkout -b feature/your-feature-name + ``` + +## Writing Tests + +### Test File Organization + +- Place tests in the appropriate directory based on the operation being tested +- Use descriptive file names: `test_.py` +- Group related tests in the same file + +### Test Structure + +Every test should follow this structure: + +```python +import pytest +from tests.common.assertions import assert_document_match + +@pytest.mark. # Required: e.g., find, insert, aggregate +@pytest.mark. # Optional: e.g., rbac, decimal128 +@pytest.mark.documents([ # Optional: test data + {"name": "Alice", "age": 30} +]) +def test_descriptive_name(collection): + """ + Clear description of what this test validates. 
+ + This should explain: + - What feature/behavior is being tested + - Expected outcome + - Any special conditions or edge cases + """ + # Setup (if needed beyond @pytest.mark.documents) + + # Execute the operation being tested + result = collection.find({"name": "Alice"}) + + # Assert expected behavior + assert len(list(result)) == 1 +``` + +### Naming Conventions + +- **Test functions**: `test_` + - Good: `test_find_with_gt_operator` + - Bad: `test_1`, `test_query` + +- **Test files**: `test_.py` + - Good: `test_query_operators.py` + - Bad: `tests.py`, `test.py` + +### Required Tags + +Every test MUST have at least one horizontal tag (operation): +- `@pytest.mark.find` +- `@pytest.mark.insert` +- `@pytest.mark.update` +- `@pytest.mark.delete` +- `@pytest.mark.aggregate` +- `@pytest.mark.index` +- `@pytest.mark.admin` +- `@pytest.mark.collection_mgmt` + +### Optional Tags + +Add vertical tags for cross-cutting features: +- `@pytest.mark.rbac` - Role-based access control +- `@pytest.mark.decimal128` - Decimal128 data type +- `@pytest.mark.collation` - Collation/sorting +- `@pytest.mark.transactions` - Transactions +- `@pytest.mark.geospatial` - Geospatial queries +- `@pytest.mark.text_search` - Text search +- `@pytest.mark.validation` - Schema validation +- `@pytest.mark.ttl` - Time-to-live indexes + +Add special tags when appropriate: +- `@pytest.mark.smoke` - Quick smoke tests +- `@pytest.mark.slow` - Tests taking > 5 seconds + +### Using Fixtures + +The framework provides three main fixtures: + +1. **engine_client**: Raw MongoDB client + ```python + def test_with_client(engine_client): + db = engine_client.test_db + collection = db.test_collection + # ... test code + ``` + +2. **database_client**: Database with automatic cleanup + ```python + def test_with_database(database_client): + collection = database_client.my_collection + # ... test code + # Database automatically dropped after test + ``` + +3. **collection**: Collection with automatic data setup and cleanup + ```python + @pytest.mark.documents([{"name": "Alice"}]) + def test_with_collection(collection): + # Documents already inserted + result = collection.find_one({"name": "Alice"}) + # ... assertions + # Collection automatically dropped after test + ``` + +### Custom Assertions + +Use the provided assertion helpers for common scenarios: + +```python +from tests.common.assertions import ( + assert_document_match, + assert_documents_match, + assert_field_exists, + assert_field_not_exists, + assert_count +) + +# Good: Use custom assertions +assert_document_match(actual, expected, ignore_id=True) +assert_count(collection, {"status": "active"}, 5) + +# Avoid: Manual comparison that's verbose +actual_doc = {k: v for k, v in actual.items() if k != "_id"} +expected_doc = {k: v for k, v in expected.items() if k != "_id"} +assert actual_doc == expected_doc +``` + +## Code Quality + +### Before Submitting + +Run these commands to ensure code quality: + +```bash +# Format code +black . + +# Sort imports +isort . + +# Run linter +flake8 + +# Type checking (optional but recommended) +mypy . 
+ +# Run tests +pytest +``` + +### Code Style + +- Follow PEP 8 style guidelines +- Use meaningful variable names +- Add docstrings to test functions +- Keep test functions focused on a single behavior +- Avoid complex logic in tests + +## Testing Your Changes + +### Run Tests Locally + +```bash +# Run all tests +pytest + +# Run specific test file +pytest tests/find/test_basic_queries.py + +# Run specific test +pytest tests/find/test_basic_queries.py::test_find_all_documents + +# Run with your changes only +pytest -m "your_new_tag" +``` + +### Test Against Multiple Engines + +```bash +# Test against both DocumentDB and MongoDB +pytest --engine documentdb=mongodb://localhost:27017 \ + --engine mongodb=mongodb://mongo:27017 +``` + +## Submitting Changes + +### Pull Request Process + +1. Ensure your code follows the style guidelines +2. Add tests for new functionality +3. Update documentation if needed +4. Commit with clear, descriptive messages: + ```bash + git commit -m "Add tests for $group stage with $avg operator" + ``` + +5. Push to your fork: + ```bash + git push origin feature/your-feature-name + ``` + +6. Create a Pull Request on GitHub + +### Pull Request Guidelines + +Your PR should: +- Have a clear title describing the change +- Include a description explaining: + - What the change does + - Why it's needed + - How to test it +- Reference any related issues +- Pass all CI checks + +### Commit Message Guidelines + +- Use present tense: "Add test" not "Added test" +- Be descriptive but concise +- Reference issues: "Fix #123: Add validation tests" + +## Adding New Test Categories + +If you're adding tests for a new feature area: + +1. Create a new directory under `tests/`: + ```bash + mkdir tests/update + ``` + +2. Add `__init__.py`: + ```python + """Update operation tests.""" + ``` + +3. Create test files following naming conventions + +4. Add appropriate markers to `pytest.ini`: + ```ini + markers = + update: Update operation tests + ``` + +5. Update documentation in README.md + +## Questions? + +- Open an issue for questions about contributing +- Check existing tests for examples +- Review the RFC document for framework design + +## Code of Conduct + +This project follows the Contributor Covenant Code of Conduct. By participating, you are expected to uphold this code. + +## License + +By contributing, you agree that your contributions will be licensed under the MIT License. diff --git a/Dockerfile b/Dockerfile new file mode 100644 index 0000000..9fc7292 --- /dev/null +++ b/Dockerfile @@ -0,0 +1,42 @@ +# Multi-stage build for DocumentDB Functional Tests + +# Stage 1: Build stage +FROM python:3.11-slim as builder + +WORKDIR /build + +# Copy requirements +COPY requirements.txt . + +# Install dependencies +RUN pip install --no-cache-dir --user -r requirements.txt + +# Stage 2: Runtime stage +FROM python:3.11-slim + +# Set working directory +WORKDIR /app + +# Copy installed packages from builder +COPY --from=builder /root/.local /root/.local + +# Copy application code +COPY tests/ tests/ +COPY result_analyzer/ result_analyzer/ +COPY conftest.py . +COPY pytest.ini . +COPY setup.py . 
+ +# Ensure scripts are in PATH +ENV PATH=/root/.local/bin:$PATH + +# Create directory for test results +RUN mkdir -p .test-results + +# Set Python to run unbuffered (so logs appear immediately) +ENV PYTHONUNBUFFERED=1 + +# Default command: run all tests +# Users can override with command line arguments +ENTRYPOINT ["pytest"] +CMD ["--help"] diff --git a/README.md b/README.md index dcdb725..6db5fa9 100644 --- a/README.md +++ b/README.md @@ -1,2 +1,372 @@ -# functional-tests -End-to-end functional testing framework for DocumentDB using pytest +# DocumentDB Functional Tests + +End-to-end functional testing framework for DocumentDB using pytest. This framework validates DocumentDB functionality against specifications through comprehensive test suites. + +## Overview + +This testing framework provides: + +- **Specification-based Testing**: Tests define explicit expected behavior for DocumentDB features +- **Multi-Engine Support**: Run the same tests against DocumentDB, MongoDB, and other compatible engines +- **Parallel Execution**: Fast test execution using pytest-xdist +- **Tag-Based Organization**: Flexible test filtering using pytest markers +- **Result Analysis**: Automatic categorization and reporting of test results + +## Quick Start + +### Prerequisites + +- Python 3.9 or higher +- Access to a DocumentDB or MongoDB instance +- pip package manager + +### Installation + +```bash +# Clone the repository +git clone https://github.com/documentdb/functional-tests.git +cd functional-tests + +# Install dependencies +pip install -r requirements.txt +``` + +### Running Tests + +#### Basic Usage + +```bash +# Run all tests against default localhost +pytest + +# Run against specific engine +pytest --engine documentdb=mongodb://localhost:27017 + +# Run against multiple engines +pytest --engine documentdb=mongodb://localhost:27017 \ + --engine mongodb=mongodb://mongo:27017 +``` + +#### Filter by Tags + +```bash +# Run only find operation tests +pytest -m find + +# Run smoke tests +pytest -m smoke + +# Run find tests with RBAC +pytest -m "find and rbac" + +# Exclude slow tests +pytest -m "not slow" +``` + +#### Parallel Execution + +The framework supports parallel test execution using pytest-xdist, which can significantly reduce test execution time. 
+ +```bash +# Run with 4 parallel processes +pytest -n 4 + +# Auto-detect number of CPUs (recommended) +pytest -n auto + +# Combine with other options +pytest -n auto -m smoke --engine documentdb=mongodb://localhost:27017 +``` + +**Performance Benefits:** +- Significantly faster test execution with multiple workers +- Scales with number of available CPU cores +- Particularly effective for large test suites + +**Best Practices:** +- Use `-n auto` to automatically detect optimal worker count +- Parallel execution works best with 4+ workers +- Each worker runs tests in isolation (separate database/collection) +- Safe for tests with automatic cleanup (all framework tests are safe) + +**When to Use:** +- Large test suites +- Local development for quick validation + +**Example with full options:** +```bash +pytest -n 4 \ + --engine documentdb=mongodb://localhost:27017 \ + -m "find or aggregate" \ + -v \ + --json-report --json-report-file=results.json +``` + +#### Output Formats + +```bash +# Generate JSON report +pytest --json-report --json-report-file=results.json + +# Generate JUnit XML +pytest --junitxml=results.xml + +# Verbose output +pytest -v + +# Show local variables on failure +pytest -l +``` + +## Docker Usage + +### Build the Image + +```bash +docker build -t documentdb/functional-tests . +``` + +### Run Tests in Container + +```bash +# Run against DocumentDB +docker run --network host \ + documentdb/functional-tests \ + --engine documentdb=mongodb://localhost:27017 + +# Run specific tags +docker run documentdb/functional-tests \ + --engine documentdb=mongodb://cluster.docdb.amazonaws.com:27017 \ + -m smoke + +# Run with parallel execution +docker run documentdb/functional-tests \ + --engine documentdb=mongodb://localhost:27017 \ + -n 4 +``` + +## Test Organization + +Tests are organized by API operations with cross-cutting feature tags: + +``` +tests/ +├── find/ # Find operation tests +│ ├── test_basic_queries.py +│ ├── test_query_operators.py +│ └── test_projections.py +├── aggregate/ # Aggregation tests +│ ├── test_match_stage.py +│ └── test_group_stage.py +├── insert/ # Insert operation tests +│ └── test_insert_operations.py +└── common/ # Shared utilities + └── assertions.py +``` + +## Test Tags + +### Horizontal Tags (API Operations) +- `find`: Find operation tests +- `insert`: Insert operation tests +- `update`: Update operation tests +- `delete`: Delete operation tests +- `aggregate`: Aggregation pipeline tests +- `index`: Index management tests +- `admin`: Administrative command tests +- `collection_mgmt`: Collection management tests + +### Vertical Tags (Cross-cutting Features) +- `rbac`: Role-based access control tests +- `decimal128`: Decimal128 data type tests +- `collation`: Collation and sorting tests +- `transactions`: Transaction tests +- `geospatial`: Geospatial query tests +- `text_search`: Text search tests +- `validation`: Schema validation tests +- `ttl`: Time-to-live index tests + +### Special Tags +- `smoke`: Quick smoke tests for feature detection +- `slow`: Tests that take longer to execute + +## Writing Tests + +### Basic Test Structure + +```python +import pytest +from tests.common.assertions import assert_document_match + +@pytest.mark.find # Required: operation tag +@pytest.mark.smoke # Optional: additional tags +@pytest.mark.documents([ # Optional: test data + {"name": "Alice", "age": 30}, + {"name": "Bob", "age": 25} +]) +def test_find_with_filter(collection): + """Test description.""" + # Execute operation + result = list(collection.find({"age": 
{"$gt": 25}})) + + # Verify results + assert len(result) == 1 + assert_document_match(result[0], {"name": "Alice", "age": 30}) +``` + +### Test Fixtures + +- `engine_client`: MongoDB client for the engine +- `database_client`: Database with automatic cleanup +- `collection`: Collection with automatic test data setup and cleanup + +### Custom Assertions + +```python +from tests.common.assertions import ( + assert_document_match, + assert_documents_match, + assert_field_exists, + assert_field_not_exists, + assert_count +) + +# Compare documents ignoring _id +assert_document_match(actual, expected, ignore_id=True) + +# Compare lists of documents +assert_documents_match(actual_list, expected_list, ignore_order=True) + +# Check field existence +assert_field_exists(document, "user.name") +assert_field_not_exists(document, "password") + +# Count documents matching filter +assert_count(collection, {"status": "active"}, 5) +``` + +## Result Analysis + +The framework includes a command-line tool to analyze test results and generate detailed reports categorized by feature tags. + +### Installation + +```bash +# Install the package to get the CLI tool +pip install -e . +``` + +### CLI Tool Usage + +```bash +# Analyze default report location +docdb-analyze + +# Analyze specific report +docdb-analyze --input custom-results.json + +# Generate text report +docdb-analyze --output report.txt --format text + +# Generate JSON analysis +docdb-analyze --output analysis.json --format json + +# Quiet mode (only write to file, no console output) +docdb-analyze --output report.txt --quiet + +# Get help +docdb-analyze --help +``` + +### Programmatic Usage + +You can also use the result analyzer as a Python library: + +```python +from result_analyzer import analyze_results, generate_report, print_summary + +# Analyze JSON report +analysis = analyze_results(".test-results/report.json") + +# Print summary to console +print_summary(analysis) + +# Generate text report +generate_report(analysis, "report.txt", format="text") + +# Generate JSON report +generate_report(analysis, "report.json", format="json") +``` + +### Failure Categories + +Tests are automatically categorized into: +- **PASS**: Test succeeded, behavior matches specification +- **FAIL**: Test failed, feature exists but behaves incorrectly +- **UNSUPPORTED**: Feature not implemented +- **INFRA_ERROR**: Infrastructure issue (connection, timeout, etc.) + +### Example Workflow + +```bash +# Run tests with JSON report +pytest --engine documentdb=mongodb://localhost:27017 \ + --json-report --json-report-file=.test-results/report.json + +# Analyze results +docdb-analyze + +# Generate detailed text report +docdb-analyze --output detailed-report.txt --format text + +# Generate JSON for further processing +docdb-analyze --output analysis.json --format json +``` + +## Development + +### Install Development Dependencies + +```bash +pip install -r requirements-dev.txt +``` + +### Code Quality + +```bash +# Format code +black . + +# Sort imports +isort . + +# Lint +flake8 + +# Type checking +mypy . +``` + +### Run Tests with Coverage + +```bash +pytest --cov=. --cov-report=html +``` + +## Contributing + +1. Fork the repository +2. Create a feature branch +3. Write tests following the test structure guidelines +4. Ensure tests pass locally +5. Submit a pull request + +## License + +This project is licensed under the MIT License - see the [LICENSE](LICENSE) file for details. 
+ +## Support + +For issues and questions: +- GitHub Issues: https://github.com/documentdb/functional-tests/issues +- Documentation: https://github.com/documentdb/functional-tests/docs diff --git a/conftest.py b/conftest.py new file mode 100644 index 0000000..422e021 --- /dev/null +++ b/conftest.py @@ -0,0 +1,159 @@ +""" +Global pytest fixtures for functional testing framework. + +This module provides fixtures for: +- Engine parametrization +- Database connection management +- Test isolation +""" + + +import pytest +from pymongo import MongoClient + + +def pytest_addoption(parser): + """Add custom command-line options for pytest.""" + parser.addoption( + "--engine", + action="append", + default=[], + help="Engine to test against. Format: name=connection_string. " + "Example: --engine documentdb=mongodb://localhost:27017 " + "--engine mongodb=mongodb://mongo:27017", + ) + + +def pytest_configure(config): + """Configure pytest with custom settings.""" + # Parse engine configurations + engines = {} + for engine_spec in config.getoption("--engine"): + if "=" not in engine_spec: + raise ValueError( + f"Invalid engine specification: {engine_spec}. " + "Expected format: name=connection_string" + ) + name, connection_string = engine_spec.split("=", 1) + engines[name] = connection_string + + # Store in config for access by fixtures + config.engines = engines + + # If no engines specified, default to localhost + if not engines: + config.engines = {"default": "mongodb://localhost:27017"} + + +def pytest_generate_tests(metafunc): + """ + Parametrize tests to run against multiple engines. + + Tests that use the 'engine_client' fixture will automatically + run against all configured engines. + """ + if "engine_client" in metafunc.fixturenames: + engines = metafunc.config.engines + metafunc.parametrize( + "engine_name,engine_connection_string", + [(name, conn) for name, conn in engines.items()], + ids=list(engines.keys()), + scope="function", + ) + + +@pytest.fixture(scope="function") +def engine_client(engine_name, engine_connection_string): + """ + Create a MongoDB client for the specified engine. + + This fixture is parametrized to run tests against all configured engines. + + Args: + engine_name: Name of the engine (from --engine option) + engine_connection_string: Connection string for the engine + + Yields: + MongoClient: Connected MongoDB client + """ + client = MongoClient(engine_connection_string) + + # Verify connection + try: + client.admin.command("ping") + except Exception as e: + pytest.skip(f"Cannot connect to {engine_name}: {e}") + + yield client + + # Cleanup: close connection + client.close() + + +@pytest.fixture(scope="function") +def database_client(engine_client, request): + """ + Provide a database client with automatic cleanup. + + Creates a test database named after the test function for isolation. + Automatically drops the database after the test completes. 
+ + Args: + engine_client: MongoDB client from engine_client fixture + request: pytest request object + + Yields: + Database: MongoDB database object + """ + # Create unique database name based on test name + test_name = request.node.name.replace("[", "_").replace("]", "_") + db_name = f"test_{test_name}"[:63] # MongoDB database name limit + + db = engine_client[db_name] + + yield db + + # Cleanup: drop test database + try: + engine_client.drop_database(db_name) + except Exception: + pass # Best effort cleanup + + +@pytest.fixture(scope="function") +def collection(database_client, request): + """ + Provide a collection with automatic test data setup and cleanup. + + If the test is marked with @pytest.mark.documents([...]), this fixture + will automatically insert those documents before the test runs. + + Args: + database_client: Database from database_client fixture + request: pytest request object + + Yields: + Collection: MongoDB collection object + """ + # Use test name as collection name for isolation + collection_name = request.node.name.replace("[", "_").replace("]", "_")[:100] + coll = database_client[collection_name] + + # Check if test has @pytest.mark.documents decorator + marker = request.node.get_closest_marker("documents") + if marker and marker.args: + documents = marker.args[0] + if documents: + coll.insert_many(documents) + + yield coll + + # Cleanup: drop collection + try: + coll.drop() + except Exception: + pass # Best effort cleanup + + +# Custom marker for test data setup +pytest.mark.documents = pytest.mark.documents diff --git a/pyproject.toml b/pyproject.toml new file mode 100644 index 0000000..905e866 --- /dev/null +++ b/pyproject.toml @@ -0,0 +1,36 @@ +[tool.black] +line-length = 100 +target-version = ['py39', 'py310', 'py311'] +include = '\.pyi?$' +extend-exclude = ''' +/( + # directories + \.eggs + | \.git + | \.venv + | venv + | build + | dist +)/ +''' + +[tool.isort] +profile = "black" +line_length = 100 +skip_gitignore = true + +[tool.mypy] +python_version = "3.9" +warn_return_any = true +warn_unused_configs = true +disallow_untyped_defs = false +ignore_missing_imports = true +exclude = [ + 'venv', + '.venv', + 'build', + 'dist', +] + +[tool.pytest.ini_options] +# Already in pytest.ini, keeping this for reference diff --git a/pytest.ini b/pytest.ini new file mode 100644 index 0000000..3cc2c44 --- /dev/null +++ b/pytest.ini @@ -0,0 +1,51 @@ +[pytest] +# Test discovery +testpaths = tests +python_files = test_*.py +python_classes = Test* +python_functions = test_* + +# Output options +addopts = + -v + --strict-markers + --tb=short + --color=yes + +# Markers for test categorization +markers = + # Horizontal tags (API Operations) + find: Find operation tests + insert: Insert operation tests + update: Update operation tests + delete: Delete operation tests + aggregate: Aggregation pipeline tests + index: Index management tests + admin: Administrative command tests + collection_mgmt: Collection management tests + + # Vertical tags (Cross-cutting Features) + rbac: Role-based access control tests + decimal128: Decimal128 data type tests + collation: Collation and sorting tests + transactions: Transaction tests + geospatial: Geospatial query tests + text_search: Text search tests + validation: Schema validation tests + ttl: Time-to-live index tests + + # Special markers + smoke: Quick smoke tests for feature detection + slow: Tests that take longer to execute + +# Timeout for tests (seconds) +timeout = 300 + +# Parallel execution settings +# Use with: pytest -n auto +# 
Or: pytest -n 4 (for 4 processes) + +# JSON report configuration +json_report = .test-results/report.json +json_report_indent = 2 +json_report_omit = log diff --git a/requirements-dev.txt b/requirements-dev.txt new file mode 100644 index 0000000..e8f0654 --- /dev/null +++ b/requirements-dev.txt @@ -0,0 +1,11 @@ +# Development dependencies +-r requirements.txt + +# Code quality +black>=23.7.0 # Code formatting +flake8>=6.1.0 # Linting +mypy>=1.5.0 # Type checking +isort>=5.12.0 # Import sorting + +# Testing +pytest-cov>=4.1.0 # Coverage reporting diff --git a/requirements.txt b/requirements.txt new file mode 100644 index 0000000..0577522 --- /dev/null +++ b/requirements.txt @@ -0,0 +1,14 @@ +# Core testing dependencies +pytest>=7.4.0 +pytest-xdist>=3.3.0 # Parallel test execution +pytest-json-report>=1.5.0 # JSON output format +pytest-timeout>=2.1.0 # Test timeout support + +# Database connectivity +pymongo>=4.5.0 + +# Configuration management +pyyaml>=6.0 + +# Reporting +jinja2>=3.1.2 # Template rendering for reports diff --git a/result_analyzer/README.md b/result_analyzer/README.md new file mode 100644 index 0000000..151882b --- /dev/null +++ b/result_analyzer/README.md @@ -0,0 +1,88 @@ +# Result Analyzer + +The Result Analyzer automatically processes pytest JSON reports and categorizes results by meaningful test markers. + +## Features + +- **Automatic Marker Detection**: Uses heuristics to identify meaningful test markers +- **Smart Filtering**: Automatically excludes test names, file names, and internal markers +- **Flexible**: Supports new markers without code changes +- **CLI Tool**: `docdb-analyze` command for quick analysis + +## Marker Detection + +The analyzer automatically identifies meaningful markers by excluding: + +### Excluded by Pattern +- **Test function names**: Any marker containing `[` or starting with `test_` +- **File names**: Any marker containing `.py` or `/` +- **Directory names**: Common names like `tests`, `functional-tests`, `src`, `lib` + +### Excluded by Name +- **Pytest internal**: `parametrize`, `usefixtures`, `filterwarnings`, `pytestmark` +- **Fixture markers**: `documents` (used for test data setup) +- **Engine names**: `documentdb`, `mongodb`, `cosmosdb`, `default` (from parametrization) + +### Result +Only meaningful categorization markers remain: +- Horizontal tags: `find`, `insert`, `update`, `delete`, `aggregate`, `index`, `admin`, `collection_mgmt` +- Vertical tags: `rbac`, `decimal128`, `collation`, `transactions`, `geospatial`, `text_search`, `validation`, `ttl` +- Special tags: `smoke`, `slow` + +## Adding New Markers + +Simply add the marker to `pytest.ini` and use it in your tests: + +```python +@pytest.mark.mynewfeature +def test_something(): + pass +``` + +The analyzer will automatically detect and report on it - no code changes needed! + +## Failure Categorization + +Tests are categorized into four types: + +1. **PASS**: Test succeeded +2. **FAIL**: Test failed, feature exists but behaves incorrectly +3. **UNSUPPORTED**: Feature not implemented (skipped tests) +4. **INFRA_ERROR**: Infrastructure issue (connection, timeout, etc.) 
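+
+The categorization is driven by the `categorize_failure` helper, which can also be called directly. A minimal sketch (the dictionaries below imitate individual test entries from a pytest JSON report):
+
+```python
+from result_analyzer import categorize_failure
+
+# Skipped tests are reported as unsupported features
+categorize_failure({"outcome": "skipped"})                      # -> "UNSUPPORTED"
+
+# Failures whose traceback mentions a connection problem count as infrastructure errors
+categorize_failure({
+    "outcome": "failed",
+    "call": {"longrepr": "ServerSelectionTimeoutError: connection refused"},
+})                                                              # -> "INFRA_ERROR"
+
+# Any other failure is a functional failure of the feature under test
+categorize_failure({
+    "outcome": "failed",
+    "call": {"longrepr": "AssertionError: Expected 2 documents"},
+})                                                              # -> "FAIL"
+```
+
+Note that the infrastructure check is a keyword match on the failure text (e.g. `connection`, `timeout`, `refused`), so the wording of custom error messages can influence the category.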
+ +## Usage + +### CLI +```bash +# Quick analysis +docdb-analyze + +# Custom input/output +docdb-analyze --input results.json --output report.txt +``` + +### Programmatic +```python +from result_analyzer import analyze_results, generate_report + +analysis = analyze_results("report.json") +generate_report(analysis, "report.txt", format="text") +``` + +## Maintenance + +The heuristic-based approach means: +- ✅ **No maintenance** for new test markers +- ✅ **Automatic adaptation** to new patterns +- ⚠️ **May need updates** if new fixture patterns emerge (e.g., new engine names) + +To add a new fixture marker or engine name to exclude, update the filter in `analyzer.py`: + +```python +# Skip fixture markers +if marker in {"documents", "mynewfixture"}: + continue + +# Skip engine names +if marker in {"documentdb", "mongodb", "mynewengine"}: + continue diff --git a/result_analyzer/__init__.py b/result_analyzer/__init__.py new file mode 100644 index 0000000..63faf0a --- /dev/null +++ b/result_analyzer/__init__.py @@ -0,0 +1,11 @@ +""" +Result Analyzer for DocumentDB Functional Tests. + +This module provides tools for analyzing pytest test results and generating +reports categorized by feature tags. +""" + +from .analyzer import analyze_results, categorize_failure +from .report_generator import generate_report, print_summary + +__all__ = ["analyze_results", "categorize_failure", "generate_report", "print_summary"] diff --git a/result_analyzer/analyzer.py b/result_analyzer/analyzer.py new file mode 100644 index 0000000..af2b2a1 --- /dev/null +++ b/result_analyzer/analyzer.py @@ -0,0 +1,251 @@ +""" +Result analyzer for parsing and categorizing test results. + +This module provides functions to analyze pytest JSON output and categorize +test results by tags and failure types. +""" + +import json +from collections import defaultdict +from typing import Any, Dict, List + + +class FailureType: + """Enumeration of failure types.""" + + PASS = "PASS" + FAIL = "FAIL" + UNSUPPORTED = "UNSUPPORTED" + INFRA_ERROR = "INFRA_ERROR" + + +def categorize_failure(test_result: Dict[str, Any]) -> str: + """ + Categorize a test failure based on error information. + + Args: + test_result: Test result dictionary from pytest JSON report + + Returns: + One of: PASS, FAIL, UNSUPPORTED, INFRA_ERROR + """ + outcome = test_result.get("outcome", "") + + if outcome == "passed": + return FailureType.PASS + + if outcome == "skipped": + # Skipped tests typically indicate unsupported features + return FailureType.UNSUPPORTED + + if outcome == "failed": + # Analyze the failure to determine if it's infrastructure or functionality + call_info = test_result.get("call", {}) + longrepr = call_info.get("longrepr", "") + + # Check for infrastructure-related errors + infra_keywords = [ + "connection", + "timeout", + "network", + "cannot connect", + "refused", + "unreachable", + "host", + ] + + if any(keyword in longrepr.lower() for keyword in infra_keywords): + return FailureType.INFRA_ERROR + + # Otherwise, it's a functional failure + return FailureType.FAIL + + # Unknown outcome, treat as infrastructure error + return FailureType.INFRA_ERROR + + +def extract_markers(test_result: Dict[str, Any]) -> List[str]: + """ + Extract pytest markers (tags) from a test result. + + Automatically filters out test names, file names, and pytest internal markers + using heuristics, keeping only meaningful test categorization markers. 
+ + Args: + test_result: Test result dictionary from pytest JSON report + + Returns: + List of marker names + """ + markers = [] + + # Extract from keywords + keywords = test_result.get("keywords", []) + if isinstance(keywords, list): + markers.extend(keywords) + + # Extract from markers field if present + test_markers = test_result.get("markers", []) + if isinstance(test_markers, list): + for marker in test_markers: + if isinstance(marker, dict): + markers.append(marker.get("name", "")) + else: + markers.append(str(marker)) + + # Filter out non-meaningful markers using heuristics + filtered_markers = [] + for marker in markers: + # Skip empty strings + if not marker: + continue + + # Skip if it looks like a test function name (contains brackets or starts with test_) + if "[" in marker or marker.startswith("test_"): + continue + + # Skip if it looks like a file name (contains .py or /) + if ".py" in marker or "/" in marker: + continue + + # Skip if it's a directory name (common directory names) + if marker in {"tests", "functional-tests", "src", "lib"}: + continue + + # Skip pytest internal markers + if marker in {"parametrize", "usefixtures", "filterwarnings", "pytestmark"}: + continue + + # Skip fixture markers (markers used for setup, not categorization) + # These are markers that take arguments in the decorator + if marker in {"documents"}: + continue + + # Skip engine names (from parametrization like [documentdb], [mongodb]) + # Common engine names that appear in test results + if marker in {"documentdb", "mongodb", "cosmosdb", "default"}: + continue + + # If it passed all filters, it's likely a meaningful marker + filtered_markers.append(marker) + + return filtered_markers + + +def analyze_results(json_report_path: str) -> Dict[str, Any]: + """ + Analyze pytest JSON report and generate categorized results. 
+ + Args: + json_report_path: Path to pytest JSON report file + + Returns: + Dictionary containing analysis results with structure: + { + "summary": { + "total": int, + "passed": int, + "failed": int, + "unsupported": int, + "infra_error": int + }, + "by_tag": { + "tag_name": { + "passed": int, + "failed": int, + "unsupported": int, + "infra_error": int, + "pass_rate": float + } + }, + "tests": [ + { + "name": str, + "outcome": str, + "duration": float, + "tags": List[str], + "error": str (optional) + } + ] + } + """ + # Load JSON report + with open(json_report_path, "r") as f: + report = json.load(f) + + # Initialize counters + summary: Dict[str, Any] = { + "total": 0, + "passed": 0, + "failed": 0, + "unsupported": 0, + "infra_error": 0, + } + + by_tag: Dict[str, Dict[str, int]] = defaultdict( + lambda: {"passed": 0, "failed": 0, "unsupported": 0, "infra_error": 0} + ) + + tests_details = [] + + # Process each test + tests = report.get("tests", []) + for test in tests: + summary["total"] += 1 + + # Categorize the result + failure_type = categorize_failure(test) + + # Extract tags + tags = extract_markers(test) + + # Update summary counters + if failure_type == FailureType.PASS: + summary["passed"] += 1 + elif failure_type == FailureType.FAIL: + summary["failed"] += 1 + elif failure_type == FailureType.UNSUPPORTED: + summary["unsupported"] += 1 + elif failure_type == FailureType.INFRA_ERROR: + summary["infra_error"] += 1 + + # Update tag-specific counters + for tag in tags: + if failure_type == FailureType.PASS: + by_tag[tag]["passed"] += 1 + elif failure_type == FailureType.FAIL: + by_tag[tag]["failed"] += 1 + elif failure_type == FailureType.UNSUPPORTED: + by_tag[tag]["unsupported"] += 1 + elif failure_type == FailureType.INFRA_ERROR: + by_tag[tag]["infra_error"] += 1 + + # Store test details + test_detail = { + "name": test.get("nodeid", ""), + "outcome": failure_type, + "duration": test.get("duration", 0), + "tags": tags, + } + + # Add error information if failed + if failure_type in [FailureType.FAIL, FailureType.INFRA_ERROR]: + call_info = test.get("call", {}) + test_detail["error"] = call_info.get("longrepr", "") + + tests_details.append(test_detail) + + # Calculate pass rates for each tag + by_tag_with_rates = {} + for tag, counts in by_tag.items(): + total = counts["passed"] + counts["failed"] + counts["unsupported"] + counts["infra_error"] + pass_rate = (counts["passed"] / total * 100) if total > 0 else 0 + + by_tag_with_rates[tag] = {**counts, "total": total, "pass_rate": round(pass_rate, 2)} + + # Calculate overall pass rate + summary["pass_rate"] = round( + (summary["passed"] / summary["total"] * 100) if summary["total"] > 0 else 0, 2 + ) + + return {"summary": summary, "by_tag": by_tag_with_rates, "tests": tests_details} diff --git a/result_analyzer/cli.py b/result_analyzer/cli.py new file mode 100644 index 0000000..99ccad7 --- /dev/null +++ b/result_analyzer/cli.py @@ -0,0 +1,124 @@ +#!/usr/bin/env python3 +""" +DocumentDB Functional Test Results Analyzer - CLI + +Command-line interface for analyzing pytest JSON reports and generating +categorized results by feature tags. 
+""" + +import argparse +import sys +from pathlib import Path + +from .analyzer import analyze_results +from .report_generator import generate_report, print_summary + + +def main(): + parser = argparse.ArgumentParser( + description="Analyze DocumentDB functional test results and generate reports", + formatter_class=argparse.RawDescriptionHelpFormatter, + epilog=""" +Examples: + # Analyze default report location + %(prog)s + + # Analyze specific report + %(prog)s --input my-results.json + + # Generate text report + %(prog)s --output report.txt --format text + + # Generate JSON analysis + %(prog)s --output analysis.json --format json + + # Quiet mode (no console output) + %(prog)s --output report.txt --quiet + """, + ) + + parser.add_argument( + "-i", + "--input", + default=".test-results/report.json", + help="Path to pytest JSON report file (default: .test-results/report.json)", + ) + + parser.add_argument( + "-o", "--output", help="Path to output report file (if not specified, prints to console)" + ) + + parser.add_argument( + "-f", + "--format", + choices=["text", "json"], + default="text", + help="Output format: text or json (default: text)", + ) + + parser.add_argument( + "-q", + "--quiet", + action="store_true", + help="Suppress console output (only write to output file)", + ) + + parser.add_argument( + "--no-summary", action="store_true", help="Skip printing summary to console" + ) + + args = parser.parse_args() + + # Check if input file exists + input_path = Path(args.input) + if not input_path.exists(): + print(f"Error: Input file not found: {args.input}", file=sys.stderr) + print("\nMake sure to run pytest with --json-report first:", file=sys.stderr) + print(f" pytest --json-report --json-report-file={args.input}", file=sys.stderr) + return 1 + + try: + # Analyze the results + if not args.quiet: + print(f"Analyzing test results from: {args.input}") + + analysis = analyze_results(args.input) + + # Print summary to console (unless quiet or no-summary) + if not args.quiet and not args.no_summary: + print_summary(analysis) + + # Generate output file if specified + if args.output: + generate_report(analysis, args.output, format=args.format) + if not args.quiet: + print(f"\nReport saved to: {args.output}") + + # If no output file and quiet mode, print to stdout + elif not args.quiet: + print("\nResults by Tag:") + print("-" * 60) + for tag, stats in sorted( + analysis["by_tag"].items(), key=lambda x: x[1]["pass_rate"], reverse=True + ): + passed = stats["passed"] + total = stats["total"] + rate = stats["pass_rate"] + print(f"{tag:30s} | {passed:3d}/{total:3d} passed ({rate:5.1f}%)") + + # Return exit code based on test results + if analysis["summary"]["failed"] > 0: + return 1 + return 0 + + except Exception as e: + print(f"Error analyzing results: {e}", file=sys.stderr) + if not args.quiet: + import traceback + + traceback.print_exc() + return 1 + + +if __name__ == "__main__": + sys.exit(main()) diff --git a/result_analyzer/report_generator.py b/result_analyzer/report_generator.py new file mode 100644 index 0000000..c0d2b26 --- /dev/null +++ b/result_analyzer/report_generator.py @@ -0,0 +1,134 @@ +""" +Report generator for creating human-readable reports from analysis results. + +This module provides functions to generate various report formats from +analyzed test results. 
+""" + +import json +from datetime import datetime +from typing import Any, Dict + + +def generate_report(analysis: Dict[str, Any], output_path: str, format: str = "json"): + """ + Generate a report from analysis results. + + Args: + analysis: Analysis results from analyze_results() + output_path: Path to write the report + format: Report format ("json" or "text") + """ + if format == "json": + generate_json_report(analysis, output_path) + elif format == "text": + generate_text_report(analysis, output_path) + else: + raise ValueError(f"Unsupported report format: {format}") + + +def generate_json_report(analysis: Dict[str, Any], output_path: str): + """ + Generate a JSON report. + + Args: + analysis: Analysis results from analyze_results() + output_path: Path to write the JSON report + """ + report = { + "generated_at": datetime.now().isoformat(), + "summary": analysis["summary"], + "by_tag": analysis["by_tag"], + "tests": analysis["tests"], + } + + with open(output_path, "w") as f: + json.dump(report, f, indent=2) + + +def generate_text_report(analysis: Dict[str, Any], output_path: str): + """ + Generate a human-readable text report. + + Args: + analysis: Analysis results from analyze_results() + output_path: Path to write the text report + """ + lines = [] + + # Header + lines.append("=" * 80) + lines.append("DocumentDB Functional Test Results") + lines.append("=" * 80) + lines.append(f"Generated: {datetime.now().strftime('%Y-%m-%d %H:%M:%S')}") + lines.append("") + + # Summary + summary = analysis["summary"] + lines.append("SUMMARY") + lines.append("-" * 80) + lines.append(f"Total Tests: {summary['total']}") + lines.append(f"Passed: {summary['passed']} ({summary['pass_rate']}%)") + lines.append(f"Failed: {summary['failed']}") + lines.append(f"Unsupported: {summary['unsupported']}") + lines.append(f"Infrastructure Errors: {summary['infra_error']}") + lines.append("") + + # Results by tag + lines.append("RESULTS BY TAG") + lines.append("-" * 80) + + if analysis["by_tag"]: + # Sort tags by pass rate (ascending) to highlight problematic areas + sorted_tags = sorted(analysis["by_tag"].items(), key=lambda x: x[1]["pass_rate"]) + + for tag, stats in sorted_tags: + lines.append(f"\n{tag}:") + lines.append(f" Total: {stats['total']}") + lines.append(f" Passed: {stats['passed']} ({stats['pass_rate']}%)") + lines.append(f" Failed: {stats['failed']}") + lines.append(f" Unsupported: {stats['unsupported']}") + lines.append(f" Infra Error: {stats['infra_error']}") + else: + lines.append("No tags found in test results.") + + lines.append("") + + # Failed tests details + failed_tests = [t for t in analysis["tests"] if t["outcome"] == "FAIL"] + if failed_tests: + lines.append("FAILED TESTS") + lines.append("-" * 80) + for test in failed_tests: + lines.append(f"\n{test['name']}") + lines.append(f" Tags: {', '.join(test['tags'])}") + lines.append(f" Duration: {test['duration']:.2f}s") + if "error" in test: + error_preview = test["error"][:200] + lines.append(f" Error: {error_preview}...") + + lines.append("") + lines.append("=" * 80) + + # Write report + with open(output_path, "w") as f: + f.write("\n".join(lines)) + + +def print_summary(analysis: Dict[str, Any]): + """ + Print a brief summary to console. 
+ + Args: + analysis: Analysis results from analyze_results() + """ + summary = analysis["summary"] + print("\n" + "=" * 60) + print("Test Results Summary") + print("=" * 60) + print(f"Total: {summary['total']}") + print(f"Passed: {summary['passed']} ({summary['pass_rate']}%)") + print(f"Failed: {summary['failed']}") + print(f"Unsupported: {summary['unsupported']}") + print(f"Infra Error: {summary['infra_error']}") + print("=" * 60 + "\n") diff --git a/setup.py b/setup.py new file mode 100644 index 0000000..22194cf --- /dev/null +++ b/setup.py @@ -0,0 +1,39 @@ +from setuptools import find_packages, setup + +with open("README.md", "r", encoding="utf-8") as fh: + long_description = fh.read() + +setup( + name="documentdb-functional-tests", + version="0.1.0", + author="DocumentDB Contributors", + description="End-to-end functional testing framework for DocumentDB", + long_description=long_description, + long_description_content_type="text/markdown", + url="https://github.com/documentdb/functional-tests", + packages=find_packages(), + classifiers=[ + "Development Status :: 3 - Alpha", + "Intended Audience :: Developers", + "License :: OSI Approved :: MIT License", + "Programming Language :: Python :: 3", + "Programming Language :: Python :: 3.9", + "Programming Language :: Python :: 3.10", + "Programming Language :: Python :: 3.11", + ], + python_requires=">=3.9", + install_requires=[ + "pytest>=7.4.0", + "pytest-xdist>=3.3.0", + "pytest-json-report>=1.5.0", + "pytest-timeout>=2.1.0", + "pymongo>=4.5.0", + "pyyaml>=6.0", + "jinja2>=3.1.2", + ], + entry_points={ + "console_scripts": [ + "docdb-analyze=result_analyzer.cli:main", + ], + }, +) diff --git a/tests/__init__.py b/tests/__init__.py new file mode 100644 index 0000000..3492497 --- /dev/null +++ b/tests/__init__.py @@ -0,0 +1,5 @@ +""" +DocumentDB Functional Tests + +End-to-end functional testing suite for DocumentDB. +""" diff --git a/tests/aggregate/__init__.py b/tests/aggregate/__init__.py new file mode 100644 index 0000000..1103a4a --- /dev/null +++ b/tests/aggregate/__init__.py @@ -0,0 +1 @@ +"""Aggregation pipeline tests.""" diff --git a/tests/aggregate/test_group_stage.py b/tests/aggregate/test_group_stage.py new file mode 100644 index 0000000..1a51748 --- /dev/null +++ b/tests/aggregate/test_group_stage.py @@ -0,0 +1,128 @@ +""" +Aggregation $group stage tests. + +Tests for the $group stage in aggregation pipelines. 
+""" + +import pytest + + +@pytest.mark.aggregate +@pytest.mark.smoke +@pytest.mark.documents( + [ + {"name": "Alice", "department": "Engineering", "salary": 100000}, + {"name": "Bob", "department": "Engineering", "salary": 90000}, + {"name": "Charlie", "department": "Sales", "salary": 80000}, + {"name": "David", "department": "Sales", "salary": 75000}, + ] +) +def test_group_with_count(collection): + """Test $group stage with count aggregation.""" + # Execute aggregation to count documents by department + pipeline = [{"$group": {"_id": "$department", "count": {"$sum": 1}}}] + result = list(collection.aggregate(pipeline)) + + # Verify results + assert len(result) == 2, "Expected 2 departments" + + # Convert to dict for easier verification + dept_counts = {doc["_id"]: doc["count"] for doc in result} + assert dept_counts["Engineering"] == 2, "Expected 2 employees in Engineering" + assert dept_counts["Sales"] == 2, "Expected 2 employees in Sales" + + +@pytest.mark.aggregate +@pytest.mark.documents( + [ + {"name": "Alice", "department": "Engineering", "salary": 100000}, + {"name": "Bob", "department": "Engineering", "salary": 90000}, + {"name": "Charlie", "department": "Sales", "salary": 80000}, + ] +) +def test_group_with_sum(collection): + """Test $group stage with sum aggregation.""" + # Execute aggregation to sum salaries by department + pipeline = [{"$group": {"_id": "$department", "totalSalary": {"$sum": "$salary"}}}] + result = list(collection.aggregate(pipeline)) + + # Verify results + assert len(result) == 2, "Expected 2 departments" + + # Convert to dict for easier verification + dept_salaries = {doc["_id"]: doc["totalSalary"] for doc in result} + assert dept_salaries["Engineering"] == 190000, "Expected total Engineering salary of 190000" + assert dept_salaries["Sales"] == 80000, "Expected total Sales salary of 80000" + + +@pytest.mark.aggregate +@pytest.mark.documents( + [ + {"name": "Alice", "department": "Engineering", "salary": 100000}, + {"name": "Bob", "department": "Engineering", "salary": 90000}, + {"name": "Charlie", "department": "Sales", "salary": 80000}, + ] +) +def test_group_with_avg(collection): + """Test $group stage with average aggregation.""" + # Execute aggregation to calculate average salary by department + pipeline = [{"$group": {"_id": "$department", "avgSalary": {"$avg": "$salary"}}}] + result = list(collection.aggregate(pipeline)) + + # Verify results + assert len(result) == 2, "Expected 2 departments" + + # Convert to dict for easier verification + dept_avg = {doc["_id"]: doc["avgSalary"] for doc in result} + assert dept_avg["Engineering"] == 95000, "Expected average Engineering salary of 95000" + assert dept_avg["Sales"] == 80000, "Expected average Sales salary of 80000" + + +@pytest.mark.aggregate +@pytest.mark.documents( + [ + {"name": "Alice", "department": "Engineering", "salary": 100000}, + {"name": "Bob", "department": "Engineering", "salary": 90000}, + {"name": "Charlie", "department": "Sales", "salary": 80000}, + ] +) +def test_group_with_min_max(collection): + """Test $group stage with min and max aggregations.""" + # Execute aggregation to find min and max salary by department + pipeline = [ + { + "$group": { + "_id": "$department", + "minSalary": {"$min": "$salary"}, + "maxSalary": {"$max": "$salary"}, + } + } + ] + result = list(collection.aggregate(pipeline)) + + # Verify results + assert len(result) == 2, "Expected 2 departments" + + # Verify Engineering department + eng_dept = next(doc for doc in result if doc["_id"] == "Engineering") + 
assert eng_dept["minSalary"] == 90000, "Expected min Engineering salary of 90000" + assert eng_dept["maxSalary"] == 100000, "Expected max Engineering salary of 100000" + + +@pytest.mark.aggregate +@pytest.mark.documents( + [ + {"item": "A", "quantity": 5}, + {"item": "B", "quantity": 10}, + {"item": "A", "quantity": 3}, + ] +) +def test_group_all_documents(collection): + """Test $group stage grouping all documents (using null as _id).""" + # Execute aggregation to sum quantities across all documents + pipeline = [{"$group": {"_id": None, "totalQuantity": {"$sum": "$quantity"}}}] + result = list(collection.aggregate(pipeline)) + + # Verify results + assert len(result) == 1, "Expected single result grouping all documents" + assert result[0]["totalQuantity"] == 18, "Expected total quantity of 18" diff --git a/tests/aggregate/test_match_stage.py b/tests/aggregate/test_match_stage.py new file mode 100644 index 0000000..886b78e --- /dev/null +++ b/tests/aggregate/test_match_stage.py @@ -0,0 +1,87 @@ +""" +Aggregation $match stage tests. + +Tests for the $match stage in aggregation pipelines. +""" + +import pytest + + +@pytest.mark.aggregate +@pytest.mark.smoke +@pytest.mark.documents( + [ + {"name": "Alice", "age": 30, "status": "active"}, + {"name": "Bob", "age": 25, "status": "active"}, + {"name": "Charlie", "age": 35, "status": "inactive"}, + ] +) +def test_match_simple_filter(collection): + """Test $match stage with simple equality filter.""" + # Execute aggregation with $match stage + pipeline = [{"$match": {"status": "active"}}] + result = list(collection.aggregate(pipeline)) + + # Verify results + assert len(result) == 2, "Expected 2 active users" + names = {doc["name"] for doc in result} + assert names == {"Alice", "Bob"}, "Expected Alice and Bob" + + +@pytest.mark.aggregate +@pytest.mark.documents( + [ + {"name": "Alice", "age": 30}, + {"name": "Bob", "age": 25}, + {"name": "Charlie", "age": 35}, + ] +) +def test_match_with_comparison_operator(collection): + """Test $match stage with comparison operators.""" + # Execute aggregation with $match using $gt + pipeline = [{"$match": {"age": {"$gt": 25}}}] + result = list(collection.aggregate(pipeline)) + + # Verify results + assert len(result) == 2, "Expected 2 users with age > 25" + names = {doc["name"] for doc in result} + assert names == {"Alice", "Charlie"}, "Expected Alice and Charlie" + + +@pytest.mark.aggregate +@pytest.mark.documents( + [ + {"name": "Alice", "age": 30, "city": "NYC"}, + {"name": "Bob", "age": 25, "city": "SF"}, + {"name": "Charlie", "age": 35, "city": "NYC"}, + ] +) +def test_match_multiple_conditions(collection): + """Test $match stage with multiple filter conditions.""" + # Execute aggregation with multiple conditions in $match + pipeline = [{"$match": {"city": "NYC", "age": {"$gte": 30}}}] + result = list(collection.aggregate(pipeline)) + + # Verify results + assert len(result) == 2, "Expected 2 users from NYC with age >= 30" + names = {doc["name"] for doc in result} + assert names == {"Alice", "Charlie"}, "Expected Alice and Charlie" + + +@pytest.mark.aggregate +def test_match_empty_result(collection): + """Test $match stage that matches no documents.""" + # Insert test data + collection.insert_many( + [ + {"name": "Alice", "status": "active"}, + {"name": "Bob", "status": "active"}, + ] + ) + + # Execute aggregation with $match that matches nothing + pipeline = [{"$match": {"status": "inactive"}}] + result = list(collection.aggregate(pipeline)) + + # Verify empty result + assert result == [], "Expected empty 
result when no documents match" diff --git a/tests/common/__init__.py b/tests/common/__init__.py new file mode 100644 index 0000000..b34d9ac --- /dev/null +++ b/tests/common/__init__.py @@ -0,0 +1 @@ +"""Common utilities and helpers for functional tests.""" diff --git a/tests/common/assertions.py b/tests/common/assertions.py new file mode 100644 index 0000000..c6d9e89 --- /dev/null +++ b/tests/common/assertions.py @@ -0,0 +1,103 @@ +""" +Custom assertion helpers for functional tests. + +Provides convenient assertion methods for common test scenarios. +""" + +from typing import Dict, List + + +def assert_document_match(actual: Dict, expected: Dict, ignore_id: bool = True): + """ + Assert that a document matches the expected structure and values. + + Args: + actual: The actual document from the database + expected: The expected document structure + ignore_id: If True, ignore _id field in comparison (default: True) + """ + if ignore_id: + actual = {k: v for k, v in actual.items() if k != "_id"} + expected = {k: v for k, v in expected.items() if k != "_id"} + + assert actual == expected, f"Document mismatch.\nExpected: {expected}\nActual: {actual}" + + +def assert_documents_match( + actual: List[Dict], expected: List[Dict], ignore_id: bool = True, ignore_order: bool = False +): + """ + Assert that a list of documents matches the expected list. + + Args: + actual: List of actual documents from the database + expected: List of expected documents + ignore_id: If True, ignore _id field in comparison (default: True) + ignore_order: If True, sort both lists before comparison (default: False) + """ + if ignore_id: + actual = [{k: v for k, v in doc.items() if k != "_id"} for doc in actual] + expected = [{k: v for k, v in doc.items() if k != "_id"} for doc in expected] + + assert len(actual) == len( + expected + ), f"Document count mismatch. Expected {len(expected)}, got {len(actual)}" + + if ignore_order: + # Sort for comparison + actual = sorted(actual, key=lambda x: str(x)) + expected = sorted(expected, key=lambda x: str(x)) + + for i, (act, exp) in enumerate(zip(actual, expected)): + assert act == exp, f"Document at index {i} does not match.\nExpected: {exp}\nActual: {act}" + + +def assert_field_exists(document: Dict, field_path: str): + """ + Assert that a field exists in a document (supports nested paths). + + Args: + document: The document to check + field_path: Dot-notation field path (e.g., "user.name") + """ + parts = field_path.split(".") + current = document + + for part in parts: + assert part in current, f"Field '{field_path}' does not exist in document" + current = current[part] + + +def assert_field_not_exists(document: Dict, field_path: str): + """ + Assert that a field does not exist in a document (supports nested paths). + + Args: + document: The document to check + field_path: Dot-notation field path (e.g., "user.name") + """ + parts = field_path.split(".") + current = document + + for i, part in enumerate(parts): + if part not in current: + return # Field doesn't exist, assertion passes + if i == len(parts) - 1: + raise AssertionError(f"Field '{field_path}' exists in document but should not") + current = current[part] + + +def assert_count(collection, filter_query: Dict, expected_count: int): + """ + Assert that a collection contains the expected number of documents matching a filter. 
+ + Args: + collection: MongoDB collection object + filter_query: Query filter + expected_count: Expected number of matching documents + """ + actual_count = collection.count_documents(filter_query) + assert actual_count == expected_count, ( + f"Document count mismatch for filter {filter_query}. " + f"Expected {expected_count}, got {actual_count}" + ) diff --git a/tests/find/__init__.py b/tests/find/__init__.py new file mode 100644 index 0000000..0bdc7e7 --- /dev/null +++ b/tests/find/__init__.py @@ -0,0 +1 @@ +"""Find operation tests.""" diff --git a/tests/find/test_basic_queries.py b/tests/find/test_basic_queries.py new file mode 100644 index 0000000..9a27d1d --- /dev/null +++ b/tests/find/test_basic_queries.py @@ -0,0 +1,136 @@ +""" +Basic find operation tests. + +Tests for fundamental find() and findOne() operations. +""" + +import pytest + +from tests.common.assertions import assert_document_match + + +@pytest.mark.find +@pytest.mark.smoke +@pytest.mark.documents( + [ + {"name": "Alice", "age": 30, "status": "active"}, + {"name": "Bob", "age": 25, "status": "active"}, + {"name": "Charlie", "age": 35, "status": "inactive"}, + ] +) +def test_find_all_documents(collection): + """Test finding all documents in a collection.""" + # Execute find operation + result = list(collection.find()) + + # Verify all documents are returned + assert len(result) == 3, "Expected to find 3 documents" + + # Verify document content + names = {doc["name"] for doc in result} + assert names == {"Alice", "Bob", "Charlie"}, "Expected to find all three users" + + +@pytest.mark.find +@pytest.mark.smoke +@pytest.mark.documents( + [ + {"name": "Alice", "age": 30, "status": "active"}, + {"name": "Bob", "age": 25, "status": "active"}, + {"name": "Charlie", "age": 35, "status": "inactive"}, + ] +) +def test_find_with_filter(collection): + """Test find operation with a simple equality filter.""" + # Execute find with filter + result = list(collection.find({"status": "active"})) + + # Verify only active users are returned + assert len(result) == 2, "Expected to find 2 active users" + + # Verify all returned documents have status "active" + for doc in result: + assert doc["status"] == "active", "All returned documents should have status 'active'" + + # Verify correct users are returned + names = {doc["name"] for doc in result} + assert names == {"Alice", "Bob"}, "Expected to find Alice and Bob" + + +@pytest.mark.find +@pytest.mark.documents( + [ + {"name": "Alice", "age": 30}, + {"name": "Bob", "age": 25}, + ] +) +def test_find_one(collection): + """Test findOne operation returns a single document.""" + # Execute findOne + result = collection.find_one({"name": "Alice"}) + + # Verify document is returned + assert result is not None, "Expected to find a document" + + # Verify document content + assert_document_match(result, {"name": "Alice", "age": 30}) + + +@pytest.mark.find +@pytest.mark.documents( + [ + {"name": "Alice", "age": 30}, + ] +) +def test_find_one_not_found(collection): + """Test findOne returns None when no document matches.""" + # Execute findOne with non-matching filter + result = collection.find_one({"name": "NonExistent"}) + + # Verify None is returned + assert result is None, "Expected None when no document matches" + + +@pytest.mark.find +def test_find_empty_collection(collection): + """Test find on an empty collection returns empty result.""" + # Execute find on empty collection + result = list(collection.find()) + + # Verify empty result + assert result == [], "Expected empty result for empty 
collection" + + +@pytest.mark.find +@pytest.mark.documents( + [ + {"name": "Alice", "age": 30, "city": "NYC"}, + {"name": "Bob", "age": 25, "city": "SF"}, + {"name": "Charlie", "age": 35, "city": "NYC"}, + ] +) +def test_find_with_multiple_conditions(collection): + """Test find with multiple filter conditions (implicit AND).""" + # Execute find with multiple conditions + result = list(collection.find({"city": "NYC", "age": 30})) + + # Verify only matching document is returned + assert len(result) == 1, "Expected to find 1 document" + assert_document_match(result[0], {"name": "Alice", "age": 30, "city": "NYC"}) + + +@pytest.mark.find +@pytest.mark.documents( + [ + {"name": "Alice", "profile": {"age": 30, "city": "NYC"}}, + {"name": "Bob", "profile": {"age": 25, "city": "SF"}}, + ] +) +def test_find_nested_field(collection): + """Test find with nested field query using dot notation.""" + # Execute find with nested field + result = list(collection.find({"profile.city": "NYC"})) + + # Verify correct document is returned + assert len(result) == 1, "Expected to find 1 document" + assert result[0]["name"] == "Alice", "Expected to find Alice" diff --git a/tests/find/test_projections.py b/tests/find/test_projections.py new file mode 100644 index 0000000..51c6e49 --- /dev/null +++ b/tests/find/test_projections.py @@ -0,0 +1,117 @@ +""" +Projection tests for find operations. + +Tests for field inclusion, exclusion, and projection operators. +""" + +import pytest + +from tests.common.assertions import assert_field_exists, assert_field_not_exists + + +@pytest.mark.find +@pytest.mark.documents( + [ + {"name": "Alice", "age": 30, "email": "alice@example.com", "city": "NYC"}, + {"name": "Bob", "age": 25, "email": "bob@example.com", "city": "SF"}, + ] +) +def test_find_with_field_inclusion(collection): + """Test find with explicit field inclusion.""" + # Find with projection to include only name and age + result = list(collection.find({}, {"name": 1, "age": 1})) + + # Verify results + assert len(result) == 2, "Expected 2 documents" + + # Verify included fields exist + for doc in result: + assert_field_exists(doc, "_id") # _id is included by default + assert_field_exists(doc, "name") + assert_field_exists(doc, "age") + + # Verify excluded fields don't exist + assert_field_not_exists(doc, "email") + assert_field_not_exists(doc, "city") + + +@pytest.mark.find +@pytest.mark.documents( + [ + {"name": "Alice", "age": 30, "email": "alice@example.com", "city": "NYC"}, + {"name": "Bob", "age": 25, "email": "bob@example.com", "city": "SF"}, + ] +) +def test_find_with_field_exclusion(collection): + """Test find with explicit field exclusion.""" + # Find with projection to exclude email and city + result = list(collection.find({}, {"email": 0, "city": 0})) + + # Verify results + assert len(result) == 2, "Expected 2 documents" + + # Verify included fields exist + for doc in result: + assert_field_exists(doc, "_id") + assert_field_exists(doc, "name") + assert_field_exists(doc, "age") + + # Verify excluded fields don't exist + assert_field_not_exists(doc, "email") + assert_field_not_exists(doc, "city") + + +@pytest.mark.find +@pytest.mark.documents( + [ + {"name": "Alice", "age": 30, "email": "alice@example.com"}, + ] +) +def test_find_exclude_id(collection): + """Test find with _id exclusion.""" + # Find with projection to exclude _id + result = list(collection.find({}, {"_id": 0, "name": 1, "age": 1})) + + # Verify results + assert len(result) == 1, "Expected 1 document" + + # Verify _id is excluded + 
assert_field_not_exists(result[0], "_id") + assert_field_exists(result[0], "name") + assert_field_exists(result[0], "age") + + +@pytest.mark.find +@pytest.mark.documents( + [ + {"name": "Alice", "profile": {"age": 30, "city": "NYC", "email": "alice@example.com"}}, + ] +) +def test_find_nested_field_projection(collection): + """Test find with nested field projection.""" + # Find with projection for nested field + result = list(collection.find({}, {"name": 1, "profile.age": 1})) + + # Verify results + assert len(result) == 1, "Expected 1 document" + assert_field_exists(result[0], "name") + assert_field_exists(result[0], "profile.age") + + # Verify other nested fields are not included + assert "city" not in result[0].get("profile", {}), "city should not be in profile" + assert "email" not in result[0].get("profile", {}), "email should not be in profile" + + +@pytest.mark.find +def test_find_empty_projection(collection): + """Test find with empty projection returns all fields.""" + # Insert test data + collection.insert_one({"name": "Alice", "age": 30}) + + # Find with empty projection + result = collection.find_one({}, {}) + + # Verify all fields are present + assert_field_exists(result, "_id") + assert_field_exists(result, "name") + assert_field_exists(result, "age") diff --git a/tests/find/test_query_operators.py b/tests/find/test_query_operators.py new file mode 100644 index 0000000..780f3d4 --- /dev/null +++ b/tests/find/test_query_operators.py @@ -0,0 +1,158 @@ +""" +Query operator tests for find operations. + +Tests for comparison operators: $eq, $ne, $gt, $gte, $lt, $lte, $in, $nin +""" + +import pytest + + +@pytest.mark.find +@pytest.mark.documents( + [ + {"name": "Alice", "age": 30}, + {"name": "Bob", "age": 25}, + {"name": "Charlie", "age": 35}, + ] +) +def test_find_gt_operator(collection): + """Test find with $gt (greater than) operator.""" + # Find documents where age > 25 + result = list(collection.find({"age": {"$gt": 25}})) + + # Verify results + assert len(result) == 2, "Expected 2 documents with age > 25" + names = {doc["name"] for doc in result} + assert names == {"Alice", "Charlie"}, "Expected Alice and Charlie" + + +@pytest.mark.find +@pytest.mark.documents( + [ + {"name": "Alice", "age": 30}, + {"name": "Bob", "age": 25}, + {"name": "Charlie", "age": 35}, + ] +) +def test_find_gte_operator(collection): + """Test find with $gte (greater than or equal) operator.""" + # Find documents where age >= 30 + result = list(collection.find({"age": {"$gte": 30}})) + + # Verify results + assert len(result) == 2, "Expected 2 documents with age >= 30" + names = {doc["name"] for doc in result} + assert names == {"Alice", "Charlie"}, "Expected Alice and Charlie" + + +@pytest.mark.find +@pytest.mark.documents( + [ + {"name": "Alice", "age": 30}, + {"name": "Bob", "age": 25}, + {"name": "Charlie", "age": 35}, + ] +) +def test_find_lt_operator(collection): + """Test find with $lt (less than) operator.""" + # Find documents where age < 30 + result = list(collection.find({"age": {"$lt": 30}})) + + # Verify results + assert len(result) == 1, "Expected 1 document with age < 30" + assert result[0]["name"] == "Bob", "Expected Bob" + + +@pytest.mark.find +@pytest.mark.documents( + [ + {"name": "Alice", "age": 30}, + {"name": "Bob", "age": 25}, + {"name": "Charlie", "age": 35}, + ] +) +def test_find_lte_operator(collection): + """Test find with $lte (less than or equal) operator.""" + # Find documents where age <= 30 + result = list(collection.find({"age": {"$lte": 30}})) + + # Verify results + 
assert len(result) == 2, "Expected 2 documents with age <= 30" + names = {doc["name"] for doc in result} + assert names == {"Alice", "Bob"}, "Expected Alice and Bob" + + +@pytest.mark.find +@pytest.mark.documents( + [ + {"name": "Alice", "age": 30}, + {"name": "Bob", "age": 25}, + {"name": "Charlie", "age": 35}, + ] +) +def test_find_ne_operator(collection): + """Test find with $ne (not equal) operator.""" + # Find documents where age != 30 + result = list(collection.find({"age": {"$ne": 30}})) + + # Verify results + assert len(result) == 2, "Expected 2 documents with age != 30" + names = {doc["name"] for doc in result} + assert names == {"Bob", "Charlie"}, "Expected Bob and Charlie" + + +@pytest.mark.find +@pytest.mark.documents( + [ + {"name": "Alice", "status": "active"}, + {"name": "Bob", "status": "inactive"}, + {"name": "Charlie", "status": "pending"}, + {"name": "David", "status": "active"}, + ] +) +def test_find_in_operator(collection): + """Test find with $in operator.""" + # Find documents where status is in ["active", "pending"] + result = list(collection.find({"status": {"$in": ["active", "pending"]}})) + + # Verify results + assert len(result) == 3, "Expected 3 documents with status in [active, pending]" + names = {doc["name"] for doc in result} + assert names == {"Alice", "Charlie", "David"}, "Expected Alice, Charlie, and David" + + +@pytest.mark.find +@pytest.mark.documents( + [ + {"name": "Alice", "status": "active"}, + {"name": "Bob", "status": "inactive"}, + {"name": "Charlie", "status": "pending"}, + ] +) +def test_find_nin_operator(collection): + """Test find with $nin (not in) operator.""" + # Find documents where status is not in ["active", "pending"] + result = list(collection.find({"status": {"$nin": ["active", "pending"]}})) + + # Verify results + assert len(result) == 1, "Expected 1 document with status not in [active, pending]" + assert result[0]["name"] == "Bob", "Expected Bob" + + +@pytest.mark.find +@pytest.mark.documents( + [ + {"name": "Alice", "age": 30}, + {"name": "Bob", "age": 25}, + {"name": "Charlie", "age": 35}, + ] +) +def test_find_range_query(collection): + """Test find with range query (combining $gte and $lte).""" + # Find documents where 25 <= age <= 30 + result = list(collection.find({"age": {"$gte": 25, "$lte": 30}})) + + # Verify results + assert len(result) == 2, "Expected 2 documents with age between 25 and 30" + names = {doc["name"] for doc in result} + assert names == {"Alice", "Bob"}, "Expected Alice and Bob" diff --git a/tests/insert/__init__.py b/tests/insert/__init__.py new file mode 100644 index 0000000..47ae134 --- /dev/null +++ b/tests/insert/__init__.py @@ -0,0 +1 @@ +"""Insert operation tests.""" diff --git a/tests/insert/test_insert_operations.py b/tests/insert/test_insert_operations.py new file mode 100644 index 0000000..659d26b --- /dev/null +++ b/tests/insert/test_insert_operations.py @@ -0,0 +1,145 @@ +""" +Insert operation tests. + +Tests for insertOne, insertMany, and related operations. 
+""" + +import pytest +from bson import ObjectId + +from tests.common.assertions import assert_count + + +@pytest.mark.insert +@pytest.mark.smoke +def test_insert_one_document(collection): + """Test inserting a single document.""" + # Insert one document + document = {"name": "Alice", "age": 30} + result = collection.insert_one(document) + + # Verify insert was acknowledged + assert result.acknowledged, "Insert should be acknowledged" + assert result.inserted_id is not None, "Should return inserted _id" + assert isinstance(result.inserted_id, ObjectId), "Inserted _id should be ObjectId" + + # Verify document exists in collection + assert_count(collection, {}, 1) + + # Verify document content + found = collection.find_one({"name": "Alice"}) + assert found is not None, "Document should exist" + assert found["name"] == "Alice" + assert found["age"] == 30 + + +@pytest.mark.insert +@pytest.mark.smoke +def test_insert_many_documents(collection): + """Test inserting multiple documents.""" + # Insert multiple documents + documents = [ + {"name": "Alice", "age": 30}, + {"name": "Bob", "age": 25}, + {"name": "Charlie", "age": 35}, + ] + result = collection.insert_many(documents) + + # Verify insert was acknowledged + assert result.acknowledged, "Insert should be acknowledged" + assert len(result.inserted_ids) == 3, "Should return 3 inserted IDs" + + # Verify all IDs are ObjectIds + for inserted_id in result.inserted_ids: + assert isinstance(inserted_id, ObjectId), "Each inserted _id should be ObjectId" + + # Verify all documents exist + assert_count(collection, {}, 3) + + +@pytest.mark.insert +def test_insert_with_custom_id(collection): + """Test inserting document with custom _id.""" + # Insert document with custom _id + custom_id = "custom_123" + document = {"_id": custom_id, "name": "Alice"} + result = collection.insert_one(document) + + # Verify custom _id is used + assert result.inserted_id == custom_id, "Should use custom _id" + + # Verify document can be retrieved by custom _id + found = collection.find_one({"_id": custom_id}) + assert found is not None, "Document should exist" + assert found["name"] == "Alice" + + +@pytest.mark.insert +def test_insert_duplicate_id_fails(collection): + """Test that inserting duplicate _id raises error.""" + # Insert first document + document = {"_id": "duplicate_id", "name": "Alice"} + collection.insert_one(document) + + # Try to insert document with same _id + duplicate = {"_id": "duplicate_id", "name": "Bob"} + + # Should raise exception + with pytest.raises(Exception): # DuplicateKeyError or similar + collection.insert_one(duplicate) + + # Verify only first document exists + assert_count(collection, {}, 1) + found = collection.find_one({"_id": "duplicate_id"}) + assert found["name"] == "Alice", "Should have first document" + + +@pytest.mark.insert +def test_insert_nested_document(collection): + """Test inserting document with nested structure.""" + # Insert document with nested fields + document = { + "name": "Alice", + "profile": {"age": 30, "address": {"city": "NYC", "country": "USA"}}, + } + result = collection.insert_one(document) + + # Verify insert + assert result.inserted_id is not None + + # Verify nested structure is preserved + found = collection.find_one({"name": "Alice"}) + assert found["profile"]["age"] == 30 + assert found["profile"]["address"]["city"] == "NYC" + + +@pytest.mark.insert +def test_insert_array_field(collection): + """Test inserting document with array fields.""" + # Insert document with array + document = {"name": "Alice", 
"tags": ["python", "mongodb", "testing"], "scores": [95, 87, 92]} + result = collection.insert_one(document) + + # Verify insert + assert result.inserted_id is not None + + # Verify array fields are preserved + found = collection.find_one({"name": "Alice"}) + assert found["tags"] == ["python", "mongodb", "testing"] + assert found["scores"] == [95, 87, 92] + + +@pytest.mark.insert +def test_insert_empty_document(collection): + """Test inserting an empty document.""" + # Insert empty document + result = collection.insert_one({}) + + # Verify insert was successful + assert result.inserted_id is not None + + # Verify document exists (only has _id) + found = collection.find_one({"_id": result.inserted_id}) + assert found is not None + assert len(found) == 1 # Only _id field + assert "_id" in found From d1e49c8e55bb2cc5c2cd5fe8a8f33578914eadab Mon Sep 17 00:00:00 2001 From: Nitin Ahuja Date: Mon, 12 Jan 2026 10:07:34 -0800 Subject: [PATCH 2/5] Fix tests to consistently use @pytest.mark.documents decorator - Update test_find_empty_projection to use documents marker instead of manual insert - Update test_match_empty_result to use documents marker instead of manual insert - Ensures consistent test data setup and automatic cleanup - All 36 tests still passing --- tests/aggregate/test_match_stage.py | 14 ++++++-------- tests/find/test_projections.py | 4 +--- 2 files changed, 7 insertions(+), 11 deletions(-) diff --git a/tests/aggregate/test_match_stage.py b/tests/aggregate/test_match_stage.py index 886b78e..05640af 100644 --- a/tests/aggregate/test_match_stage.py +++ b/tests/aggregate/test_match_stage.py @@ -69,16 +69,14 @@ def test_match_multiple_conditions(collection): @pytest.mark.aggregate +@pytest.mark.documents( + [ + {"name": "Alice", "status": "active"}, + {"name": "Bob", "status": "active"}, + ] +) def test_match_empty_result(collection): """Test $match stage that matches no documents.""" - # Insert test data - collection.insert_many( - [ - {"name": "Alice", "status": "active"}, - {"name": "Bob", "status": "active"}, - ] - ) - # Execute aggregation with $match that matches nothing pipeline = [{"$match": {"status": "inactive"}}] result = list(collection.aggregate(pipeline)) diff --git a/tests/find/test_projections.py b/tests/find/test_projections.py index 51c6e49..c841f63 100644 --- a/tests/find/test_projections.py +++ b/tests/find/test_projections.py @@ -103,11 +103,9 @@ def test_find_nested_field_projection(collection): @pytest.mark.find +@pytest.mark.documents([{"name": "Alice", "age": 30}]) def test_find_empty_projection(collection): """Test find with empty projection returns all fields.""" - # Insert test data - collection.insert_one({"name": "Alice", "age": 30}) - # Find with empty projection result = collection.find_one({}, {}) From 51d29bfbbfc7e72fa8c4bb39dcf4f98d4a7c91b6 Mon Sep 17 00:00:00 2001 From: Nitin Ahuja Date: Mon, 12 Jan 2026 10:18:00 -0800 Subject: [PATCH 3/5] Fix pytest.ini warnings by removing invalid config options - Remove json_report, json_report_indent, json_report_omit from config - These are command-line options, not pytest.ini settings - Add comment explaining proper usage - All 36 tests still passing with no warnings --- pytest.ini | 7 +++---- 1 file changed, 3 insertions(+), 4 deletions(-) diff --git a/pytest.ini b/pytest.ini index 3cc2c44..f9c263e 100644 --- a/pytest.ini +++ b/pytest.ini @@ -45,7 +45,6 @@ timeout = 300 # Use with: pytest -n auto # Or: pytest -n 4 (for 4 processes) -# JSON report configuration -json_report = .test-results/report.json 
-json_report_indent = 2 -json_report_omit = log +# JSON report options +# These are command-line options, not config file options +# Use with: pytest --json-report --json-report-file=.test-results/report.json From c0cda4bd2dd6bcaca457f14b7c377321e6f96326 Mon Sep 17 00:00:00 2001 From: Nitin Ahuja Date: Mon, 12 Jan 2026 12:07:11 -0800 Subject: [PATCH 4/5] Add multi-platform Docker build workflow - Add GitHub Actions workflow for automated Docker builds - Build for linux/amd64 and linux/arm64 platforms - Push to GitHub Container Registry (ghcr.io) - Auto-tags images: latest, sha-*, version tags - Update README with pre-built image pull instructions - Fix Dockerfile casing warning (FROM...AS) Workflow Features: - Runs on push to main and on pull requests - Multi-platform support for Intel/AMD and ARM/Graviton - Automatic versioning from git tags - GitHub Actions cache for faster builds - Uses dynamic repository variable (works on forks and upstream) --- .github/workflows/docker-build.yml | 68 ++++++++++++++++++++++++++++++ Dockerfile | 2 +- README.md | 37 +++++++++++++++- 3 files changed, 105 insertions(+), 2 deletions(-) create mode 100644 .github/workflows/docker-build.yml diff --git a/.github/workflows/docker-build.yml b/.github/workflows/docker-build.yml new file mode 100644 index 0000000..c223330 --- /dev/null +++ b/.github/workflows/docker-build.yml @@ -0,0 +1,68 @@ +name: Build and Push Docker Image + +on: + push: + branches: + - main + tags: + - 'v*.*.*' + pull_request: + branches: + - main + +env: + REGISTRY: ghcr.io + IMAGE_NAME: ${{ github.repository }} + +jobs: + build-and-push: + runs-on: ubuntu-latest + permissions: + contents: read + packages: write + + steps: + - name: Checkout repository + uses: actions/checkout@v4 + + - name: Set up QEMU + uses: docker/setup-qemu-action@v3 + + - name: Set up Docker Buildx + uses: docker/setup-buildx-action@v3 + + - name: Log in to Container Registry + if: github.event_name != 'pull_request' + uses: docker/login-action@v3 + with: + registry: ${{ env.REGISTRY }} + username: ${{ github.actor }} + password: ${{ secrets.GITHUB_TOKEN }} + + - name: Extract metadata (tags, labels) + id: meta + uses: docker/metadata-action@v5 + with: + images: ${{ env.REGISTRY }}/${{ env.IMAGE_NAME }} + tags: | + type=ref,event=branch + type=ref,event=pr + type=semver,pattern={{version}} + type=semver,pattern={{major}}.{{minor}} + type=semver,pattern={{major}} + type=sha,prefix=sha- + type=raw,value=latest,enable={{is_default_branch}} + + - name: Build and push Docker image + uses: docker/build-push-action@v5 + with: + context: . 
+ platforms: linux/amd64,linux/arm64 + push: ${{ github.event_name != 'pull_request' }} + tags: ${{ steps.meta.outputs.tags }} + labels: ${{ steps.meta.outputs.labels }} + cache-from: type=gha + cache-to: type=gha,mode=max + + - name: Image digest + run: echo ${{ steps.meta.outputs.tags }} diff --git a/Dockerfile b/Dockerfile index 9fc7292..d1cc5ee 100644 --- a/Dockerfile +++ b/Dockerfile @@ -1,7 +1,7 @@ # Multi-stage build for DocumentDB Functional Tests # Stage 1: Build stage -FROM python:3.11-slim as builder +FROM python:3.11-slim AS builder WORKDIR /build diff --git a/README.md b/README.md index 6db5fa9..0476a5a 100644 --- a/README.md +++ b/README.md @@ -120,7 +120,42 @@ pytest -l ## Docker Usage -### Build the Image +### Option 1: Use Pre-built Image (Recommended) + +Pull the latest image from GitHub Container Registry: + +```bash +# Pull latest version +docker pull ghcr.io/documentdb/functional-tests:latest + +# Or pull a specific version +docker pull ghcr.io/documentdb/functional-tests:v1.0.0 +``` + +Run tests with the pre-built image: + +```bash +# Run all tests +docker run --network host \ + ghcr.io/documentdb/functional-tests:latest \ + --engine documentdb="mongodb://user:pass@host:port/?tls=true&tlsAllowInvalidCertificates=true" + +# Run specific tags +docker run --network host \ + ghcr.io/documentdb/functional-tests:latest \ + -m smoke \ + --engine documentdb="mongodb://localhost:10260/?tls=true" + +# Run with parallel execution +docker run --network host \ + ghcr.io/documentdb/functional-tests:latest \ + -n 4 \ + --engine documentdb="mongodb://localhost:27017" +``` + +### Option 2: Build Locally + +If you need to build from source: ```bash docker build -t documentdb/functional-tests . From 57fb249ddfdc14f54d983766d118c3d7374aa35b Mon Sep 17 00:00:00 2001 From: Nitin Ahuja Date: Mon, 12 Jan 2026 12:17:42 -0800 Subject: [PATCH 5/5] Fix workflow error: remove problematic image digest step - Remove the 'Image digest' step that was causing exit code 127 - The metadata and tags are already captured by the build step - Build step itself will show all relevant information in logs --- .github/workflows/docker-build.yml | 3 --- 1 file changed, 3 deletions(-) diff --git a/.github/workflows/docker-build.yml b/.github/workflows/docker-build.yml index c223330..135473e 100644 --- a/.github/workflows/docker-build.yml +++ b/.github/workflows/docker-build.yml @@ -63,6 +63,3 @@ jobs: labels: ${{ steps.meta.outputs.labels }} cache-from: type=gha cache-to: type=gha,mode=max - - - name: Image digest - run: echo ${{ steps.meta.outputs.tags }}
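
Note: the removed "Image digest" step most likely hit exit code 127 because `steps.meta.outputs.tags` is a multi-line value, so the shell treated the second tag line as a command. If logging the published digest is still wanted later, a minimal sketch is below; it is an assumption-labelled alternative, not part of the patches above: it assumes the build step is given an `id: build` and relies on the `digest` output that `docker/build-push-action` exposes.

```yaml
      - name: Build and push Docker image
        id: build                      # id added here so the digest output can be referenced
        uses: docker/build-push-action@v5
        with:
          context: .
          platforms: linux/amd64,linux/arm64
          push: ${{ github.event_name != 'pull_request' }}
          tags: ${{ steps.meta.outputs.tags }}
          labels: ${{ steps.meta.outputs.labels }}
          cache-from: type=gha
          cache-to: type=gha,mode=max

      - name: Image digest
        if: github.event_name != 'pull_request'   # digest is only populated when the image was pushed
        run: echo "Published digest: ${{ steps.build.outputs.digest }}"
```

Because the digest is a single quoted value, the `echo` cannot be misinterpreted as multiple shell commands the way the multi-line tag list was.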