diff --git a/docs/REQUIREMENTS_AND_SAMPLING_GUIDE.md b/docs/REQUIREMENTS_AND_SAMPLING_GUIDE.md
new file mode 100644
index 000000000..3d5df1feb
--- /dev/null
+++ b/docs/REQUIREMENTS_AND_SAMPLING_GUIDE.md
@@ -0,0 +1,852 @@
+# Requirements and Sampling Guide
+
+> **Complete guide to using Requirements, Sampling Strategies, and Composite Requirements in Mellea**
+
+## Table of Contents
+
+1. [Introduction](#introduction)
+2. [Requirements Basics](#requirements-basics)
+3. [Guardrails Library](#guardrails-library)
+4. [Composite Requirements](#composite-requirements)
+5. [Sampling Strategies](#sampling-strategies)
+6. [Advanced Patterns](#advanced-patterns)
+7. [Best Practices](#best-practices)
+
+---
+
+## Introduction
+
+Mellea provides a powerful system for constraining and validating LLM outputs through three key concepts:
+
+- **Requirements**: Validation rules that check LLM outputs
+- **Guardrails**: Pre-built, reusable requirements for common patterns
+- **Sampling Strategies**: Algorithms that retry generation until requirements are met
+
+This guide covers all three concepts and how to use them together effectively.
+
+---
+
+## Requirements Basics
+
+### What is a Requirement?
+
+A `Requirement` is a validation rule that checks whether an LLM output meets certain criteria. Requirements can be:
+
+- **Simple checks**: Boolean functions that return True/False
+- **LLM-based validators**: Use another LLM call to validate output
+- **Hybrid validators**: Combine programmatic checks with LLM reasoning
+
+### Creating Simple Requirements
+
+```python
+from mellea.stdlib.requirements import Requirement
+
+# Simple boolean check
+def check_length(output: str) -> bool:
+    return len(output) <= 100
+
+length_req = Requirement(
+    description="Output must be 100 characters or less",
+    validation_fn=check_length,
+    check_only=True  # Don't provide repair feedback
+)
+```
+
+### Creating LLM-Based Requirements
+
+```python
+# LLM validates the output
+tone_req = Requirement(
+    description="Output must have a professional tone",
+    check_only=False  # Provide repair feedback when validation fails
+)
+# When check_only=False, the LLM provides detailed feedback on why validation failed
+```
+
+### Validation Results
+
+Requirements return `ValidationResult` objects:
+
+```python
+from mellea.stdlib.requirements import ValidationResult
+
+# Boolean result
+result = ValidationResult(True)
+assert result.as_bool() == True
+
+# Result with reason (for repair feedback)
+result = ValidationResult(
+    False,
+    reason="Output contains informal language like 'gonna' and 'wanna'"
+)
+assert result.as_bool() == False
+assert "informal language" in result.reason
+```
+
+---
+
+## Guardrails Library
+
+The guardrails library provides 10 pre-built requirements for common validation patterns.
+
+### Available Guardrails
+
+#### 1. PII Detection: `no_pii()`
+
+Detects and rejects personally identifiable information using hybrid detection (regex + spaCy NER).
+
+```python
+from mellea.stdlib.requirements.guardrails import no_pii
+
+# Basic usage
+pii_guard = no_pii()
+
+# With custom detection mode
+pii_guard = no_pii(mode="regex")  # Options: "auto", "regex", "spacy"
+
+# Example violations:
+# ❌ "Contact me at john@example.com"
+# ❌ "My SSN is 123-45-6789"
+# ❌ "Call me at (555) 123-4567"
+# ✅ "Contact us through our website"
+```
+
+**Detection modes:**
+- `"auto"` (default): Try spaCy, fallback to regex if unavailable
+- `"regex"`: Fast pattern matching for emails, phones, SSNs, credit cards
+- `"spacy"`: NER-based detection for names, locations, organizations
+
+#### 2. JSON Validation: `json_valid()`
+
+Ensures output is valid JSON.
+
+```python
+from mellea.stdlib.requirements.guardrails import json_valid
+
+json_guard = json_valid()
+
+# ✅ '{"name": "Alice", "age": 30}'
+# ✅ '[1, 2, 3]'
+# ❌ '{name: "Alice"}'  # Missing quotes
+# ❌ '{"name": "Alice",}'  # Trailing comma
+```
+
+#### 3. Length Constraints: `max_length()`, `min_length()`
+
+Enforce character or word count limits.
+
+```python
+from mellea.stdlib.requirements.guardrails import max_length, min_length
+
+# Character limits
+max_chars = max_length(100)  # Default: characters
+min_chars = min_length(50)
+
+# Word limits
+max_words = max_length(20, unit="words")
+min_words = min_length(10, unit="words")
+
+# ✅ "This is a short response."  # 26 chars, 5 words
+# ❌ "x" * 101  # Exceeds max_length(100)
+```
+
+#### 4. Keyword Matching: `contains_keywords()`, `excludes_keywords()`
+
+Require or forbid specific keywords.
+
+```python
+from mellea.stdlib.requirements.guardrails import contains_keywords, excludes_keywords
+
+# Require at least one keyword
+must_have = contains_keywords(["python", "javascript", "java"])
+
+# Require all keywords
+must_have_all = contains_keywords(
+    ["function", "return", "parameter"],
+    require_all=True
+)
+
+# Forbid keywords
+no_profanity = excludes_keywords(["damn", "hell", "crap"])
+
+# Case sensitivity
+case_sensitive = contains_keywords(["API"], case_sensitive=True)
+
+# ✅ "Python is a great language"  # Contains "python"
+# ❌ "Ruby is also nice"  # Missing required keywords
+```
+
+#### 5. Harmful Content: `no_harmful_content()`
+
+Detects harmful, toxic, or inappropriate content using keyword-based detection.
+
+```python
+from mellea.stdlib.requirements.guardrails import no_harmful_content
+
+# Default: checks all harm categories
+safety_guard = no_harmful_content()
+
+# Specific categories
+violence_guard = no_harmful_content(harm_categories=["violence"])
+profanity_guard = no_harmful_content(harm_categories=["profanity"])
+
+# Available categories:
+# - "violence": violent content
+# - "hate": hate speech, discrimination
+# - "sexual": sexual content
+# - "self_harm": self-harm content
+# - "profanity": profane language
+# - "harassment": harassment, bullying
+
+# ✅ "The weather is nice today"
+# ❌ "I want to hurt someone"  # Violence
+# ❌ "You're a stupid idiot"  # Harassment/profanity
+```
+
+**Future Enhancement**: See `docs/GUARDRAILS_GUARDIAN_INTEGRATION.md` for planned IBM Guardian intrinsics integration.
+
+#### 6. JSON Schema: `matches_schema()`
+
+Validates JSON against a JSON Schema.
+
+```python
+from mellea.stdlib.requirements.guardrails import matches_schema
+
+# Define schema
+user_schema = {
+    "type": "object",
+    "properties": {
+        "name": {"type": "string"},
+        "age": {"type": "integer", "minimum": 0},
+        "email": {"type": "string", "format": "email"}
+    },
+    "required": ["name", "age"]
+}
+
+schema_guard = matches_schema(user_schema)
+
+# ✅ '{"name": "Alice", "age": 30, "email": "alice@example.com"}'
+# ❌ '{"name": "Bob"}'  # Missing required "age"
+# ❌ '{"name": "Charlie", "age": -5}'  # Age below minimum
+```
+
+#### 7. Code Validation: `is_code()`
+
+Validates code syntax for various programming languages.
+
+```python
+from mellea.stdlib.requirements.guardrails import is_code
+
+# Language-specific validation
+python_guard = is_code("python")
+js_guard = is_code("javascript")
+java_guard = is_code("java")
+
+# Generic code validation (checks for code-like patterns)
+code_guard = is_code()
+
+# ✅ "def hello():\n    print('Hello')"  # Valid Python
+# ❌ "def hello(\n    print('Hello')"  # Syntax error
+# ✅ "function hello() { console.log('Hi'); }"  # Valid JS
+```
+
+**Supported languages**: `python`, `javascript`, `java`, or `None` (generic)
+
+#### 8. Factual Grounding: `factual_grounding()`
+
+Ensures output is grounded in provided context using token overlap.
+
+```python
+from mellea.stdlib.requirements.guardrails import factual_grounding
+
+context = """
+Python was created by Guido van Rossum and first released in 1991.
+It emphasizes code readability with significant whitespace.
+"""
+
+grounding_guard = factual_grounding(context, threshold=0.3)
+
+# ✅ "Python was created by Guido van Rossum in 1991"  # High overlap
+# ❌ "Python was created by Dennis Ritchie in 1972"  # Low overlap, wrong facts
+```
+
+**Parameters:**
+- `context`: Reference text for grounding
+- `threshold`: Minimum token overlap ratio (default: 0.3)
+
+**Future Enhancement**: See `docs/GUARDRAILS_NLI_GROUNDING.md` for planned NLI-based semantic grounding.
+
+### Repair Strategies
+
+All guardrails support repair mode (`check_only=False`) which provides detailed feedback when validation fails:
+
+```python
+from mellea.stdlib.requirements.guardrails import max_length
+
+# Check-only mode (default)
+guard_check = max_length(100, check_only=True)
+# Returns: ValidationResult(False) - just pass/fail
+
+# Repair mode
+guard_repair = max_length(100, check_only=False)
+# Returns: ValidationResult(False, reason="Output is 150 characters but maximum is 100. Please shorten by 50 characters.")
+```
+
+**Repair feedback examples:**
+
+```python
+# no_pii with repair
+result = no_pii(check_only=False).validation_fn("Email: john@example.com", {})
+# reason: "Found PII: email address (john@example.com). Please remove or redact."
+
+# json_valid with repair
+result = json_valid(check_only=False).validation_fn("{invalid}", {})
+# reason: "Invalid JSON: Expecting property name enclosed in double quotes. Check syntax."
+
+# contains_keywords with repair
+result = contains_keywords(["python"], check_only=False).validation_fn("Java code", {})
+# reason: "Missing required keywords: python. Please include at least one."
+```
+
+See `docs/GUARDRAILS_REPAIR_STRATEGIES.md` for complete repair strategy design.
+
+---
+
+## Composite Requirements
+
+### RequirementSet
+
+`RequirementSet` provides a composable way to combine multiple requirements:
+
+```python
+from mellea.stdlib.requirements import RequirementSet
+from mellea.stdlib.requirements.guardrails import no_pii, json_valid, max_length
+
+# Create a set
+reqs = RequirementSet([
+    no_pii(),
+    json_valid(),
+    max_length(500)
+])
+
+# Fluent API
+reqs = RequirementSet().add(no_pii()).add(json_valid())
+
+# Addition operator
+reqs = RequirementSet([no_pii()]) + [json_valid(), max_length(500)]
+
+# Extend with multiple
+reqs.extend([min_length(10), contains_keywords(["data"])])
+```
+
+### GuardrailProfiles
+
+Pre-built requirement sets for common use cases:
+
+```python
+from mellea.stdlib.requirements import GuardrailProfiles
+
+# 1. Basic Safety - PII + harmful content
+reqs = GuardrailProfiles.basic_safety()
+
+# 2. JSON Output - Valid JSON with length limits
+reqs = GuardrailProfiles.json_output(max_length=1000)
+
+# 3. Code Generation - Valid code with safety
+reqs = GuardrailProfiles.code_generation(language="python")
+
+# 4. Professional Content - Safe, appropriate, length-limited
+reqs = GuardrailProfiles.professional_content(max_length=500)
+
+# 5. API Documentation - Code + JSON + professional
+reqs = GuardrailProfiles.api_documentation(language="python")
+
+# 6. Grounded Summary - Factually grounded with length limits
+reqs = GuardrailProfiles.grounded_summary(context="...", max_length=200)
+
+# 7. Safe Chat - Conversational safety
+reqs = GuardrailProfiles.safe_chat(max_length=300)
+
+# 8. Structured Data - JSON with optional schema
+reqs = GuardrailProfiles.structured_data(schema={...})
+
+# 9. Content Moderation - Comprehensive safety
+reqs = GuardrailProfiles.content_moderation()
+
+# 10. Minimal - Just PII detection
+reqs = GuardrailProfiles.minimal()
+
+# 11. Strict - All safety + format + length
+reqs = GuardrailProfiles.strict(max_length=500)
+```
+
+### Customizing Profiles
+
+```python
+# Start with a profile and customize
+reqs = GuardrailProfiles.safe_chat()
+reqs = reqs.add(matches_schema(my_schema))
+reqs = reqs.remove(max_length(300))  # Remove default length limit
+reqs = reqs.add(max_length(1000))    # Add custom limit
+
+# Compose multiple profiles
+reqs = GuardrailProfiles.basic_safety() + GuardrailProfiles.json_output()
+```
+
+---
+
+## Sampling Strategies
+
+Sampling strategies control how Mellea retries generation when requirements fail.
+
+### Available Strategies
+
+#### 1. RejectionSamplingStrategy
+
+Simplest strategy: retry the same prompt until requirements pass or budget exhausted.
+
+```python
+from mellea.stdlib.sampling import RejectionSamplingStrategy
+
+strategy = RejectionSamplingStrategy(
+    loop_budget=3,  # Try up to 3 times
+    requirements=[no_pii(), json_valid()]
+)
+
+# Use with session
+result = await session.generate(
+    instruction,
+    sampling_strategy=strategy
+)
+```
+
+**How it works:**
+1. Generate output
+2. Validate against requirements
+3. If failed, retry with same prompt
+4. Repeat until success or budget exhausted
+
+**Best for:** Simple retries without prompt modification
+
+#### 2. RepairTemplateStrategy
+
+Adds failure feedback to the prompt on retry.
+
+```python
+from mellea.stdlib.sampling import RepairTemplateStrategy
+
+strategy = RepairTemplateStrategy(
+    loop_budget=3,
+    requirements=[no_pii(), max_length(100)]
+)
+```
+
+**How it works:**
+1. Generate output
+2. Validate against requirements
+3. If failed, add failure details to prompt:
+   ```
+   The following requirements failed before:
+   * Output contains PII: email address
+   * Output exceeds maximum length of 100 characters
+   ```
+4. Retry with enhanced prompt
+
+**Best for:** Giving the model feedback to improve
+
+#### 3. MultiTurnStrategy
+
+Uses multi-turn conversation for repair (agentic approach).
+
+```python
+from mellea.stdlib.sampling import MultiTurnStrategy
+
+strategy = MultiTurnStrategy(
+    loop_budget=3,
+    requirements=[json_valid(), contains_keywords(["summary"])]
+)
+```
+
+**How it works:**
+1. Generate output
+2. Validate against requirements
+3. If failed, add user message:
+   ```
+   The following requirements have not been met:
+   * Output is not valid JSON
+   * Output must contain keyword: summary
+   Please try again to fulfill the requirements.
+   ```
+4. Model responds in conversation
+
+**Best for:** Complex tasks where conversation helps
+
+**Requires:** `ChatContext` (not compatible with simple `Context`)
+
+#### 4. MajorityVotingStrategyForMath
+
+Generates multiple samples and selects best via majority voting (MBRD).
+
+```python
+from mellea.stdlib.sampling import MajorityVotingStrategyForMath
+
+strategy = MajorityVotingStrategyForMath(
+    number_of_samples=8,  # Generate 8 candidates
+    loop_budget=1,
+    requirements=[contains_keywords(["answer"])]
+)
+```
+
+**How it works:**
+1. Generate N samples concurrently
+2. Compare all pairs using math expression equivalence
+3. Select sample with highest agreement score
+
+**Best for:** Math problems where multiple solutions should agree
+
+#### 5. MBRDRougeLStrategy
+
+Like majority voting but uses RougeL for text similarity.
+
+```python
+from mellea.stdlib.sampling import MBRDRougeLStrategy
+
+strategy = MBRDRougeLStrategy(
+    number_of_samples=5,
+    loop_budget=1,
+    requirements=[min_length(50)]
+)
+```
+
+**Best for:** Text generation where consistency matters
+
+#### 6. BudgetForcingSamplingStrategy
+
+Allocates token budget for thinking vs. answering (Ollama only).
+
+```python
+from mellea.stdlib.sampling import BudgetForcingSamplingStrategy
+
+strategy = BudgetForcingSamplingStrategy(
+    think_max_tokens=4096,  # Tokens for reasoning
+    answer_max_tokens=512,  # Tokens for final answer
+    start_think_token="<think>",
+    end_think_token="</think>",
+    loop_budget=1,
+    requirements=[is_code("python")]
+)
+```
+
+**How it works:**
+1. Model generates reasoning in `<think>` block
+2. Forces model to continue thinking if needed
+3. Generates final answer with separate token budget
+
+**Best for:** Complex reasoning tasks (Ollama backend only)
+
+### Choosing a Strategy
+
+| Strategy | Use Case | Pros | Cons |
+|----------|----------|------|------|
+| **RejectionSampling** | Simple retries | Fast, simple | No learning from failures |
+| **RepairTemplate** | Iterative improvement | Model learns from errors | Requires good repair feedback |
+| **MultiTurn** | Complex tasks | Conversational repair | Requires ChatContext |
+| **MajorityVoting** | Math/reasoning | Robust to errors | Expensive (N samples) |
+| **MBRDRougeL** | Text consistency | Good for summaries | Expensive (N samples) |
+| **BudgetForcing** | Deep reasoning | Explicit thinking | Ollama only |
+
+---
+
+## Advanced Patterns
+
+### Pattern 1: Progressive Validation
+
+Start with cheap checks, add expensive ones only if needed:
+
+```python
+# Fast checks first
+fast_reqs = RequirementSet([
+    json_valid(),
+    max_length(1000)
+])
+
+# Expensive checks later
+expensive_reqs = RequirementSet([
+    matches_schema(complex_schema),
+    factual_grounding(long_context)
+])
+
+# Use in stages
+result = await session.generate(
+    instruction,
+    sampling_strategy=RejectionSamplingStrategy(
+        loop_budget=2,
+        requirements=fast_reqs.to_list()
+    )
+)
+
+# Only validate expensive if fast checks passed
+if result.success:
+    # Validate with expensive checks
+    ...
+```
+
+### Pattern 2: Conditional Requirements
+
+Apply different requirements based on task type:
+
+```python
+def get_requirements(task_type: str) -> list[Requirement]:
+    base = [no_pii(), no_harmful_content()]
+    
+    if task_type == "code":
+        return base + [is_code("python"), max_length(2000)]
+    elif task_type == "summary":
+        return base + [min_length(50), max_length(200)]
+    elif task_type == "json":
+        return base + [json_valid(), matches_schema(schema)]
+    else:
+        return base
+
+reqs = get_requirements("code")
+```
+
+### Pattern 3: Layered Sampling
+
+Combine multiple strategies:
+
+```python
+# First: Try with repair feedback
+result = await session.generate(
+    instruction,
+    sampling_strategy=RepairTemplateStrategy(
+        loop_budget=2,
+        requirements=[json_valid(), no_pii()]
+    )
+)
+
+# If failed: Try majority voting
+if not result.success:
+    result = await session.generate(
+        instruction,
+        sampling_strategy=MBRDRougeLStrategy(
+            number_of_samples=5,
+            requirements=[json_valid(), no_pii()]
+        )
+    )
+```
+
+### Pattern 4: Custom Validation Functions
+
+Create domain-specific requirements:
+
+```python
+def validate_email_format(output: str, context: dict) -> ValidationResult:
+    """Validate email has proper format."""
+    import re
+    pattern = r'^[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\.[a-zA-Z]{2,}$'
+    
+    if re.match(pattern, output.strip()):
+        return ValidationResult(True)
+    else:
+        return ValidationResult(
+            False,
+            reason="Email format invalid. Expected: user@domain.com"
+        )
+
+email_req = Requirement(
+    description="Output must be a valid email address",
+    validation_fn=validate_email_format,
+    check_only=False
+)
+```
+
+### Pattern 5: Dynamic Requirements
+
+Generate requirements based on runtime data:
+
+```python
+def create_keyword_requirements(keywords: list[str]) -> RequirementSet:
+    """Create requirements for multiple keyword sets."""
+    reqs = RequirementSet()
+    
+    for keyword in keywords:
+        reqs = reqs.add(contains_keywords([keyword]))
+    
+    return reqs
+
+# Use with dynamic data
+user_keywords = ["python", "async", "await"]
+reqs = create_keyword_requirements(user_keywords)
+```
+
+---
+
+## Best Practices
+
+### 1. Start Simple, Add Complexity
+
+```python
+# ❌ Don't start with everything
+reqs = GuardrailProfiles.strict(max_length=100) + [
+    matches_schema(complex_schema),
+    factual_grounding(huge_context),
+    is_code("python")
+]
+
+# ✅ Start minimal, add as needed
+reqs = GuardrailProfiles.minimal()  # Just PII
+# Test, then add more...
+reqs = reqs.add(json_valid())
+# Test, then add more...
+reqs = reqs.add(max_length(500))
+```
+
+### 2. Use Repair Mode for Development
+
+```python
+# During development: get detailed feedback
+dev_reqs = RequirementSet([
+    no_pii(check_only=False),
+    json_valid(check_only=False),
+    max_length(100, check_only=False)
+])
+
+# In production: faster check-only mode
+prod_reqs = RequirementSet([
+    no_pii(check_only=True),
+    json_valid(check_only=True),
+    max_length(100, check_only=True)
+])
+```
+
+### 3. Profile Before Optimizing
+
+```python
+import time
+
+start = time.time()
+result = await session.generate(
+    instruction,
+    sampling_strategy=strategy,
+    requirements=reqs
+)
+elapsed = time.time() - start
+
+print(f"Generation took {elapsed:.2f}s")
+print(f"Attempts: {len(result.sample_generations)}")
+print(f"Success: {result.success}")
+```
+
+### 4. Handle Failures Gracefully
+
+```python
+result = await session.generate(
+    instruction,
+    sampling_strategy=RepairTemplateStrategy(loop_budget=3),
+    requirements=reqs
+)
+
+if result.success:
+    print("✅ All requirements met")
+    output = result.result
+else:
+    print("⚠️ Requirements not met after 3 attempts")
+    # Use best attempt
+    output = result.result
+    
+    # Log failures for analysis
+    for i, validation in enumerate(result.sample_validations):
+        failed = [r for r, v in validation if not v.as_bool()]
+        print(f"Attempt {i+1} failed: {len(failed)} requirements")
+```
+
+### 5. Combine Profiles Wisely
+
+```python
+# ✅ Good: Complementary profiles
+reqs = GuardrailProfiles.basic_safety() + GuardrailProfiles.json_output()
+
+# ❌ Bad: Conflicting requirements
+reqs = GuardrailProfiles.minimal() + GuardrailProfiles.strict()
+# (strict already includes minimal, creates duplicates)
+
+# ✅ Better: Use strict directly
+reqs = GuardrailProfiles.strict()
+```
+
+### 6. Test Requirements Independently
+
+```python
+# Test each requirement separately
+test_output = '{"name": "test@example.com"}'
+
+for req in reqs:
+    result = req.validation_fn(test_output, {})
+    print(f"{req.description}: {result.as_bool()}")
+    if not result.as_bool() and result.reason:
+        print(f"  Reason: {result.reason}")
+```
+
+### 7. Use Type Hints
+
+```python
+from mellea.stdlib.requirements import Requirement, RequirementSet, ValidationResult
+
+def create_requirements() -> RequirementSet:
+    """Create requirements with proper typing."""
+    return RequirementSet([
+        no_pii(),
+        json_valid()
+    ])
+
+def custom_validator(output: str, context: dict) -> ValidationResult:
+    """Custom validator with proper return type."""
+    return ValidationResult(len(output) > 0)
+```
+
+### 8. Document Your Requirements
+
+```python
+# ✅ Good: Clear descriptions
+email_req = Requirement(
+    description="Output must be a valid email in format user@domain.com",
+    validation_fn=validate_email,
+    check_only=False
+)
+
+# ❌ Bad: Vague descriptions
+email_req = Requirement(
+    description="Check email",
+    validation_fn=validate_email
+)
+```
+
+---
+
+## Summary
+
+**Requirements** validate LLM outputs against rules:
+- Use **guardrails** for common patterns (PII, JSON, length, etc.)
+- Create **custom requirements** for domain-specific needs
+- Enable **repair mode** for detailed feedback
+
+**Composite Requirements** organize validation:
+- Use **RequirementSet** for flexible composition
+- Use **GuardrailProfiles** for pre-built combinations
+- Customize profiles for your use case
+
+**Sampling Strategies** handle retries:
+- **RejectionSampling**: Simple retries
+- **RepairTemplate**: Learning from failures
+- **MultiTurn**: Conversational repair
+- **MajorityVoting**: Consensus from multiple samples
+- **BudgetForcing**: Explicit reasoning (Ollama)
+
+**Best Practices:**
+1. Start simple, add complexity gradually
+2. Use repair mode during development
+3. Profile performance before optimizing
+4. Handle failures gracefully
+5. Test requirements independently
+6. Document clearly
diff --git a/docs/examples/guardrails.py b/docs/examples/guardrails.py
new file mode 100644
index 000000000..4e8d0ba3f
--- /dev/null
+++ b/docs/examples/guardrails.py
@@ -0,0 +1,516 @@
+# pytest: ollama, llm
+"""Comprehensive example demonstrating all guardrails in the Mellea library.
+
+This example showcases all 10 pre-built guardrails:
+
+Basic Guardrails:
+- no_pii: PII detection (hybrid: spaCy + regex)
+- json_valid: JSON format validation
+- max_length/min_length: Length constraints
+- contains_keywords/excludes_keywords: Keyword matching
+
+Advanced Guardrails:
+- no_harmful_content: Harmful content detection
+- matches_schema: JSON schema validation
+- is_code: Code syntax validation
+- factual_grounding: Context grounding validation
+"""
+
+from mellea.stdlib.requirements.guardrails import (
+    contains_keywords,
+    excludes_keywords,
+    factual_grounding,
+    is_code,
+    json_valid,
+    matches_schema,
+    max_length,
+    min_length,
+    no_harmful_content,
+    no_pii,
+)
+from mellea.stdlib.session import start_session
+
+# ============================================================================
+# BASIC GUARDRAILS EXAMPLES
+# ============================================================================
+
+
+def example_no_pii_basic():
+    """Basic example of PII detection with default settings."""
+    print("\n=== PII Detection (Basic) ===")
+
+    m = start_session()
+
+    # This should pass - no PII in the output
+    result = m.instruct(
+        "Describe a typical software engineer's daily routine without mentioning specific people or companies.",
+        requirements=[no_pii()],
+    )
+    print(f"Clean output: {result.value[:100] if result.value else 'None'}...")
+
+
+def example_no_pii_modes():
+    """Example showing different PII detection modes."""
+    print("\n=== PII Detection (Different Modes) ===")
+
+    m = start_session()
+
+    # Regex-only (no dependencies)
+    result = m.instruct(
+        "Write a professional email template without any contact details.",
+        requirements=[no_pii(method="regex")],
+    )
+    print(f"Regex-only: {result.value[:100] if result.value else 'None'}...")
+
+    # Strict mode
+    result = m.instruct(
+        "Write a short story about a programmer, using only generic descriptions.",
+        requirements=[no_pii(strict=True)],
+    )
+    print(f"Strict mode: {result.value[:100] if result.value else 'None'}...")
+
+
+def example_json_validation():
+    """Example of JSON format validation."""
+    print("\n=== JSON Validation ===")
+
+    m = start_session()
+
+    result = m.instruct(
+        "Generate a JSON object with fields: name (string), age (number), hobbies (array)",
+        requirements=[json_valid()],
+    )
+    print(f"Valid JSON output: {result.value}")
+
+
+def example_length_constraints():
+    """Example of length constraints."""
+    print("\n=== Length Constraints ===")
+
+    m = start_session()
+
+    # Maximum length
+    result = m.instruct(
+        "Write a one-sentence summary of Python", requirements=[max_length(100)]
+    )
+    print(
+        f"Short summary ({len(result.value) if result.value else 0} chars): {result.value}"
+    )
+
+    # Minimum length
+    result = m.instruct(
+        "Write a detailed explanation of REST APIs", requirements=[min_length(200)]
+    )
+    print(
+        f"Detailed explanation ({len(result.value) if result.value else 0} chars): {result.value[:100] if result.value else 'None'}..."
+    )
+
+    # Word-based constraints
+    result = m.instruct(
+        "List 5 programming languages", requirements=[max_length(50, unit="words")]
+    )
+    word_count = len(result.value.split()) if result.value else 0
+    print(f"Word-limited output ({word_count} words): {result.value}")
+
+
+def example_keyword_matching():
+    """Example of keyword matching."""
+    print("\n=== Keyword Matching ===")
+
+    m = start_session()
+
+    # Require specific keywords (any)
+    result = m.instruct(
+        "Explain web development technologies",
+        requirements=[contains_keywords(["HTML", "CSS", "JavaScript"])],
+    )
+    print(f"Contains keywords: {result.value[:150] if result.value else 'None'}...")
+
+    # Require ALL keywords
+    result = m.instruct(
+        "Describe a RESTful API",
+        requirements=[
+            contains_keywords(["HTTP", "JSON", "endpoint"], require_all=True)
+        ],
+    )
+    print(f"Contains all keywords: {result.value[:150] if result.value else 'None'}...")
+
+    # Exclude keywords
+    result = m.instruct(
+        "Write professional documentation about software testing",
+        requirements=[excludes_keywords(["TODO", "FIXME", "hack"])],
+    )
+    print(f"Professional output: {result.value[:150] if result.value else 'None'}...")
+
+
+def example_case_sensitivity():
+    """Example showing case sensitivity options."""
+    print("\n=== Case Sensitivity ===")
+
+    m = start_session()
+
+    # Case-insensitive (default)
+    _ = m.instruct(
+        "Explain python programming",
+        requirements=[contains_keywords(["Python"], case_sensitive=False)],
+    )
+    print("Case-insensitive match: Success")
+
+    # Case-sensitive
+    _ = m.instruct(
+        "Explain the Python programming language",
+        requirements=[contains_keywords(["Python"], case_sensitive=True)],
+    )
+    print("Case-sensitive match: Success")
+
+
+# ============================================================================
+# ADVANCED GUARDRAILS EXAMPLES
+# ============================================================================
+
+
+def example_harmful_content_detection():
+    """Example of harmful content detection."""
+    print("\n=== Harmful Content Detection ===")
+
+    m = start_session()
+
+    # Check for general harm
+    result = m.instruct(
+        "Write a helpful guide about online safety", requirements=[no_harmful_content()]
+    )
+    print(f"Safe content: {result.value[:100] if result.value else 'None'}...")
+
+    # Check specific risk types
+    result = m.instruct(
+        "Write a professional article about conflict resolution",
+        requirements=[no_harmful_content(risk_types=["violence", "profanity"])],
+    )
+    print(f"Professional content: {result.value[:100] if result.value else 'None'}...")
+
+
+def example_schema_validation():
+    """Example of JSON schema validation."""
+    print("\n=== JSON Schema Validation ===")
+
+    m = start_session()
+
+    # Define a schema for a person object
+    person_schema = {
+        "type": "object",
+        "properties": {
+            "name": {"type": "string"},
+            "age": {"type": "number", "minimum": 0, "maximum": 150},
+            "email": {"type": "string", "format": "email"},
+            "skills": {"type": "array", "items": {"type": "string"}, "minItems": 1},
+        },
+        "required": ["name", "age"],
+    }
+
+    result = m.instruct(
+        "Generate a JSON object for a software developer with name, age, email, and skills",
+        requirements=[matches_schema(person_schema)],
+    )
+    print(f"Valid schema output: {result.value}")
+
+    # Array schema
+    array_schema = {
+        "type": "array",
+        "items": {"type": "string"},
+        "minItems": 3,
+        "maxItems": 10,
+    }
+
+    result = m.instruct(
+        "Generate a JSON array of 5 programming languages",
+        requirements=[matches_schema(array_schema)],
+    )
+    print(f"Valid array: {result.value}")
+
+
+def example_code_validation():
+    """Example of code syntax validation."""
+    print("\n=== Code Validation ===")
+
+    m = start_session()
+
+    # Python code validation
+    result = m.instruct(
+        "Write a Python function to calculate the factorial of a number",
+        requirements=[is_code("python")],
+    )
+    print(f"Valid Python code:\n{result.value}\n")
+
+    # JavaScript code validation
+    result = m.instruct(
+        "Write a JavaScript function to reverse a string",
+        requirements=[is_code("javascript")],
+    )
+    print(f"Valid JavaScript code:\n{result.value}\n")
+
+    # Generic code detection
+    result = m.instruct(
+        "Write a simple function in any language to add two numbers",
+        requirements=[is_code()],
+    )
+    print(f"Generic code detected:\n{result.value}\n")
+
+
+def example_factual_grounding():
+    """Example of factual grounding validation."""
+    print("\n=== Factual Grounding ===")
+
+    m = start_session()
+
+    # Provide context
+    context = """
+    Python is a high-level, interpreted programming language created by Guido van Rossum.
+    It was first released in 1991. Python emphasizes code readability and uses significant
+    indentation. It supports multiple programming paradigms including procedural, object-oriented,
+    and functional programming.
+    """
+
+    # Generate grounded summary
+    result = m.instruct(
+        "Summarize the key facts about Python programming language",
+        requirements=[factual_grounding(context, threshold=0.5)],
+    )
+    print(f"Grounded summary: {result.value}")
+
+    # Stricter grounding
+    result = m.instruct(
+        "List the main characteristics of Python",
+        requirements=[factual_grounding(context, threshold=0.3)],
+    )
+    print(f"Grounded characteristics: {result.value}")
+
+
+# ============================================================================
+# COMBINED EXAMPLES: Multiple Guardrails
+# ============================================================================
+
+
+def example_combined_basic():
+    """Example combining multiple basic guardrails."""
+    print("\n=== Combined Basic Guardrails ===")
+
+    m = start_session()
+
+    result = m.instruct(
+        "Generate a JSON profile for a software developer role",
+        requirements=[
+            json_valid(),
+            no_pii(),
+            max_length(500),
+            contains_keywords(["skills", "experience"]),
+            excludes_keywords(["TODO", "placeholder"]),
+        ],
+    )
+    print(f"Combined validation result: {result.value}")
+
+
+def example_combined_advanced():
+    """Example combining multiple advanced guardrails."""
+    print("\n=== Combined Advanced Guardrails ===")
+
+    m = start_session()
+
+    # Define schema for code snippet
+    code_schema = {
+        "type": "object",
+        "properties": {
+            "language": {"type": "string"},
+            "code": {"type": "string"},
+            "description": {"type": "string"},
+        },
+        "required": ["language", "code", "description"],
+    }
+
+    result = m.instruct(
+        "Generate a JSON object with a Python code snippet that sorts a list",
+        requirements=[matches_schema(code_schema), no_harmful_content()],
+    )
+    print(f"Combined validation result: {result.value}")
+
+
+def example_all_guardrails():
+    """Example using all available guardrails."""
+    print("\n=== All Guardrails Combined ===")
+
+    m = start_session()
+
+    # Schema for a code review
+    review_schema = {
+        "type": "object",
+        "properties": {
+            "summary": {"type": "string"},
+            "issues": {"type": "array", "items": {"type": "string"}},
+            "rating": {"type": "number", "minimum": 1, "maximum": 10},
+        },
+        "required": ["summary", "issues", "rating"],
+    }
+
+    context = """
+    Our codebase uses Python 3.11 with FastAPI.
+    We follow PEP 8 style guidelines and use type hints.
+    All functions must have docstrings.
+    """
+
+    result = m.instruct(
+        "Provide a code review in JSON format",
+        requirements=[
+            json_valid(),
+            matches_schema(review_schema),
+            no_pii(),
+            no_harmful_content(),
+            max_length(1000),
+            contains_keywords(["Python", "code"]),
+            excludes_keywords(["TODO", "FIXME"]),
+            factual_grounding(context, threshold=0.2),
+        ],
+    )
+    print(f"Comprehensive validation result: {result.value}")
+
+
+# ============================================================================
+# REAL-WORLD USE CASES
+# ============================================================================
+
+
+def example_use_case_api_documentation():
+    """Real-world use case: API documentation generator."""
+    print("\n=== Use Case: API Documentation Generator ===")
+
+    m = start_session()
+
+    doc_schema = {
+        "type": "object",
+        "properties": {
+            "endpoint": {"type": "string"},
+            "method": {"type": "string", "enum": ["GET", "POST", "PUT", "DELETE"]},
+            "description": {"type": "string"},
+            "parameters": {"type": "array", "items": {"type": "object"}},
+        },
+        "required": ["endpoint", "method", "description"],
+    }
+
+    result = m.instruct(
+        "Generate API documentation for a user registration endpoint",
+        requirements=[
+            json_valid(),
+            matches_schema(doc_schema),
+            no_pii(),
+            contains_keywords(["endpoint", "method"], require_all=True),
+            excludes_keywords(["TODO", "placeholder"]),
+            max_length(800),
+        ],
+    )
+    print(f"API Documentation: {result.value}")
+
+
+def example_use_case_code_review():
+    """Real-world use case: Automated code review assistant."""
+    print("\n=== Use Case: Code Review Assistant ===")
+
+    m = start_session()
+
+    codebase_context = """
+    Our application uses Python 3.11 with FastAPI for the backend.
+    We follow PEP 8 style guidelines and use type hints.
+    All functions must have docstrings.
+    Security is a top priority.
+    """
+
+    review_schema = {
+        "type": "object",
+        "properties": {
+            "issues": {"type": "array", "items": {"type": "string"}},
+            "suggestions": {"type": "array", "items": {"type": "string"}},
+            "rating": {"type": "number", "minimum": 1, "maximum": 10},
+        },
+        "required": ["issues", "suggestions", "rating"],
+    }
+
+    result = m.instruct(
+        "Review this code and provide feedback in JSON format",
+        requirements=[
+            json_valid(),
+            matches_schema(review_schema),
+            factual_grounding(codebase_context, threshold=0.3),
+            no_harmful_content(),
+            no_pii(),
+            contains_keywords(["Python", "code"]),
+            min_length(100),
+        ],
+    )
+    print(f"Code Review: {result.value}")
+
+
+def example_use_case_content_moderation():
+    """Real-world use case: Content moderation system."""
+    print("\n=== Use Case: Content Moderation ===")
+
+    m = start_session()
+
+    result = m.instruct(
+        "Generate a community guidelines summary for a professional forum",
+        requirements=[
+            no_harmful_content(risk_types=["violence", "profanity", "social_bias"]),
+            no_pii(),
+            max_length(500),
+            contains_keywords(["respectful", "professional"]),
+            excludes_keywords(["hate", "discrimination"]),
+        ],
+    )
+    print(f"Community Guidelines: {result.value}")
+
+
+# ============================================================================
+# MAIN EXECUTION
+# ============================================================================
+
+
+if __name__ == "__main__":
+    print("=" * 80)
+    print("MELLEA GUARDRAILS COMPREHENSIVE EXAMPLES")
+    print("=" * 80)
+
+    # Basic Guardrails
+    print("\n" + "=" * 80)
+    print("BASIC GUARDRAILS")
+    print("=" * 80)
+    example_no_pii_basic()
+    example_no_pii_modes()
+    example_json_validation()
+    example_length_constraints()
+    example_keyword_matching()
+    example_case_sensitivity()
+
+    # Advanced Guardrails
+    print("\n" + "=" * 80)
+    print("ADVANCED GUARDRAILS")
+    print("=" * 80)
+    example_harmful_content_detection()
+    example_schema_validation()
+    example_code_validation()
+    example_factual_grounding()
+
+    # Combined Examples
+    print("\n" + "=" * 80)
+    print("COMBINED GUARDRAILS")
+    print("=" * 80)
+    example_combined_basic()
+    example_combined_advanced()
+    example_all_guardrails()
+
+    # Real-World Use Cases
+    print("\n" + "=" * 80)
+    print("REAL-WORLD USE CASES")
+    print("=" * 80)
+    example_use_case_api_documentation()
+    example_use_case_code_review()
+    example_use_case_content_moderation()
+
+    print("\n" + "=" * 80)
+    print("ALL EXAMPLES COMPLETE")
+    print("=" * 80)
diff --git a/docs/examples/guardrails_repair.py b/docs/examples/guardrails_repair.py
new file mode 100644
index 000000000..370cda20f
--- /dev/null
+++ b/docs/examples/guardrails_repair.py
@@ -0,0 +1,179 @@
+# pytest: ollama, llm
+"""Example demonstrating guardrail repair strategies.
+
+This example shows how to use guardrails with repair enabled (check_only=False)
+to guide the LLM in self-correcting outputs that fail validation.
+"""
+
+from mellea import start_session
+from mellea.stdlib.requirements.guardrails import (
+    contains_keywords,
+    excludes_keywords,
+    json_valid,
+    max_length,
+    min_length,
+    no_pii,
+)
+from mellea.stdlib.sampling import RepairTemplateStrategy
+
+
+def example_repair_pii():
+    """Example: Repair output containing PII."""
+    print("\n" + "=" * 80)
+    print("EXAMPLE: Repair PII Detection")
+    print("=" * 80)
+
+    session = start_session()
+
+    # With check_only=False, the guardrail provides actionable repair guidance
+    result = session.instruct(
+        "Generate a sample customer profile with name, email, and phone",
+        requirements=[no_pii(check_only=False)],
+        strategy=RepairTemplateStrategy(loop_budget=3),
+    )
+
+    print(f"\nFinal output (should be PII-free):\n{result.value}")
+
+
+def example_repair_json():
+    """Example: Repair invalid JSON output."""
+    print("\n" + "=" * 80)
+    print("EXAMPLE: Repair JSON Format")
+    print("=" * 80)
+
+    session = start_session()
+
+    result = session.instruct(
+        "Create a JSON object with fields: name (string), age (number), active (boolean)",
+        requirements=[json_valid(check_only=False)],
+        strategy=RepairTemplateStrategy(loop_budget=3),
+    )
+
+    print(f"\nFinal output (should be valid JSON):\n{result.value}")
+
+
+def example_repair_length():
+    """Example: Repair output that's too long or too short."""
+    print("\n" + "=" * 80)
+    print("EXAMPLE: Repair Length Constraints")
+    print("=" * 80)
+
+    session = start_session()
+
+    # Too long - should be shortened
+    result1 = session.instruct(
+        "Write a brief summary of Python programming",
+        requirements=[max_length(100, unit="characters", check_only=False)],
+        strategy=RepairTemplateStrategy(loop_budget=3),
+    )
+
+    print(f"\nShortened output ({len(result1.value or '')} chars):\n{result1.value}")
+
+    # Too short - should be expanded
+    result2 = session.instruct(
+        "Explain machine learning",
+        requirements=[min_length(200, unit="characters", check_only=False)],
+        strategy=RepairTemplateStrategy(loop_budget=3),
+    )
+
+    print(f"\nExpanded output ({len(result2.value or '')} chars):\n{result2.value}")
+
+
+def example_repair_keywords():
+    """Example: Repair missing or forbidden keywords."""
+    print("\n" + "=" * 80)
+    print("EXAMPLE: Repair Keyword Requirements")
+    print("=" * 80)
+
+    session = start_session()
+
+    # Missing keywords - should add them
+    result1 = session.instruct(
+        "Explain web development",
+        requirements=[
+            contains_keywords(
+                ["HTML", "CSS", "JavaScript"], require_all=True, check_only=False
+            )
+        ],
+        strategy=RepairTemplateStrategy(loop_budget=3),
+    )
+
+    print(f"\nOutput with required keywords:\n{result1.value}")
+
+    # Forbidden keywords - should remove them
+    result2 = session.instruct(
+        "Write professional documentation about the project",
+        requirements=[excludes_keywords(["TODO", "FIXME", "hack"], check_only=False)],
+        strategy=RepairTemplateStrategy(loop_budget=3),
+    )
+
+    print(f"\nProfessional output (no forbidden keywords):\n{result2.value}")
+
+
+def example_combined_repair():
+    """Example: Multiple guardrails with repair."""
+    print("\n" + "=" * 80)
+    print("EXAMPLE: Combined Repair Strategies")
+    print("=" * 80)
+
+    session = start_session()
+
+    # Multiple constraints that may need repair
+    result = session.instruct(
+        "Generate a JSON user profile",
+        requirements=[
+            json_valid(check_only=False),
+            no_pii(check_only=False),
+            max_length(300, check_only=False),
+            contains_keywords(["username", "role"], check_only=False),
+        ],
+        strategy=RepairTemplateStrategy(loop_budget=5),
+    )
+
+    print(f"\nFinal output (meets all requirements):\n{result.value}")
+
+
+def example_check_only_vs_repair():
+    """Example: Comparing check_only=True vs check_only=False."""
+    print("\n" + "=" * 80)
+    print("EXAMPLE: Check-Only vs Repair Mode")
+    print("=" * 80)
+
+    session = start_session()
+
+    # check_only=True: Brief reason, hard fail
+    print("\nWith check_only=True (validation only):")
+    try:
+        result1 = session.instruct(
+            "Write a 500-word essay",
+            requirements=[max_length(50, check_only=True)],
+            strategy=RepairTemplateStrategy(loop_budget=1),
+        )
+        print(f"Output: {result1.value}")
+    except Exception as e:
+        print(f"Failed: {e}")
+
+    # check_only=False: Detailed guidance, repair attempts
+    print("\nWith check_only=False (repair enabled):")
+    result2 = session.instruct(
+        "Write a brief summary",
+        requirements=[max_length(50, check_only=False)],
+        strategy=RepairTemplateStrategy(loop_budget=3),
+    )
+    print(f"Output ({len(result2.value or '')} chars): {result2.value}")
+
+
+if __name__ == "__main__":
+    # Run examples
+    example_repair_json()
+    example_repair_length()
+    example_repair_keywords()
+    example_combined_repair()
+    example_check_only_vs_repair()
+
+    # Note: example_repair_pii() requires careful testing as it may
+    # generate PII in the first attempt before repair
+
+    print("\n" + "=" * 80)
+    print("ALL REPAIR EXAMPLES COMPLETE")
+    print("=" * 80)
diff --git a/mellea/stdlib/requirements/__init__.py b/mellea/stdlib/requirements/__init__.py
index c0bd7d3c9..42e34818b 100644
--- a/mellea/stdlib/requirements/__init__.py
+++ b/mellea/stdlib/requirements/__init__.py
@@ -2,6 +2,19 @@
 
 # Import from core for ergonomics.
 from ...core import Requirement, ValidationResult, default_output_to_bool
+from .guardrail_profiles import GuardrailProfiles
+from .guardrails import (
+    contains_keywords,
+    excludes_keywords,
+    factual_grounding,
+    is_code,
+    json_valid,
+    matches_schema,
+    max_length,
+    min_length,
+    no_harmful_content,
+    no_pii,
+)
 from .md import as_markdown_list, is_markdown_list, is_markdown_table
 from .python_reqs import PythonExecutionReq
 from .requirement import (
@@ -13,19 +26,32 @@
     requirement_check_to_bool,
     simple_validate,
 )
+from .requirement_set import RequirementSet
 from .tool_reqs import tool_arg_validator, uses_tool
 
 __all__ = [
     "ALoraRequirement",
+    "GuardrailProfiles",
     "LLMaJRequirement",
     "PythonExecutionReq",
     "Requirement",
+    "RequirementSet",
     "ValidationResult",
     "as_markdown_list",
     "check",
+    "contains_keywords",
     "default_output_to_bool",
+    "excludes_keywords",
+    "factual_grounding",
+    "is_code",
     "is_markdown_list",
     "is_markdown_table",
+    "json_valid",
+    "matches_schema",
+    "max_length",
+    "min_length",
+    "no_harmful_content",
+    "no_pii",
     "req",
     "reqify",
     "requirement_check_to_bool",
diff --git a/mellea/stdlib/requirements/guardrail_profiles.py b/mellea/stdlib/requirements/guardrail_profiles.py
new file mode 100644
index 000000000..94a041161
--- /dev/null
+++ b/mellea/stdlib/requirements/guardrail_profiles.py
@@ -0,0 +1,313 @@
+"""Pre-built guardrail profiles for common use cases.
+
+This module provides ready-to-use RequirementSet configurations for
+common scenarios, making it easy to apply consistent guardrail policies
+across an application.
+"""
+
+from __future__ import annotations
+
+from .guardrails import (
+    contains_keywords,
+    excludes_keywords,
+    factual_grounding,
+    is_code,
+    json_valid,
+    max_length,
+    min_length,
+    no_harmful_content,
+    no_pii,
+)
+from .requirement_set import RequirementSet
+
+
+class GuardrailProfiles:
+    """Pre-built requirement sets for common use cases.
+
+    This class provides static methods that return RequirementSet instances
+    configured for common scenarios. These profiles can be used as-is or
+    customized by adding/removing requirements.
+
+    Examples:
+        Use a pre-built profile:
+        >>> from mellea.stdlib.requirements import GuardrailProfiles
+        >>> from mellea.stdlib.session import start_session
+        >>>
+        >>> m = start_session()
+        >>> result = m.instruct(
+        ...     "Generate Python code",
+        ...     requirements=GuardrailProfiles.code_generation("python")
+        ... )
+
+        Customize a profile:
+        >>> profile = GuardrailProfiles.basic_safety()
+        >>> profile = profile.add(json_valid())
+        >>> result = m.instruct("Generate data", requirements=profile)
+    """
+
+    @staticmethod
+    def basic_safety() -> RequirementSet:
+        """Basic safety guardrails: no PII, no harmful content.
+
+        This is the minimum recommended set of guardrails for any
+        user-facing content generation.
+
+        Returns:
+            RequirementSet with basic safety guardrails
+
+        Examples:
+            >>> profile = GuardrailProfiles.basic_safety()
+            >>> result = m.instruct("Generate text", requirements=profile)
+        """
+        return RequirementSet([no_pii(), no_harmful_content()])
+
+    @staticmethod
+    def json_output(max_size: int = 1000) -> RequirementSet:
+        """JSON output with validation and safety.
+
+        Ensures output is valid JSON, contains no PII, and respects
+        size constraints.
+
+        Args:
+            max_size: Maximum output size in characters (default: 1000)
+
+        Returns:
+            RequirementSet for JSON output
+
+        Examples:
+            >>> profile = GuardrailProfiles.json_output(max_size=500)
+            >>> result = m.instruct("Generate JSON", requirements=profile)
+        """
+        return RequirementSet([json_valid(), max_length(max_size), no_pii()])
+
+    @staticmethod
+    def code_generation(language: str = "python") -> RequirementSet:
+        """Code generation guardrails.
+
+        Validates code syntax, ensures no harmful content, and excludes
+        common placeholder markers.
+
+        Args:
+            language: Programming language for validation (default: "python")
+
+        Returns:
+            RequirementSet for code generation
+
+        Examples:
+            >>> profile = GuardrailProfiles.code_generation("javascript")
+            >>> result = m.instruct("Generate code", requirements=profile)
+        """
+        return RequirementSet(
+            [
+                is_code(language),
+                no_harmful_content(),
+                excludes_keywords(["TODO", "FIXME", "XXX", "HACK"]),
+            ]
+        )
+
+    @staticmethod
+    def professional_content() -> RequirementSet:
+        """Professional, safe content generation.
+
+        Ensures content is appropriate for professional contexts:
+        no PII, no profanity/violence, no placeholder text.
+
+        Returns:
+            RequirementSet for professional content
+
+        Examples:
+            >>> profile = GuardrailProfiles.professional_content()
+            >>> result = m.instruct("Write article", requirements=profile)
+        """
+        return RequirementSet(
+            [
+                no_pii(),
+                no_harmful_content(risk_types=["profanity", "violence"]),
+                excludes_keywords(["TODO", "FIXME", "hack", "workaround", "temporary"]),
+            ]
+        )
+
+    @staticmethod
+    def api_documentation() -> RequirementSet:
+        """API documentation guardrails.
+
+        Ensures documentation is valid JSON, contains required keywords,
+        excludes placeholders, and respects size limits.
+
+        Returns:
+            RequirementSet for API documentation
+
+        Examples:
+            >>> profile = GuardrailProfiles.api_documentation()
+            >>> result = m.instruct("Document API", requirements=profile)
+        """
+        return RequirementSet(
+            [
+                json_valid(),
+                no_pii(),
+                contains_keywords(["endpoint", "method"], require_all=True),
+                excludes_keywords(["TODO", "placeholder", "FIXME"]),
+                max_length(2000),
+            ]
+        )
+
+    @staticmethod
+    def grounded_summary(context: str, threshold: float = 0.5) -> RequirementSet:
+        """Factually grounded summary generation.
+
+        Ensures summaries are grounded in provided context, contain no PII,
+        and respect length constraints.
+
+        Args:
+            context: Reference context for grounding validation
+            threshold: Minimum overlap ratio (0.0-1.0, default: 0.5)
+
+        Returns:
+            RequirementSet for grounded summaries
+
+        Examples:
+            >>> context = "Python is a programming language..."
+            >>> profile = GuardrailProfiles.grounded_summary(context)
+            >>> result = m.instruct("Summarize", requirements=profile)
+        """
+        return RequirementSet(
+            [factual_grounding(context, threshold=threshold), no_pii(), max_length(500)]
+        )
+
+    @staticmethod
+    def safe_chat() -> RequirementSet:
+        """Safe chat/conversation guardrails.
+
+        Appropriate for chatbot or conversational AI applications.
+        Ensures safety without being overly restrictive.
+
+        Returns:
+            RequirementSet for safe chat
+
+        Examples:
+            >>> profile = GuardrailProfiles.safe_chat()
+            >>> result = m.instruct("Respond to user", requirements=profile)
+        """
+        return RequirementSet([no_pii(), no_harmful_content(), max_length(1000)])
+
+    @staticmethod
+    def structured_data(
+        schema: dict | None = None, max_size: int = 2000
+    ) -> RequirementSet:
+        """Structured data generation with optional schema validation.
+
+        For generating structured data outputs. If a schema is provided,
+        validates against it; otherwise just ensures valid JSON.
+
+        Args:
+            schema: Optional JSON schema for validation
+            max_size: Maximum output size in characters (default: 2000)
+
+        Returns:
+            RequirementSet for structured data
+
+        Examples:
+            >>> schema = {"type": "object", "properties": {...}}
+            >>> profile = GuardrailProfiles.structured_data(schema)
+            >>> result = m.instruct("Generate data", requirements=profile)
+        """
+        reqs = RequirementSet([json_valid(), no_pii(), max_length(max_size)])
+
+        if schema is not None:
+            from .guardrails import matches_schema
+
+            reqs = reqs.add(matches_schema(schema))
+
+        return reqs
+
+    @staticmethod
+    def content_moderation() -> RequirementSet:
+        """Content moderation guardrails.
+
+        Strict guardrails for user-generated content or public-facing
+        applications. Checks multiple risk types and excludes problematic
+        keywords.
+
+        Returns:
+            RequirementSet for content moderation
+
+        Examples:
+            >>> profile = GuardrailProfiles.content_moderation()
+            >>> result = m.instruct("Generate content", requirements=profile)
+        """
+        return RequirementSet(
+            [
+                no_pii(),
+                no_harmful_content(
+                    risk_types=[
+                        "violence",
+                        "profanity",
+                        "social_bias",
+                        "sexual_content",
+                        "unethical_behavior",
+                    ]
+                ),
+                excludes_keywords(
+                    ["hate", "discrimination", "offensive", "inappropriate"]
+                ),
+            ]
+        )
+
+    @staticmethod
+    def minimal() -> RequirementSet:
+        """Minimal guardrails: just PII protection.
+
+        Use when you need minimal constraints but still want basic
+        privacy protection.
+
+        Returns:
+            RequirementSet with minimal guardrails
+
+        Examples:
+            >>> profile = GuardrailProfiles.minimal()
+            >>> result = m.instruct("Generate text", requirements=profile)
+        """
+        return RequirementSet([no_pii()])
+
+    @staticmethod
+    def strict() -> RequirementSet:
+        """Strict guardrails for high-risk applications.
+
+        Comprehensive guardrails for applications where safety and
+        compliance are critical.
+
+        Returns:
+            RequirementSet with strict guardrails
+
+        Examples:
+            >>> profile = GuardrailProfiles.strict()
+            >>> result = m.instruct("Generate content", requirements=profile)
+        """
+        return RequirementSet(
+            [
+                no_pii(strict=True),
+                no_harmful_content(
+                    risk_types=[
+                        "harm",
+                        "violence",
+                        "profanity",
+                        "social_bias",
+                        "sexual_content",
+                        "unethical_behavior",
+                        "jailbreak",
+                    ]
+                ),
+                max_length(1000),
+                excludes_keywords(
+                    [
+                        "TODO",
+                        "FIXME",
+                        "XXX",
+                        "HACK",
+                        "hate",
+                        "discrimination",
+                        "offensive",
+                    ]
+                ),
+            ]
+        )
diff --git a/mellea/stdlib/requirements/guardrails.py b/mellea/stdlib/requirements/guardrails.py
new file mode 100644
index 000000000..705a2a2de
--- /dev/null
+++ b/mellea/stdlib/requirements/guardrails.py
@@ -0,0 +1,1197 @@
+"""Pre-built, reusable requirements for common guardrail patterns.
+
+This module provides a library of ready-to-use guardrails that integrations can use
+out of the box for common validation patterns like PII detection, format compliance,
+length constraints, and more.
+
+Examples:
+    >>> from mellea.stdlib.requirements.guardrails import no_pii, json_valid, max_length
+    >>> from mellea.stdlib.session import start_session
+    >>>
+    >>> m = start_session()
+    >>> result = m.instruct(
+    ...     "Generate a customer profile",
+    ...     requirements=[no_pii(), json_valid(), max_length(500)]
+    ... )
+"""
+
+from __future__ import annotations
+
+import re
+from typing import Literal
+
+from ...core import Context, FancyLogger, Requirement, ValidationResult
+from .requirement import simple_validate
+
+logger = FancyLogger.get_logger()
+
+# region PII Detection
+
+# Common PII regex patterns
+_EMAIL_PATTERN = re.compile(r"\b[A-Za-z0-9._%+-]+@[A-Za-z0-9.-]+\.[A-Z|a-z]{2,}\b")
+_PHONE_PATTERN = re.compile(
+    r"\b(?:\+?1[-.]?)?\(?([0-9]{3})\)?[-.]?([0-9]{3})[-.]?([0-9]{4})\b"
+)
+_SSN_PATTERN = re.compile(r"\b\d{3}-\d{2}-\d{4}\b")
+_CREDIT_CARD_PATTERN = re.compile(r"\b\d{4}[-\s]?\d{4}[-\s]?\d{4}[-\s]?\d{4}\b")
+
+# Lazy-loaded spaCy model
+_SPACY_NLP = None
+
+# Harmful content keywords for risk detection
+_RISK_KEYWORDS = {
+    "violence": [
+        "kill",
+        "murder",
+        "attack",
+        "assault",
+        "weapon",
+        "blood",
+        "death",
+        "violent",
+    ],
+    "profanity": ["fuck", "shit", "damn", "hell", "ass", "bitch", "bastard"],
+    "social_bias": ["racist", "sexist", "discrimination", "prejudice", "stereotype"],
+    "sexual_content": ["sex", "sexual", "porn", "nude", "explicit"],
+    "unethical_behavior": ["cheat", "steal", "fraud", "illegal", "unethical"],
+    "jailbreak": ["ignore previous", "disregard", "bypass", "override"],
+    "harm": ["harm", "hurt", "damage", "injure", "dangerous"],
+}
+
+
+def _get_spacy_nlp():
+    """Lazy load spaCy model."""
+    global _SPACY_NLP
+    if _SPACY_NLP is None:
+        try:
+            import spacy  # type: ignore[import-not-found]
+
+            try:
+                _SPACY_NLP = spacy.load("en_core_web_sm")
+            except OSError:
+                logger.warning(
+                    "spaCy model 'en_core_web_sm' not found. "
+                    "Install with: python -m spacy download en_core_web_sm"
+                )
+                _SPACY_NLP = False  # Mark as unavailable
+        except ImportError:
+            logger.warning(
+                "spaCy not installed. Install with: pip install spacy\n"
+                "For better PII detection, also run: python -m spacy download en_core_web_sm"
+            )
+            _SPACY_NLP = False
+    return _SPACY_NLP if _SPACY_NLP is not False else None
+
+
+def _detect_pii_regex(text: str) -> tuple[bool, list[str]]:
+    """Detect PII using regex patterns.
+
+    Args:
+        text: Text to check for PII
+
+    Returns:
+        Tuple of (has_pii, list of detected PII types)
+    """
+    detected = []
+
+    if _EMAIL_PATTERN.search(text):
+        detected.append("email")
+    if _PHONE_PATTERN.search(text):
+        detected.append("phone")
+    if _SSN_PATTERN.search(text):
+        detected.append("SSN")
+    if _CREDIT_CARD_PATTERN.search(text):
+        detected.append("credit_card")
+
+    return len(detected) > 0, detected
+
+
+def _detect_pii_spacy(text: str) -> tuple[bool, list[str]]:
+    """Detect PII using spaCy NER.
+
+    Args:
+        text: Text to check for PII
+
+    Returns:
+        Tuple of (has_pii, list of detected entity types)
+    """
+    nlp = _get_spacy_nlp()
+    if nlp is None:
+        return False, []
+
+    doc = nlp(text)
+    pii_entities = ["PERSON", "GPE", "LOC", "ORG"]
+    detected = []
+
+    for ent in doc.ents:
+        if ent.label_ in pii_entities and ent.label_ not in detected:
+            detected.append(ent.label_)
+
+    return len(detected) > 0, detected
+
+
+def _validate_no_pii(
+    ctx: Context,
+    method: Literal["regex", "spacy", "auto"],
+    strict: bool,
+    check_only: bool,
+) -> ValidationResult:
+    """Validation function for no_pii guardrail.
+
+    Args:
+        ctx: Context to validate
+        method: Detection method to use
+        strict: If True, use LLM for final verification
+        check_only: If True, provide brief reason; if False, provide actionable repair guidance
+
+    Returns:
+        ValidationResult indicating if PII was detected
+    """
+    last_output = ctx.last_output()
+    if last_output is None or last_output.value is None:
+        return ValidationResult(result=False, reason="No output found in context")
+
+    text = str(last_output.value)
+    has_pii = False
+    detected_types: list[str] = []
+    pii_examples = []
+
+    # Apply detection method and collect examples
+    if method == "regex":
+        has_pii, detected_types = _detect_pii_regex(text)
+        # Collect examples for repair guidance
+        if has_pii and not check_only:
+            if "email" in detected_types:
+                match = _EMAIL_PATTERN.search(text)
+                if match:
+                    pii_examples.append(f"email address '{match.group()}'")
+            if "phone" in detected_types:
+                match = _PHONE_PATTERN.search(text)
+                if match:
+                    pii_examples.append(f"phone number '{match.group()}'")
+            if "SSN" in detected_types:
+                match = _SSN_PATTERN.search(text)
+                if match:
+                    pii_examples.append(f"SSN '{match.group()}'")
+            if "credit_card" in detected_types:
+                match = _CREDIT_CARD_PATTERN.search(text)
+                if match:
+                    pii_examples.append(f"credit card number '{match.group()}'")
+    elif method == "spacy":
+        has_pii, detected_types = _detect_pii_spacy(text)
+        if not has_pii:  # Fallback to regex if spaCy finds nothing
+            has_pii, regex_types = _detect_pii_regex(text)
+            detected_types.extend(regex_types)
+    else:  # auto
+        # Try spaCy first, fallback to regex
+        has_pii_spacy, spacy_types = _detect_pii_spacy(text)
+        has_pii_regex, regex_types = _detect_pii_regex(text)
+
+        has_pii = has_pii_spacy or has_pii_regex
+        detected_types = list(set(spacy_types + regex_types))
+
+    # Build reason message
+    if has_pii:
+        if check_only:
+            reason = f"Detected potential PII: {', '.join(detected_types)}"
+        else:
+            # Provide actionable repair guidance
+            if pii_examples:
+                reason = (
+                    f"Output contains personally identifiable information (PII): {', '.join(pii_examples)}. "
+                    f"Please remove or redact this sensitive information to protect privacy."
+                )
+            else:
+                reason = (
+                    f"Output contains PII of type(s): {', '.join(detected_types)}. "
+                    f"Please remove or redact all personally identifiable information including "
+                    f"names, email addresses, phone numbers, and other sensitive data."
+                )
+    else:
+        reason = "No PII detected"
+
+    # Note: strict mode with LLM verification can be added in future iteration
+    if strict and has_pii:
+        reason += " (strict mode: consider LLM verification)"
+
+    return ValidationResult(result=not has_pii, reason=reason)
+
+
+def no_pii(
+    *,
+    method: Literal["regex", "spacy", "auto"] = "auto",
+    strict: bool = False,
+    check_only: bool = True,
+) -> Requirement:
+    """Reject outputs containing personally identifiable information (PII).
+
+    This guardrail detects common PII patterns including:
+    - Names (via spaCy NER)
+    - Email addresses
+    - Phone numbers
+    - Social Security Numbers
+    - Credit card numbers
+    - Organizations and locations (via spaCy NER)
+
+    The detection uses a hybrid approach:
+    - **regex**: Fast pattern matching for emails, phones, SSNs, credit cards
+    - **spacy**: NER-based detection for names, organizations, locations (requires spacy)
+    - **auto** (default): Try spaCy first, fallback to regex
+
+    Args:
+        method: Detection method - "regex", "spacy", or "auto" (default)
+        strict: If True, be more conservative in PII detection (future: LLM verification)
+        check_only: If True, only validate without attempting repair (default: True)
+
+    Returns:
+        Requirement that validates output contains no PII
+
+    Examples:
+        Basic usage:
+        >>> from mellea.stdlib.requirements.guardrails import no_pii
+        >>> req = no_pii()
+
+        Regex-only (no dependencies):
+        >>> req = no_pii(method="regex")
+
+        Strict mode:
+        >>> req = no_pii(strict=True)
+
+        In a session:
+        >>> from mellea.stdlib.session import start_session
+        >>> m = start_session()
+        >>> result = m.instruct(
+        ...     "Describe a customer without revealing personal details",
+        ...     requirements=[no_pii()]
+        ... )
+
+    Note:
+        - For best results, install spaCy: `pip install spacy`
+        - Download model: `python -m spacy download en_core_web_sm`
+        - Regex-only mode works without additional dependencies
+        - False positives may occur (e.g., fictional names in creative writing)
+    """
+    return Requirement(
+        description="Output must not contain personally identifiable information (PII) "
+        "such as names, email addresses, phone numbers, or other sensitive data.",
+        validation_fn=lambda ctx: _validate_no_pii(ctx, method, strict, check_only),
+        check_only=check_only,
+    )
+
+
+# endregion
+
+# region JSON Validation
+
+
+def json_valid(*, check_only: bool = True) -> Requirement:
+    """Validate that output is valid JSON format.
+
+    This guardrail ensures the generated output can be parsed as valid JSON.
+    Useful for ensuring structured data outputs.
+
+    Args:
+        check_only: If True, only validate without attempting repair (default: True)
+
+    Returns:
+        Requirement that validates output is valid JSON
+
+    Examples:
+        Basic usage:
+        >>> from mellea.stdlib.requirements.guardrails import json_valid
+        >>> req = json_valid()
+
+        In a session:
+        >>> from mellea.stdlib.session import start_session
+        >>> m = start_session()
+        >>> result = m.instruct(
+        ...     "Generate a JSON object with name and age fields",
+        ...     requirements=[json_valid()]
+        ... )
+    """
+    import json
+
+    def validate_json(ctx: Context) -> ValidationResult:
+        last_output = ctx.last_output()
+        if last_output is None or last_output.value is None:
+            return ValidationResult(result=False, reason="No output found in context")
+
+        text = str(last_output.value).strip()
+
+        try:
+            json.loads(text)
+            return ValidationResult(result=True, reason="Valid JSON")
+        except json.JSONDecodeError as e:
+            if check_only:
+                reason = f"Invalid JSON: {e.msg} at line {e.lineno}, column {e.colno}"
+            else:
+                reason = (
+                    f"Output is not valid JSON. Error: {e.msg} at line {e.lineno}, column {e.colno}. "
+                    f"Please ensure the output is properly formatted JSON with correct syntax, "
+                    f"including proper quotes, commas, and bracket matching."
+                )
+            return ValidationResult(result=False, reason=reason)
+
+    return Requirement(
+        description="Output must be valid JSON format.",
+        validation_fn=validate_json,
+        check_only=check_only,
+    )
+
+
+# endregion
+
+# region Length Constraints
+
+
+def max_length(
+    n: int, *, unit: str = "characters", check_only: bool = True
+) -> Requirement:
+    """Enforce maximum length constraint on output.
+
+    Args:
+        n: Maximum allowed length
+        unit: Unit of measurement - "characters", "words", or "tokens" (default: "characters")
+        check_only: If True, only validate without attempting repair (default: True)
+
+    Returns:
+        Requirement that validates output length
+
+    Examples:
+        Character limit:
+        >>> from mellea.stdlib.requirements.guardrails import max_length
+        >>> req = max_length(500)
+
+        Word limit:
+        >>> req = max_length(100, unit="words")
+
+        In a session:
+        >>> from mellea.stdlib.session import start_session
+        >>> m = start_session()
+        >>> result = m.instruct(
+        ...     "Write a brief summary",
+        ...     requirements=[max_length(200)]
+        ... )
+    """
+
+    def validate_max_length(ctx: Context) -> ValidationResult:
+        last_output = ctx.last_output()
+        if last_output is None or last_output.value is None:
+            return ValidationResult(result=False, reason="No output found in context")
+
+        text = str(last_output.value)
+
+        if unit == "characters":
+            length = len(text)
+        elif unit == "words":
+            length = len(text.split())
+        elif unit == "tokens":
+            # Simple approximation: ~4 characters per token
+            length = len(text) // 4
+        else:
+            return ValidationResult(
+                result=False,
+                reason=f"Invalid unit '{unit}'. Use 'characters', 'words', or 'tokens'.",
+            )
+
+        if length <= n:
+            return ValidationResult(
+                result=True, reason=f"Length {length} {unit} is within limit of {n}"
+            )
+        else:
+            if check_only:
+                reason = f"Length {length} {unit} exceeds maximum of {n}"
+            else:
+                excess = length - n
+                reason = (
+                    f"Output exceeds maximum length of {n} {unit}. "
+                    f"Current length: {length} {unit} (exceeds by {excess} {unit}). "
+                    f"Please shorten the output by removing unnecessary content or being more concise."
+                )
+            return ValidationResult(result=False, reason=reason)
+
+    return Requirement(
+        description=f"Output must not exceed {n} {unit}.",
+        validation_fn=validate_max_length,
+        check_only=check_only,
+    )
+
+
+def min_length(
+    n: int, *, unit: str = "characters", check_only: bool = True
+) -> Requirement:
+    """Enforce minimum length constraint on output.
+
+    Args:
+        n: Minimum required length
+        unit: Unit of measurement - "characters", "words", or "tokens" (default: "characters")
+        check_only: If True, only validate without attempting repair (default: True)
+
+    Returns:
+        Requirement that validates output length
+
+    Examples:
+        Character minimum:
+        >>> from mellea.stdlib.requirements.guardrails import min_length
+        >>> req = min_length(100)
+
+        Word minimum:
+        >>> req = min_length(50, unit="words")
+
+        In a session:
+        >>> from mellea.stdlib.session import start_session
+        >>> m = start_session()
+        >>> result = m.instruct(
+        ...     "Write a detailed explanation",
+        ...     requirements=[min_length(500)]
+        ... )
+    """
+
+    def validate_min_length(ctx: Context) -> ValidationResult:
+        last_output = ctx.last_output()
+        if last_output is None or last_output.value is None:
+            return ValidationResult(result=False, reason="No output found in context")
+
+        text = str(last_output.value)
+
+        if unit == "characters":
+            length = len(text)
+        elif unit == "words":
+            length = len(text.split())
+        elif unit == "tokens":
+            # Simple approximation: ~4 characters per token
+            length = len(text) // 4
+        else:
+            return ValidationResult(
+                result=False,
+                reason=f"Invalid unit '{unit}'. Use 'characters', 'words', or 'tokens'.",
+            )
+
+        if length >= n:
+            return ValidationResult(
+                result=True, reason=f"Length {length} {unit} meets minimum of {n}"
+            )
+        else:
+            if check_only:
+                reason = f"Length {length} {unit} is below minimum of {n}"
+            else:
+                shortage = n - length
+                reason = (
+                    f"Output is below minimum length of {n} {unit}. "
+                    f"Current length: {length} {unit} (short by {shortage} {unit}). "
+                    f"Please expand the output with more detail, examples, or explanation."
+                )
+            return ValidationResult(result=False, reason=reason)
+
+    return Requirement(
+        description=f"Output must be at least {n} {unit}.",
+        validation_fn=validate_min_length,
+        check_only=check_only,
+    )
+
+
+# endregion
+
+# region Keyword Matching
+
+
+def contains_keywords(
+    keywords: list[str],
+    *,
+    case_sensitive: bool = False,
+    require_all: bool = False,
+    check_only: bool = True,
+) -> Requirement:
+    """Require output to contain specific keywords.
+
+    Args:
+        keywords: List of keywords that should appear in output
+        case_sensitive: If True, perform case-sensitive matching (default: False)
+        require_all: If True, all keywords must be present; if False, at least one (default: False)
+        check_only: If True, only validate without attempting repair (default: True)
+
+    Returns:
+        Requirement that validates keyword presence
+
+    Examples:
+        Require any keyword:
+        >>> from mellea.stdlib.requirements.guardrails import contains_keywords
+        >>> req = contains_keywords(["Python", "Java", "JavaScript"])
+
+        Require all keywords:
+        >>> req = contains_keywords(["API", "REST", "JSON"], require_all=True)
+
+        Case-sensitive:
+        >>> req = contains_keywords(["NASA", "SpaceX"], case_sensitive=True)
+
+        In a session:
+        >>> from mellea.stdlib.session import start_session
+        >>> m = start_session()
+        >>> result = m.instruct(
+        ...     "Explain web development",
+        ...     requirements=[contains_keywords(["HTML", "CSS", "JavaScript"])]
+        ... )
+    """
+
+    def validate_keywords(ctx: Context) -> ValidationResult:
+        last_output = ctx.last_output()
+        if last_output is None or last_output.value is None:
+            return ValidationResult(result=False, reason="No output found in context")
+
+        text = str(last_output.value)
+        if not case_sensitive:
+            text = text.lower()
+            keywords_to_check = [k.lower() for k in keywords]
+        else:
+            keywords_to_check = keywords
+
+        found_keywords = [kw for kw in keywords_to_check if kw in text]
+
+        if require_all:
+            if len(found_keywords) == len(keywords):
+                return ValidationResult(
+                    result=True,
+                    reason=f"All required keywords found: {', '.join(keywords)}",
+                )
+            else:
+                missing = [
+                    kw
+                    for kw in keywords
+                    if (kw.lower() if not case_sensitive else kw)
+                    not in list(found_keywords)
+                ]
+                return ValidationResult(
+                    result=False,
+                    reason=f"Missing required keywords: {', '.join(missing)}",
+                )
+        else:
+            if len(found_keywords) > 0:
+                return ValidationResult(
+                    result=True,
+                    reason=f"Found keywords: {', '.join([keywords[keywords_to_check.index(fk)] for fk in found_keywords])}",
+                )
+            else:
+                return ValidationResult(
+                    result=False,
+                    reason=f"None of the required keywords found: {', '.join(keywords)}",
+                )
+
+    mode = "all" if require_all else "any"
+    return Requirement(
+        description=f"Output must contain {mode} of these keywords: {', '.join(keywords)}.",
+        validation_fn=validate_keywords,
+        check_only=check_only,
+    )
+
+
+def excludes_keywords(
+    keywords: list[str], *, case_sensitive: bool = False, check_only: bool = True
+) -> Requirement:
+    """Require output to NOT contain specific keywords.
+
+    Args:
+        keywords: List of keywords that should NOT appear in output
+        case_sensitive: If True, perform case-sensitive matching (default: False)
+        check_only: If True, only validate without attempting repair (default: True)
+
+    Returns:
+        Requirement that validates keyword absence
+
+    Examples:
+        Exclude specific terms:
+        >>> from mellea.stdlib.requirements.guardrails import excludes_keywords
+        >>> req = excludes_keywords(["TODO", "FIXME", "XXX"])
+
+        Case-sensitive exclusion:
+        >>> req = excludes_keywords(["CONFIDENTIAL"], case_sensitive=True)
+
+        In a session:
+        >>> from mellea.stdlib.session import start_session
+        >>> m = start_session()
+        >>> result = m.instruct(
+        ...     "Write professional documentation",
+        ...     requirements=[excludes_keywords(["slang", "informal"])]
+        ... )
+    """
+
+    def validate_exclusions(ctx: Context) -> ValidationResult:
+        last_output = ctx.last_output()
+        if last_output is None or last_output.value is None:
+            return ValidationResult(result=False, reason="No output found in context")
+
+        text = str(last_output.value)
+        if not case_sensitive:
+            text = text.lower()
+            keywords_to_check = [k.lower() for k in keywords]
+        else:
+            keywords_to_check = keywords
+
+        found_keywords = [kw for kw in keywords_to_check if kw in text]
+
+        if len(found_keywords) == 0:
+            return ValidationResult(result=True, reason="No forbidden keywords found")
+        else:
+            # Map back to original case for reporting
+            original_found = [
+                keywords[keywords_to_check.index(fk)] for fk in found_keywords
+            ]
+            if check_only:
+                reason = f"Found forbidden keywords: {', '.join(original_found)}"
+            else:
+                reason = (
+                    f"Output contains forbidden keywords: {', '.join(original_found)}. "
+                    f"Please remove or rephrase to avoid these terms."
+                )
+            return ValidationResult(result=False, reason=reason)
+
+    return Requirement(
+        description=f"Output must not contain these keywords: {', '.join(keywords)}.",
+        validation_fn=validate_exclusions,
+        check_only=check_only,
+    )
+
+
+# endregion
+
+# region Harmful Content Detection
+
+
+def no_harmful_content(
+    *, risk_types: list[str] | None = None, check_only: bool = True
+) -> Requirement:
+    """Detect harmful content using Guardian risk detection.
+
+    This guardrail uses Guardian models to detect various types of harmful content
+    including violence, profanity, social bias, sexual content, and unethical behavior.
+
+    Available risk types:
+    - "harm": General harmful content
+    - "violence": Violent content
+    - "profanity": Profane language
+    - "social_bias": Social bias and discrimination
+    - "sexual_content": Sexual or adult content
+    - "unethical_behavior": Unethical behavior
+    - "jailbreak": Jailbreak attempts
+
+    Args:
+        risk_types: List of specific risk types to check. If None, checks for general harm.
+        check_only: If True, only validate without attempting repair (default: True)
+
+    Returns:
+        Requirement that validates output contains no harmful content
+
+    Examples:
+        Check for general harm:
+        >>> from mellea.stdlib.requirements.guardrails import no_harmful_content
+        >>> req = no_harmful_content()
+
+        Check specific risk types:
+        >>> req = no_harmful_content(risk_types=["violence", "profanity"])
+
+        In a session:
+        >>> from mellea.stdlib.session import start_session
+        >>> m = start_session()
+        >>> result = m.instruct(
+        ...     "Write a story about conflict resolution",
+        ...     requirements=[no_harmful_content()]
+        ... )
+
+    Note:
+        This is a lightweight implementation that uses keyword-based detection.
+        For production use with Guardian models, use the Guardian intrinsics directly
+        or the deprecated GuardianCheck class with appropriate backends.
+    """
+
+    def validate_no_harmful_content(ctx: Context) -> ValidationResult:
+        last_output = ctx.last_output()
+        if last_output is None or last_output.value is None:
+            return ValidationResult(result=False, reason="No output found in context")
+
+        text = str(last_output.value).lower()
+
+        # Determine which risk types to check
+        risks_to_check = risk_types if risk_types else ["harm"]
+
+        # Check for harmful keywords
+        detected_risks = []
+        for risk in risks_to_check:
+            if risk not in _RISK_KEYWORDS:
+                logger.warning(f"Unknown risk type: {risk}. Skipping.")
+                continue
+
+            keywords = _RISK_KEYWORDS[risk]
+            for keyword in keywords:
+                if keyword in text:
+                    detected_risks.append(risk)
+                    break
+
+        if detected_risks:
+            if check_only:
+                reason = f"Detected potentially harmful content: {', '.join(set(detected_risks))}"
+            else:
+                reason = (
+                    f"Output contains potentially harmful content related to: {', '.join(set(detected_risks))}. "
+                    f"Please revise to remove harmful, offensive, or inappropriate content."
+                )
+            return ValidationResult(result=False, reason=reason)
+        else:
+            return ValidationResult(result=True, reason="No harmful content detected")
+
+    risk_desc = ", ".join(risk_types) if risk_types else "harmful content"
+    return Requirement(
+        description=f"Output must not contain {risk_desc}.",
+        validation_fn=validate_no_harmful_content,
+        check_only=check_only,
+    )
+
+
+# endregion
+
+# region JSON Schema Validation
+
+
+def matches_schema(schema: dict, *, check_only: bool = True) -> Requirement:
+    """Validate JSON output against a JSON schema.
+
+    This guardrail validates that the output conforms to a JSON Schema (Draft 7).
+    Requires the jsonschema library to be installed.
+
+    Args:
+        schema: JSON schema dictionary (JSON Schema Draft 7 format)
+        check_only: If True, only validate without attempting repair (default: True)
+
+    Returns:
+        Requirement that validates output matches the schema
+
+    Examples:
+        Basic schema validation:
+        >>> from mellea.stdlib.requirements.guardrails import matches_schema
+        >>> schema = {
+        ...     "type": "object",
+        ...     "properties": {
+        ...         "name": {"type": "string"},
+        ...         "age": {"type": "number", "minimum": 0}
+        ...     },
+        ...     "required": ["name", "age"]
+        ... }
+        >>> req = matches_schema(schema)
+
+        Array validation:
+        >>> schema = {
+        ...     "type": "array",
+        ...     "items": {"type": "string"},
+        ...     "minItems": 1
+        ... }
+        >>> req = matches_schema(schema)
+
+        In a session:
+        >>> from mellea.stdlib.session import start_session
+        >>> m = start_session()
+        >>> result = m.instruct(
+        ...     "Generate a person object with name and age",
+        ...     requirements=[matches_schema(schema)]
+        ... )
+
+    Note:
+        Requires jsonschema library. Install with: pip install jsonschema
+        or: pip install mellea[schema]
+    """
+    import json
+
+    def validate_schema(ctx: Context) -> ValidationResult:
+        last_output = ctx.last_output()
+        if last_output is None or last_output.value is None:
+            return ValidationResult(result=False, reason="No output found in context")
+
+        text = str(last_output.value).strip()
+
+        # First, validate it's valid JSON
+        try:
+            data = json.loads(text)
+        except json.JSONDecodeError as e:
+            return ValidationResult(
+                result=False,
+                reason=f"Invalid JSON: {e.msg} at line {e.lineno}, column {e.colno}",
+            )
+
+        # Try to import jsonschema
+        try:
+            import jsonschema
+        except ImportError:
+            return ValidationResult(
+                result=False,
+                reason="jsonschema library not installed. Install with: pip install jsonschema",
+            )
+
+        # Validate against schema
+        try:
+            jsonschema.validate(instance=data, schema=schema)
+            return ValidationResult(result=True, reason="Output matches schema")
+        except jsonschema.ValidationError as e:
+            if check_only:
+                reason = f"Schema validation failed: {e.message}"
+            else:
+                reason = (
+                    f"Output does not match the required JSON schema. "
+                    f"Validation error: {e.message}. "
+                    f"Please ensure the JSON structure matches the specified schema requirements."
+                )
+            return ValidationResult(result=False, reason=reason)
+        except jsonschema.SchemaError as e:
+            return ValidationResult(result=False, reason=f"Invalid schema: {e.message}")
+
+    return Requirement(
+        description="Output must match the provided JSON schema.",
+        validation_fn=validate_schema,
+        check_only=check_only,
+    )
+
+
+# endregion
+
+# region Code Validation
+
+
+def is_code(language: str | None = None, *, check_only: bool = True) -> Requirement:
+    """Validate that output is valid code in the specified language.
+
+    This guardrail validates code syntax using language-specific parsers or heuristics.
+
+    Supported languages:
+    - "python": Uses ast.parse() for syntax validation
+    - "javascript", "typescript": Heuristic detection (function, const, let, var, =>)
+    - "java", "c", "cpp": Heuristic detection (class, public, void, int)
+    - None: Generic code detection using multiple heuristics
+
+    Args:
+        language: Programming language to validate (python, javascript, java, etc.)
+                 If None, performs generic code detection
+        check_only: If True, only validate without attempting repair (default: True)
+
+    Returns:
+        Requirement that validates output is valid code
+
+    Examples:
+        Python syntax validation:
+        >>> from mellea.stdlib.requirements.guardrails import is_code
+        >>> req = is_code("python")
+
+        Generic code detection:
+        >>> req = is_code()
+
+        JavaScript validation:
+        >>> req = is_code("javascript")
+
+        In a session:
+        >>> from mellea.stdlib.session import start_session
+        >>> m = start_session()
+        >>> result = m.instruct(
+        ...     "Write a Python function to calculate factorial",
+        ...     requirements=[is_code("python")]
+        ... )
+
+    Note:
+        - Python validation uses ast.parse() for accurate syntax checking
+        - Other languages use heuristic detection (may have false positives/negatives)
+        - Generic detection checks for common code patterns
+    """
+
+    def validate_code(ctx: Context) -> ValidationResult:
+        last_output = ctx.last_output()
+        if last_output is None or last_output.value is None:
+            return ValidationResult(result=False, reason="No output found in context")
+
+        text = str(last_output.value).strip()
+
+        if not text:
+            return ValidationResult(result=False, reason="Empty output")
+
+        # Python: Use ast.parse for accurate syntax checking
+        if language and language.lower() == "python":
+            import ast
+
+            try:
+                ast.parse(text)
+                return ValidationResult(result=True, reason="Valid Python syntax")
+            except SyntaxError as e:
+                if check_only:
+                    reason = f"Invalid Python syntax: {e.msg} at line {e.lineno}"
+                else:
+                    reason = (
+                        f"Output is not valid Python code. "
+                        f"Syntax error: {e.msg} at line {e.lineno}. "
+                        f"Please provide syntactically correct Python code."
+                    )
+                return ValidationResult(result=False, reason=reason)
+
+        # For other languages, use heuristic detection
+        lang_lower = language.lower() if language else None
+
+        # Check balanced braces/brackets/parentheses
+        def check_balanced(text: str) -> bool:
+            stack = []
+            pairs = {"(": ")", "[": "]", "{": "}"}
+            for char in text:
+                if char in pairs:
+                    stack.append(char)
+                elif char in pairs.values():
+                    if not stack:
+                        return False
+                    if pairs[stack.pop()] != char:
+                        return False
+            return len(stack) == 0
+
+        if not check_balanced(text):
+            if check_only:
+                reason = "Unbalanced braces, brackets, or parentheses"
+            else:
+                reason = (
+                    "Code has unbalanced braces, brackets, or parentheses. "
+                    "Please ensure all opening symbols have matching closing symbols."
+                )
+            return ValidationResult(result=False, reason=reason)
+
+        # Language-specific heuristics
+        if lang_lower in ["javascript", "typescript", "js", "ts"]:
+            # JavaScript/TypeScript patterns
+            js_patterns = [
+                r"\bfunction\s+\w+\s*\(",
+                r"\bconst\s+\w+",
+                r"\blet\s+\w+",
+                r"\bvar\s+\w+",
+                r"=>",
+                r"\bclass\s+\w+",
+            ]
+            matches = sum(1 for pattern in js_patterns if re.search(pattern, text))
+            if matches >= 2:
+                return ValidationResult(
+                    result=True, reason=f"Valid {language} code detected"
+                )
+            else:
+                if check_only:
+                    reason = f"Does not appear to be valid {language} code"
+                else:
+                    reason = (
+                        f"Output does not appear to be valid {language} code. "
+                        f"Please provide proper {language} code with appropriate syntax and structure."
+                    )
+                return ValidationResult(result=False, reason=reason)
+
+        elif lang_lower in ["java", "c", "cpp", "c++"]:
+            # Java/C/C++ patterns
+            c_patterns = [
+                r"\b(public|private|protected)\s+",
+                r"\bclass\s+\w+",
+                r"\b(void|int|float|double|char|bool)\s+\w+\s*\(",
+                r"\breturn\s+",
+                r";",
+            ]
+            matches = sum(1 for pattern in c_patterns if re.search(pattern, text))
+            if matches >= 2:
+                return ValidationResult(
+                    result=True, reason=f"Valid {language} code detected"
+                )
+            else:
+                if check_only:
+                    reason = f"Does not appear to be valid {language} code"
+                else:
+                    reason = (
+                        f"Output does not appear to be valid {language} code. "
+                        f"Please provide proper {language} code with appropriate syntax and structure."
+                    )
+                return ValidationResult(result=False, reason=reason)
+
+        # Generic code detection (no specific language)
+        else:
+            code_indicators = 0
+
+            # Check for function definitions
+            if re.search(r"\b(function|def|func|fn)\s+\w+\s*\(", text):
+                code_indicators += 1
+
+            # Check for control flow
+            if re.search(r"\b(if|else|for|while|switch|case)\b", text):
+                code_indicators += 1
+
+            # Check for variable declarations
+            if re.search(r"\b(var|let|const|int|string|float|double)\s+\w+", text):
+                code_indicators += 1
+
+            # Check for operators
+            if re.search(r"[=+\-*/]{1,2}", text):
+                code_indicators += 1
+
+            # Check for function calls
+            if re.search(r"\w+\s*\([^)]*\)", text):
+                code_indicators += 1
+
+            # Check for semicolons or significant indentation
+            if ";" in text or re.search(r"\n\s{4,}", text):
+                code_indicators += 1
+
+            # Threshold: at least 3 indicators for generic code
+            if code_indicators >= 3:
+                return ValidationResult(
+                    result=True, reason=f"Code detected ({code_indicators} indicators)"
+                )
+            else:
+                return ValidationResult(
+                    result=False,
+                    reason=f"Does not appear to be code ({code_indicators} indicators, need 3+)",
+                )
+
+    lang_desc = f"{language} code" if language else "code"
+    return Requirement(
+        description=f"Output must be valid {lang_desc}.",
+        validation_fn=validate_code,
+        check_only=check_only,
+    )
+
+
+# endregion
+
+# region Factual Grounding
+
+
+def factual_grounding(
+    context: str, *, threshold: float = 0.5, check_only: bool = True
+) -> Requirement:
+    """Validate that output is grounded in the provided context.
+
+    This guardrail checks that the generated output is factually grounded in the
+    provided reference context. The basic implementation uses keyword overlap;
+    for production use, consider using NLI models or Guardian intrinsics.
+
+    Args:
+        context: Reference context text for grounding validation
+        threshold: Minimum overlap ratio (0.0-1.0) for validation (default: 0.5)
+        check_only: If True, only validate without attempting repair (default: True)
+
+    Returns:
+        Requirement that validates output is grounded in context
+
+    Examples:
+        Basic grounding check:
+        >>> from mellea.stdlib.requirements.guardrails import factual_grounding
+        >>> context = "Python is a high-level programming language created by Guido van Rossum."
+        >>> req = factual_grounding(context)
+
+        Stricter threshold:
+        >>> req = factual_grounding(context, threshold=0.7)
+
+        In a session:
+        >>> from mellea.stdlib.session import start_session
+        >>> m = start_session()
+        >>> context = "The company was founded in 2020 and has 50 employees."
+        >>> result = m.instruct(
+        ...     "Summarize the company information",
+        ...     requirements=[factual_grounding(context)]
+        ... )
+
+    Note:
+        This is a basic implementation using keyword overlap. For production use:
+        - Use NLI (Natural Language Inference) models for semantic validation
+        - Use Guardian intrinsics for hallucination detection
+        - Consider using embedding-based similarity measures
+    """
+    # Simple stopwords list
+    STOPWORDS = {
+        "a",
+        "an",
+        "and",
+        "are",
+        "as",
+        "at",
+        "be",
+        "by",
+        "for",
+        "from",
+        "has",
+        "he",
+        "in",
+        "is",
+        "it",
+        "its",
+        "of",
+        "on",
+        "that",
+        "the",
+        "to",
+        "was",
+        "will",
+        "with",
+        "the",
+        "this",
+        "but",
+        "they",
+        "have",
+        "had",
+        "what",
+        "when",
+        "where",
+        "who",
+        "which",
+        "why",
+        "how",
+    }
+
+    def extract_keywords(text: str) -> set[str]:
+        """Extract keywords from text (remove stopwords and punctuation)."""
+        # Convert to lowercase and split
+        words = re.findall(r"\b\w+\b", text.lower())
+        # Remove stopwords and short words
+        keywords = {w for w in words if w not in STOPWORDS and len(w) > 2}
+        return keywords
+
+    def validate_grounding(ctx: Context) -> ValidationResult:
+        last_output = ctx.last_output()
+        if last_output is None or last_output.value is None:
+            return ValidationResult(result=False, reason="No output found in context")
+
+        output_text = str(last_output.value)
+
+        # Extract keywords from both context and output
+        context_keywords = extract_keywords(context)
+        output_keywords = extract_keywords(output_text)
+
+        if not output_keywords:
+            return ValidationResult(
+                result=False, reason="Output contains no meaningful keywords"
+            )
+
+        if not context_keywords:
+            return ValidationResult(
+                result=False, reason="Context contains no meaningful keywords"
+            )
+
+        # Calculate overlap ratio
+        overlap = context_keywords.intersection(output_keywords)
+        overlap_ratio = len(overlap) / len(output_keywords)
+
+        if overlap_ratio >= threshold:
+            return ValidationResult(
+                result=True,
+                reason=f"Output is grounded in context (overlap: {overlap_ratio:.2%})",
+            )
+        else:
+            if check_only:
+                reason = f"Output not sufficiently grounded (overlap: {overlap_ratio:.2%}, threshold: {threshold:.2%})"
+            else:
+                reason = (
+                    f"Output contains claims not sufficiently supported by the provided context. "
+                    f"Keyword overlap: {overlap_ratio:.2%} (threshold: {threshold:.2%}). "
+                    f"Please ensure all claims are grounded in the given information and avoid adding unsupported facts."
+                )
+            return ValidationResult(result=False, reason=reason)
+
+    return Requirement(
+        description=f"Output must be grounded in the provided context (threshold: {threshold:.2%}).",
+        validation_fn=validate_grounding,
+        check_only=check_only,
+    )
+
+
+# endregion
+
+
+# endregion
diff --git a/mellea/stdlib/requirements/requirement_set.py b/mellea/stdlib/requirements/requirement_set.py
new file mode 100644
index 000000000..f5721ab22
--- /dev/null
+++ b/mellea/stdlib/requirements/requirement_set.py
@@ -0,0 +1,411 @@
+"""RequirementSet: A composable collection of requirements (guardrails).
+
+This module provides utilities for managing, combining, and reusing multiple
+requirements as a cohesive unit, making it easier to maintain consistent
+guardrail policies across an application.
+"""
+
+from __future__ import annotations
+
+from collections.abc import Iterator
+from copy import deepcopy
+
+from ...core import Requirement
+
+
+class RequirementSet:
+    """A composable collection of requirements (guardrails).
+
+    Provides a fluent API for building, combining, and managing
+    multiple requirements as a reusable unit. RequirementSet instances
+    are iterable and can be used anywhere a list of requirements is expected.
+
+    Examples:
+        Basic usage:
+        >>> from mellea.stdlib.requirements import RequirementSet
+        >>> from mellea.stdlib.requirements.guardrails import no_pii, json_valid
+        >>>
+        >>> basic_safety = RequirementSet([no_pii(), no_harmful_content()])
+        >>> result = m.instruct("Generate text", requirements=basic_safety)
+
+        Fluent API:
+        >>> reqs = (RequirementSet()
+        ...     .add(no_pii())
+        ...     .add(json_valid())
+        ...     .add(max_length(500)))
+
+        Composition:
+        >>> safety = RequirementSet([no_pii(), no_harmful_content()])
+        >>> format = RequirementSet([json_valid(), max_length(500)])
+        >>> combined = safety + format
+
+        In-place modification:
+        >>> reqs = RequirementSet([no_pii()])
+        >>> reqs += RequirementSet([json_valid()])
+    """
+
+    def __init__(
+        self, requirements: list[Requirement] | None = None, *, copy: bool = True
+    ):
+        """Initialize RequirementSet with optional list of requirements.
+
+        Args:
+            requirements: Optional list of Requirement instances
+            copy: If True (default), deep copy requirements for immutability.
+                  If False, use references directly (faster but mutable).
+
+        Raises:
+            TypeError: If any item in requirements is not a Requirement instance
+
+        Note:
+            By default, RequirementSet creates deep copies to ensure immutability
+            and prevent unexpected side effects. Set copy=False for performance-critical
+            scenarios where you control the requirement lifecycle.
+        """
+        self._requirements: list[Requirement] = []
+        if requirements:
+            for req in requirements:
+                if not isinstance(req, Requirement):
+                    raise TypeError(
+                        f"All items must be Requirement instances, got {type(req).__name__}"
+                    )
+                self._requirements.append(req)
+            if copy:
+                self._requirements = deepcopy(self._requirements)
+
+    def add(self, requirement: Requirement, *, copy: bool = True) -> RequirementSet:
+        """Add a requirement and return a new RequirementSet (fluent API).
+
+        Args:
+            requirement: Requirement instance to add
+            copy: If True (default), return new instance (immutable).
+                  If False, modify in place and return self (mutable, faster).
+
+        Returns:
+            New RequirementSet with the added requirement (if copy=True),
+            or self modified in place (if copy=False)
+
+        Raises:
+            TypeError: If requirement is not a Requirement instance
+
+        Examples:
+            Immutable (default):
+            >>> reqs = RequirementSet().add(no_pii()).add(json_valid())
+
+            Mutable (faster):
+            >>> reqs = RequirementSet()
+            >>> reqs.add(no_pii(), copy=False).add(json_valid(), copy=False)
+        """
+        if not isinstance(requirement, Requirement):
+            raise TypeError(
+                f"Expected Requirement instance, got {type(requirement).__name__}"
+            )
+        if copy:
+            new_set = self.copy()
+            new_set._requirements.append(requirement)
+            return new_set
+        else:
+            self._requirements.append(requirement)
+            return self
+
+    def remove(self, requirement: Requirement, *, copy: bool = True) -> RequirementSet:
+        """Remove a requirement and return a new RequirementSet (fluent API).
+
+        Args:
+            requirement: Requirement instance to remove
+            copy: If True (default), return new instance (immutable).
+                  If False, modify in place and return self (mutable, faster).
+
+        Returns:
+            New RequirementSet without the specified requirement (if copy=True),
+            or self modified in place (if copy=False).
+            If requirement not found, returns unchanged.
+
+        Examples:
+            Immutable (default):
+            >>> reqs = RequirementSet([no_pii(), json_valid()])
+            >>> reqs_without_pii = reqs.remove(no_pii())
+
+            Mutable (faster):
+            >>> reqs = RequirementSet([no_pii(), json_valid()])
+            >>> reqs.remove(no_pii(), copy=False)
+        """
+        if copy:
+            new_set = self.copy()
+            try:
+                new_set._requirements.remove(requirement)
+            except ValueError:
+                pass  # Requirement not found, return copy unchanged
+            return new_set
+        else:
+            try:
+                self._requirements.remove(requirement)
+            except ValueError:
+                pass  # Requirement not found, return self unchanged
+            return self
+
+    def extend(
+        self, requirements: list[Requirement], *, copy: bool = True
+    ) -> RequirementSet:
+        """Add multiple requirements and return a new RequirementSet (fluent API).
+
+        Args:
+            requirements: List of Requirement instances to add
+            copy: If True (default), return new instance (immutable).
+                  If False, modify in place and return self (mutable, faster).
+
+        Returns:
+            New RequirementSet with all requirements added (if copy=True),
+            or self modified in place (if copy=False)
+
+        Raises:
+            TypeError: If any item is not a Requirement instance
+
+        Examples:
+            Immutable (default):
+            >>> reqs = RequirementSet().extend([no_pii(), json_valid(), max_length(500)])
+
+            Mutable (faster):
+            >>> reqs = RequirementSet()
+            >>> reqs.extend([no_pii(), json_valid()], copy=False)
+        """
+        # Validate all requirements first
+        for req in requirements:
+            if not isinstance(req, Requirement):
+                raise TypeError(
+                    f"All items must be Requirement instances, got {type(req).__name__}"
+                )
+
+        if copy:
+            new_set = self.copy()
+            new_set._requirements.extend(requirements)
+            return new_set
+        else:
+            self._requirements.extend(requirements)
+            return self
+
+    def __add__(self, other: RequirementSet) -> RequirementSet:
+        """Combine two RequirementSets using + operator.
+
+        Creates a new RequirementSet containing requirements from both sets.
+
+        Args:
+            other: Another RequirementSet to combine with
+
+        Returns:
+            New RequirementSet containing requirements from both sets
+
+        Raises:
+            TypeError: If other is not a RequirementSet
+
+        Examples:
+            >>> safety = RequirementSet([no_pii()])
+            >>> format = RequirementSet([json_valid()])
+            >>> combined = safety + format
+        """
+        if not isinstance(other, RequirementSet):
+            raise TypeError(
+                f"Can only add RequirementSet to RequirementSet, got {type(other).__name__}"
+            )
+        new_set = self.copy()
+        new_set._requirements.extend(other._requirements)
+        return new_set
+
+    def __iadd__(self, other: RequirementSet) -> RequirementSet:
+        """In-place addition using += operator.
+
+        Modifies the current RequirementSet by adding requirements from other.
+
+        Args:
+            other: Another RequirementSet to add
+
+        Returns:
+            Self (modified in place)
+
+        Raises:
+            TypeError: If other is not a RequirementSet
+
+        Examples:
+            >>> reqs = RequirementSet([no_pii()])
+            >>> reqs += RequirementSet([json_valid()])
+        """
+        if not isinstance(other, RequirementSet):
+            raise TypeError(
+                f"Can only add RequirementSet to RequirementSet, got {type(other).__name__}"
+            )
+        self._requirements.extend(other._requirements)
+        return self
+
+    def __len__(self) -> int:
+        """Return the number of requirements in the set.
+
+        Returns:
+            Number of requirements
+
+        Examples:
+            >>> reqs = RequirementSet([no_pii(), json_valid()])
+            >>> len(reqs)
+            2
+        """
+        return len(self._requirements)
+
+    def __iter__(self) -> Iterator[Requirement]:
+        """Make RequirementSet iterable.
+
+        This allows RequirementSet to be used anywhere a list of requirements
+        is expected, such as in m.instruct(requirements=...).
+
+        Returns:
+            Iterator over requirements
+
+        Examples:
+            >>> reqs = RequirementSet([no_pii(), json_valid()])
+            >>> for req in reqs:
+            ...     print(req.description)
+        """
+        return iter(self._requirements)
+
+    def __repr__(self) -> str:
+        """Return string representation of RequirementSet.
+
+        Returns:
+            String showing the number of requirements
+
+        Examples:
+            >>> reqs = RequirementSet([no_pii(), json_valid()])
+            >>> repr(reqs)
+            'RequirementSet(2 requirements)'
+        """
+        return f"RequirementSet({len(self._requirements)} requirements)"
+
+    def __str__(self) -> str:
+        """Return detailed string representation.
+
+        Returns:
+            String listing all requirement descriptions
+        """
+        if not self._requirements:
+            return "RequirementSet(empty)"
+
+        descriptions = [
+            req.description or "No description" for req in self._requirements
+        ]
+        return (
+            f"RequirementSet({len(self._requirements)} requirements):\n  - "
+            + "\n  - ".join(descriptions)
+        )
+
+    def copy(self) -> RequirementSet:
+        """Create a deep copy of the RequirementSet.
+
+        Returns:
+            New RequirementSet with copied requirements
+
+        Examples:
+            >>> original = RequirementSet([no_pii()])
+            >>> copy = original.copy()
+            >>> copy.add(json_valid())  # Doesn't affect original
+        """
+        new_set = RequirementSet()
+        new_set._requirements = deepcopy(self._requirements)
+        return new_set
+
+    def deduplicate(
+        self, *, by: str = "description", copy: bool = True
+    ) -> RequirementSet:
+        """Remove duplicate requirements.
+
+        Args:
+            by: Deduplication strategy:
+                - "description": Remove requirements with duplicate descriptions (default)
+                - "identity": Remove requirements with same object identity
+            copy: If True (default), return new instance. If False, modify in place.
+
+        Returns:
+            RequirementSet with duplicates removed (preserves first occurrence)
+
+        Note:
+            Description-based deduplication may incorrectly merge requirements with
+            the same description but different validation functions. This is a
+            pragmatic approach for common use cases where requirements are created
+            using the same factory functions (e.g., `no_pii()`).
+
+        Examples:
+            Remove duplicates from composed profiles:
+            >>> safety = GuardrailProfiles.basic_safety()
+            >>> format = GuardrailProfiles.json_output()
+            >>> combined = (safety + format).deduplicate()
+
+            In-place deduplication:
+            >>> reqs = RequirementSet([no_pii(), no_pii(), json_valid()])
+            >>> reqs.deduplicate(copy=False)
+        """
+        if by == "description":
+            seen_descriptions: set[str | None] = set()
+            unique_reqs: list[Requirement] = []
+            for req in self._requirements:
+                desc = req.description
+                if desc not in seen_descriptions:
+                    seen_descriptions.add(desc)
+                    unique_reqs.append(req)
+
+            if copy:
+                return RequirementSet(unique_reqs, copy=False)
+            else:
+                self._requirements = unique_reqs
+                return self
+
+        elif by == "identity":
+            # Use dict to preserve order while removing identity duplicates
+            unique_dict = {id(req): req for req in self._requirements}
+            unique_reqs = list(unique_dict.values())
+
+            if copy:
+                return RequirementSet(unique_reqs, copy=False)
+            else:
+                self._requirements = unique_reqs
+                return self
+
+        else:
+            raise ValueError(
+                f"Invalid deduplication strategy: {by}. Must be 'description' or 'identity'."
+            )
+
+    def to_list(self) -> list[Requirement]:
+        """Convert to a plain list of requirements.
+
+        Returns:
+            List of Requirement instances
+
+        Examples:
+            >>> reqs = RequirementSet([no_pii(), json_valid()])
+            >>> req_list = reqs.to_list()
+        """
+        return list(self._requirements)
+
+    def clear(self) -> RequirementSet:
+        """Remove all requirements and return a new empty RequirementSet.
+
+        Returns:
+            New empty RequirementSet
+
+        Examples:
+            >>> reqs = RequirementSet([no_pii(), json_valid()])
+            >>> empty = reqs.clear()
+            >>> len(empty)
+            0
+        """
+        return RequirementSet()
+
+    def is_empty(self) -> bool:
+        """Check if the RequirementSet is empty.
+
+        Returns:
+            True if no requirements, False otherwise
+
+        Examples:
+            >>> reqs = RequirementSet()
+            >>> reqs.is_empty()
+            True
+        """
+        return len(self._requirements) == 0
diff --git a/test/stdlib/requirements/test_guardrails.py b/test/stdlib/requirements/test_guardrails.py
new file mode 100644
index 000000000..51de8fe7d
--- /dev/null
+++ b/test/stdlib/requirements/test_guardrails.py
@@ -0,0 +1,788 @@
+"""Tests for pre-built guardrails in mellea.stdlib.requirements.guardrails."""
+
+import pytest
+
+from mellea.core import Context, ModelOutputThunk
+from mellea.stdlib.context import ChatContext
+from mellea.stdlib.requirements.guardrails import (
+    factual_grounding,
+    is_code,
+    matches_schema,
+    no_harmful_content,
+    no_pii,
+)
+
+# Helper functions
+
+
+def _spacy_available() -> bool:
+    """Check if spaCy and the required model are available."""
+    try:
+        import spacy  # type: ignore[import-not-found]
+
+        try:
+            spacy.load("en_core_web_sm")
+            return True
+        except OSError:
+            return False
+    except ImportError:
+        return False
+
+
+def create_context(text: str) -> Context:
+    """Helper to create a context with model output."""
+    ctx = ChatContext()
+    ctx = ctx.add(ModelOutputThunk(value=text))
+    return ctx
+
+
+# Test data
+CLEAN_TEXT = "The weather is nice today. I enjoy programming and solving problems."
+TEXT_WITH_EMAIL = "Contact me at john.doe@example.com for more information."
+TEXT_WITH_PHONE = "Call me at 555-123-4567 or (555) 123-4567."
+TEXT_WITH_SSN = "My SSN is 123-45-6789."
+TEXT_WITH_CREDIT_CARD = "Card number: 1234 5678 9012 3456"
+TEXT_WITH_NAME = "John Smith is a software engineer at Acme Corp."
+TEXT_WITH_LOCATION = "I live in New York City, near Central Park."
+TEXT_WITH_MULTIPLE_PII = """
+John Doe works at IBM in San Francisco.
+You can reach him at john.doe@ibm.com or call 415-555-1234.
+His employee ID is 123-45-6789.
+"""
+
+
+# region Regex-based tests (no dependencies required)
+
+
+def test_no_pii_clean_text_regex():
+    """Test that clean text passes PII check with regex method."""
+    req = no_pii(method="regex")
+    ctx = create_context(CLEAN_TEXT)
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is True
+    assert "No PII detected" in result.reason
+
+
+def test_no_pii_detects_email_regex():
+    """Test that email addresses are detected with regex method."""
+    req = no_pii(method="regex")
+    ctx = create_context(TEXT_WITH_EMAIL)
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is False
+    assert "email" in result.reason.lower()
+
+
+def test_no_pii_detects_phone_regex():
+    """Test that phone numbers are detected with regex method."""
+    req = no_pii(method="regex")
+    ctx = create_context(TEXT_WITH_PHONE)
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is False
+    assert "phone" in result.reason.lower()
+
+
+def test_no_pii_detects_ssn_regex():
+    """Test that SSNs are detected with regex method."""
+    req = no_pii(method="regex")
+    ctx = create_context(TEXT_WITH_SSN)
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is False
+    assert "ssn" in result.reason.lower()
+
+
+def test_no_pii_detects_credit_card_regex():
+    """Test that credit card numbers are detected with regex method."""
+    req = no_pii(method="regex")
+    ctx = create_context(TEXT_WITH_CREDIT_CARD)
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is False
+    assert "credit_card" in result.reason.lower()
+
+
+def test_no_pii_detects_multiple_pii_regex():
+    """Test that multiple PII types are detected with regex method."""
+    req = no_pii(method="regex")
+    ctx = create_context(TEXT_WITH_MULTIPLE_PII)
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is False
+    # Should detect email, phone, and SSN
+    reason_lower = result.reason.lower()
+    assert "email" in reason_lower or "phone" in reason_lower or "ssn" in reason_lower
+
+
+# endregion
+
+# region spaCy-based tests (requires spacy extra)
+
+
+@pytest.mark.skipif(
+    not _spacy_available(), reason="spaCy not installed or model not available"
+)
+def test_no_pii_detects_person_name_spacy():
+    """Test that person names are detected with spaCy method."""
+    req = no_pii(method="spacy")
+    ctx = create_context(TEXT_WITH_NAME)
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is False
+    assert "PERSON" in result.reason or "ORG" in result.reason
+
+
+@pytest.mark.skipif(
+    not _spacy_available(), reason="spaCy not installed or model not available"
+)
+def test_no_pii_detects_location_spacy():
+    """Test that locations are detected with spaCy method."""
+    req = no_pii(method="spacy")
+    ctx = create_context(TEXT_WITH_LOCATION)
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is False
+    assert "GPE" in result.reason or "LOC" in result.reason
+
+
+@pytest.mark.skipif(
+    not _spacy_available(), reason="spaCy not installed or model not available"
+)
+def test_no_pii_spacy_fallback_to_regex():
+    """Test that spaCy method falls back to regex for emails/phones."""
+    req = no_pii(method="spacy")
+    ctx = create_context(TEXT_WITH_EMAIL)
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is False
+    assert "email" in result.reason.lower()
+
+
+# endregion
+
+# region Auto mode tests
+
+
+def test_no_pii_auto_mode_clean_text():
+    """Test auto mode with clean text."""
+    req = no_pii(method="auto")
+    ctx = create_context(CLEAN_TEXT)
+    result = req.validation_fn(ctx)
+
+    # spaCy may detect "Python" as ORG/PRODUCT, which is a false positive for clean text
+    # This is acceptable behavior - the test should verify no actual PII is detected
+    if not result.as_bool():
+        # Allow false positives for programming language names
+        assert (
+            "PERSON" not in result.reason
+            and "GPE" not in result.reason
+            and "LOC" not in result.reason
+        ), f"Detected actual PII in clean text: {result.reason}"
+    else:
+        assert result.as_bool() is True
+
+
+def test_no_pii_auto_mode_detects_email():
+    """Test auto mode detects email (via regex fallback)."""
+    req = no_pii(method="auto")
+    ctx = create_context(TEXT_WITH_EMAIL)
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is False
+
+
+def test_no_pii_auto_mode_detects_multiple():
+    """Test auto mode detects multiple PII types."""
+    req = no_pii(method="auto")
+    ctx = create_context(TEXT_WITH_MULTIPLE_PII)
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is False
+
+
+# endregion
+
+# region Edge cases
+
+
+def test_no_pii_empty_context():
+    """Test behavior with empty context."""
+    req = no_pii()
+    ctx = ChatContext()
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is False
+    assert "No output found" in result.reason
+
+
+def test_no_pii_none_output():
+    """Test behavior with None output value."""
+    req = no_pii()
+    ctx = ChatContext()
+    ctx = ctx.add(ModelOutputThunk(value=None))
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is False
+    assert "No output found" in result.reason
+
+
+def test_no_pii_empty_string():
+    """Test behavior with empty string output."""
+    req = no_pii()
+    ctx = create_context("")
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is True
+    assert "No PII detected" in result.reason
+
+
+# endregion
+
+# region Requirement properties
+
+
+def test_no_pii_is_check_only_by_default():
+    """Test that no_pii is check_only by default."""
+    req = no_pii()
+    assert req.check_only is True
+
+
+def test_no_pii_has_description():
+    """Test that no_pii has a clear description."""
+    req = no_pii()
+    assert req.description is not None
+    assert (
+        "PII" in req.description or "personally identifiable" in req.description.lower()
+    )
+
+
+def test_no_pii_has_validation_fn():
+    """Test that no_pii has a validation function."""
+    req = no_pii()
+    assert req.validation_fn is not None
+    assert callable(req.validation_fn)
+
+
+# endregion
+
+
+# region JSON validation tests
+
+
+def test_json_valid_with_valid_json():
+    """Test json_valid with valid JSON."""
+    from mellea.stdlib.requirements.guardrails import json_valid
+
+    req = json_valid()
+    ctx = create_context('{"name": "John", "age": 30}')
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is True
+    assert "Valid JSON" in result.reason
+
+
+def test_json_valid_with_invalid_json():
+    """Test json_valid with invalid JSON."""
+    from mellea.stdlib.requirements.guardrails import json_valid
+
+    req = json_valid()
+    ctx = create_context('{name: "John", age: 30}')  # Missing quotes on keys
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is False
+    assert "Invalid JSON" in result.reason
+
+
+def test_json_valid_with_array():
+    """Test json_valid with JSON array."""
+    from mellea.stdlib.requirements.guardrails import json_valid
+
+    req = json_valid()
+    ctx = create_context('[1, 2, 3, "test"]')
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is True
+
+
+# endregion
+
+# region Length constraint tests
+
+
+def test_max_length_characters():
+    """Test max_length with character limit."""
+    from mellea.stdlib.requirements.guardrails import max_length
+
+    req = max_length(50)
+    ctx = create_context("Short text")
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is True
+    assert "within limit" in result.reason
+
+
+def test_max_length_exceeds():
+    """Test max_length when limit is exceeded."""
+    from mellea.stdlib.requirements.guardrails import max_length
+
+    req = max_length(10)
+    ctx = create_context("This is a very long text that exceeds the limit")
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is False
+    assert "exceeds maximum" in result.reason
+
+
+def test_max_length_words():
+    """Test max_length with word limit."""
+    from mellea.stdlib.requirements.guardrails import max_length
+
+    req = max_length(5, unit="words")
+    ctx = create_context("One two three four")
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is True
+
+
+def test_min_length_characters():
+    """Test min_length with character minimum."""
+    from mellea.stdlib.requirements.guardrails import min_length
+
+    req = min_length(10)
+    ctx = create_context("This is a longer text")
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is True
+    assert "meets minimum" in result.reason
+
+
+def test_min_length_below_minimum():
+    """Test min_length when below minimum."""
+    from mellea.stdlib.requirements.guardrails import min_length
+
+    req = min_length(100)
+    ctx = create_context("Short")
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is False
+    assert "below minimum" in result.reason
+
+
+def test_min_length_words():
+    """Test min_length with word minimum."""
+    from mellea.stdlib.requirements.guardrails import min_length
+
+    req = min_length(3, unit="words")
+    ctx = create_context("One two three four")
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is True
+
+
+# endregion
+
+# region Keyword matching tests
+
+
+def test_contains_keywords_any_found():
+    """Test contains_keywords when at least one keyword is found."""
+    from mellea.stdlib.requirements.guardrails import contains_keywords
+
+    req = contains_keywords(["Python", "Java", "JavaScript"])
+    ctx = create_context("I love programming in Python")
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is True
+    assert "Python" in result.reason
+
+
+def test_contains_keywords_none_found():
+    """Test contains_keywords when no keywords are found."""
+    from mellea.stdlib.requirements.guardrails import contains_keywords
+
+    req = contains_keywords(["Python", "Java"])
+    ctx = create_context("I love programming in Ruby")
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is False
+    assert "None of the required keywords" in result.reason
+
+
+def test_contains_keywords_require_all():
+    """Test contains_keywords with require_all=True."""
+    from mellea.stdlib.requirements.guardrails import contains_keywords
+
+    req = contains_keywords(["API", "REST", "JSON"], require_all=True)
+    ctx = create_context("This API uses REST and returns JSON")
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is True
+    assert "All required keywords found" in result.reason
+
+
+def test_contains_keywords_require_all_missing():
+    """Test contains_keywords with require_all=True when some are missing."""
+    from mellea.stdlib.requirements.guardrails import contains_keywords
+
+    req = contains_keywords(["API", "REST", "JSON"], require_all=True)
+    ctx = create_context("This API uses REST")
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is False
+    assert "Missing required keywords" in result.reason
+    assert "JSON" in result.reason
+
+
+def test_contains_keywords_case_insensitive():
+    """Test contains_keywords with case insensitive matching."""
+    from mellea.stdlib.requirements.guardrails import contains_keywords
+
+    req = contains_keywords(["Python"], case_sensitive=False)
+    ctx = create_context("I love python programming")
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is True
+
+
+def test_contains_keywords_case_sensitive():
+    """Test contains_keywords with case sensitive matching."""
+    from mellea.stdlib.requirements.guardrails import contains_keywords
+
+    req = contains_keywords(["Python"], case_sensitive=True)
+    ctx = create_context("I love python programming")
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is False
+
+
+def test_excludes_keywords_none_found():
+    """Test excludes_keywords when no forbidden keywords are found."""
+    from mellea.stdlib.requirements.guardrails import excludes_keywords
+
+    req = excludes_keywords(["TODO", "FIXME", "XXX"])
+    ctx = create_context("This is clean production code")
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is True
+    assert "No forbidden keywords" in result.reason
+
+
+def test_excludes_keywords_found():
+    """Test excludes_keywords when forbidden keywords are found."""
+    from mellea.stdlib.requirements.guardrails import excludes_keywords
+
+    req = excludes_keywords(["TODO", "FIXME"])
+    ctx = create_context("This code needs work. TODO: fix this later")
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is False
+    assert "Found forbidden keywords" in result.reason
+    assert "TODO" in result.reason
+
+
+def test_excludes_keywords_case_insensitive():
+    """Test excludes_keywords with case insensitive matching."""
+    from mellea.stdlib.requirements.guardrails import excludes_keywords
+
+    req = excludes_keywords(["confidential"], case_sensitive=False)
+    ctx = create_context("This is CONFIDENTIAL information")
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is False
+
+
+# endregion
+
+
+if __name__ == "__main__":
+    pytest.main([__file__, "-v"])
+
+
+# endregion
+
+# region no_harmful_content tests
+
+
+def test_no_harmful_content_clean():
+    """Test that clean content passes harmful content check."""
+    req = no_harmful_content()
+    ctx = create_context("This is a helpful and informative response about technology.")
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is True
+    assert "No harmful content detected" in result.reason
+
+
+def test_no_harmful_content_detects_violence():
+    """Test that violent content is detected."""
+    req = no_harmful_content(risk_types=["violence"])
+    ctx = create_context("The attacker used a weapon to kill the victim.")
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is False
+    assert "violence" in result.reason.lower()
+
+
+def test_no_harmful_content_detects_profanity():
+    """Test that profanity is detected."""
+    req = no_harmful_content(risk_types=["profanity"])
+    ctx = create_context("This is fucking terrible shit.")
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is False
+    assert "profanity" in result.reason.lower()
+
+
+def test_no_harmful_content_multiple_risks():
+    """Test checking multiple risk types."""
+    req = no_harmful_content(risk_types=["violence", "profanity"])
+    ctx = create_context("The violent attack was fucking brutal.")
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is False
+    # Should detect at least one risk type
+    assert "violence" in result.reason.lower() or "profanity" in result.reason.lower()
+
+
+def test_no_harmful_content_default_harm():
+    """Test default harm detection."""
+    req = no_harmful_content()
+    ctx = create_context("This could harm people if misused.")
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is False
+    assert "harm" in result.reason.lower()
+
+
+# endregion
+
+# region matches_schema tests
+
+
+def test_matches_schema_valid():
+    """Test that valid JSON matching schema passes."""
+    schema = {
+        "type": "object",
+        "properties": {"name": {"type": "string"}, "age": {"type": "number"}},
+        "required": ["name", "age"],
+    }
+    req = matches_schema(schema)
+    ctx = create_context('{"name": "Alice", "age": 30}')
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is True
+    assert "matches schema" in result.reason.lower()
+
+
+def test_matches_schema_missing_required():
+    """Test that missing required fields fail validation."""
+    schema = {
+        "type": "object",
+        "properties": {"name": {"type": "string"}, "age": {"type": "number"}},
+        "required": ["name", "age"],
+    }
+    req = matches_schema(schema)
+    ctx = create_context('{"name": "Alice"}')
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is False
+    assert "validation failed" in result.reason.lower()
+
+
+def test_matches_schema_wrong_type():
+    """Test that wrong types fail validation."""
+    schema = {"type": "object", "properties": {"age": {"type": "number"}}}
+    req = matches_schema(schema)
+    ctx = create_context('{"age": "thirty"}')
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is False
+    assert "validation failed" in result.reason.lower()
+
+
+def test_matches_schema_array():
+    """Test array schema validation."""
+    schema = {"type": "array", "items": {"type": "string"}, "minItems": 2}
+    req = matches_schema(schema)
+    ctx = create_context('["apple", "banana", "cherry"]')
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is True
+
+
+def test_matches_schema_invalid_json():
+    """Test that invalid JSON fails before schema validation."""
+    schema = {"type": "object"}
+    req = matches_schema(schema)
+    ctx = create_context('{"invalid": json}')
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is False
+    assert "Invalid JSON" in result.reason
+
+
+# endregion
+
+# region is_code tests
+
+
+def test_is_code_valid_python():
+    """Test that valid Python code passes."""
+    req = is_code("python")
+    ctx = create_context("""
+def factorial(n):
+    if n <= 1:
+        return 1
+    return n * factorial(n - 1)
+""")
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is True
+    assert "Valid Python syntax" in result.reason
+
+
+def test_is_code_invalid_python():
+    """Test that invalid Python syntax fails."""
+    req = is_code("python")
+    ctx = create_context("""
+def broken_function(
+    print("missing closing paren"
+""")
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is False
+    assert "Invalid Python syntax" in result.reason
+
+
+def test_is_code_javascript():
+    """Test JavaScript code detection."""
+    req = is_code("javascript")
+    ctx = create_context("""
+function greet(name) {
+    const message = `Hello, ${name}!`;
+    return message;
+}
+""")
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is True
+    assert "javascript" in result.reason.lower()
+
+
+def test_is_code_java():
+    """Test Java code detection."""
+    req = is_code("java")
+    ctx = create_context("""
+public class HelloWorld {
+    public static void main(String[] args) {
+        System.out.println("Hello, World!");
+    }
+}
+""")
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is True
+    assert "java" in result.reason.lower()
+
+
+def test_is_code_generic():
+    """Test generic code detection."""
+    req = is_code()
+    ctx = create_context("""
+function calculate(x, y) {
+    if (x > y) {
+        return x + y;
+    }
+    return x * y;
+}
+""")
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is True
+    assert "Code detected" in result.reason
+
+
+def test_is_code_not_code():
+    """Test that natural language fails code detection."""
+    req = is_code()
+    ctx = create_context("This is just a regular sentence with no code.")
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is False
+    assert "Does not appear to be code" in result.reason
+
+
+def test_is_code_unbalanced_braces():
+    """Test that unbalanced braces fail validation."""
+    req = is_code("python")
+    ctx = create_context("def func(): { print('unbalanced'")
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is False
+
+
+# endregion
+
+# region factual_grounding tests
+
+
+def test_factual_grounding_high_overlap():
+    """Test that high overlap passes grounding check."""
+    context = "Python is a high-level programming language created by Guido van Rossum in 1991."
+    req = factual_grounding(context)
+    ctx = create_context(
+        "Python is a programming language created by Guido van Rossum."
+    )
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is True
+    assert "grounded" in result.reason.lower()
+
+
+def test_factual_grounding_low_overlap():
+    """Test that low overlap fails grounding check."""
+    context = "Python is a programming language."
+    req = factual_grounding(context, threshold=0.5)
+    ctx = create_context(
+        "JavaScript is used for web development with React and Node.js."
+    )
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is False
+    assert "not sufficiently grounded" in result.reason.lower()
+
+
+def test_factual_grounding_threshold():
+    """Test custom threshold for grounding."""
+    context = "The company was founded in 2020 and has 50 employees."
+    req = factual_grounding(context, threshold=0.3)
+    ctx = create_context("The company has employees.")
+    result = req.validation_fn(ctx)
+
+    # Should pass with low threshold
+    assert result.as_bool() is True
+
+
+def test_factual_grounding_empty_output():
+    """Test that empty output fails grounding check."""
+    context = "Some context text"
+    req = factual_grounding(context)
+    ctx = create_context("")
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is False
+
+
+def test_factual_grounding_identical():
+    """Test that identical text has perfect grounding."""
+    context = "Python is a programming language"
+    req = factual_grounding(context, threshold=0.9)
+    ctx = create_context("Python is a programming language")
+    result = req.validation_fn(ctx)
+
+    assert result.as_bool() is True
+
+
+# endregion
diff --git a/test/stdlib/requirements/test_requirement_set.py b/test/stdlib/requirements/test_requirement_set.py
new file mode 100644
index 000000000..59e62621a
--- /dev/null
+++ b/test/stdlib/requirements/test_requirement_set.py
@@ -0,0 +1,494 @@
+"""Tests for RequirementSet and GuardrailProfiles."""
+
+import pytest
+
+from mellea.core import Requirement, ValidationResult
+from mellea.stdlib.requirements import GuardrailProfiles, RequirementSet
+from mellea.stdlib.requirements.guardrails import (
+    json_valid,
+    max_length,
+    no_harmful_content,
+    no_pii,
+)
+
+# region RequirementSet Tests
+
+
+def test_requirement_set_creation_empty():
+    """Test creating an empty RequirementSet."""
+    reqs = RequirementSet()
+    assert len(reqs) == 0
+    assert reqs.is_empty()
+
+
+def test_requirement_set_creation_with_list():
+    """Test creating RequirementSet with initial requirements."""
+    reqs = RequirementSet([no_pii(), json_valid()])
+    assert len(reqs) == 2
+    assert not reqs.is_empty()
+
+
+def test_requirement_set_creation_type_error():
+    """Test that non-Requirement items raise TypeError."""
+    with pytest.raises(TypeError, match="must be Requirement instances"):
+        RequirementSet(["not a requirement"])  # type: ignore
+
+
+def test_requirement_set_add():
+    """Test adding requirements with fluent API."""
+    reqs = RequirementSet().add(no_pii()).add(json_valid())
+    assert len(reqs) == 2
+
+
+def test_requirement_set_add_type_error():
+    """Test that adding non-Requirement raises TypeError."""
+    reqs = RequirementSet()
+    with pytest.raises(TypeError, match="Expected Requirement instance"):
+        reqs.add("not a requirement")  # type: ignore
+
+
+def test_requirement_set_add_immutable():
+    """Test that add() returns new instance (immutable)."""
+    original = RequirementSet([no_pii()])
+    modified = original.add(json_valid())
+
+    assert len(original) == 1
+    assert len(modified) == 2
+
+
+def test_requirement_set_remove():
+    """Test removing requirements by identity with copy=False."""
+    req1 = no_pii()
+    req2 = json_valid()
+    # Use copy=False to preserve object identity
+    reqs = RequirementSet([req1, req2], copy=False)
+
+    # With copy=False, we can remove by reference
+    modified = reqs.remove(req1, copy=False)
+    assert len(modified) == 1
+    assert modified is reqs  # Same object (in-place)
+
+
+def test_requirement_set_remove_immutable():
+    """Test that remove() returns new instance (immutable) by default."""
+    req1 = no_pii()
+    req2 = json_valid()
+    original = RequirementSet([req1, req2], copy=False)
+
+    # With default copy=True, remove() creates a new instance
+    # But deepcopy breaks object identity, so we need to remove by index or use copy=False
+    modified = original.remove(req1, copy=False)
+    new_copy = RequirementSet(modified.to_list())  # Create immutable copy
+
+    assert len(original) == 1  # Modified in place
+    assert len(modified) == 1  # Same as original
+    assert len(new_copy) == 1  # Immutable copy
+    assert modified is original  # Same object (copy=False)
+    assert new_copy is not original  # Different object
+
+
+def test_requirement_set_remove_not_found():
+    """Test that removing non-existent requirement doesn't error."""
+    reqs = RequirementSet([no_pii()])
+    modified = reqs.remove(json_valid())
+    assert len(modified) == 1  # Unchanged
+
+
+def test_requirement_set_add_mutable():
+    """Test that add() with copy=False modifies in place."""
+    original = RequirementSet([no_pii()], copy=False)
+    original_id = id(original)
+    modified = original.add(json_valid(), copy=False)
+
+    assert len(original) == 2
+    assert len(modified) == 2
+    assert id(modified) == original_id  # Same object
+
+
+def test_requirement_set_extend_mutable():
+    """Test that extend() with copy=False modifies in place."""
+    original = RequirementSet([no_pii()], copy=False)
+    original_id = id(original)
+    modified = original.extend([json_valid(), max_length(500)], copy=False)
+
+    assert len(original) == 3
+    assert len(modified) == 3
+    assert id(modified) == original_id  # Same object
+
+
+def test_requirement_set_deduplicate_by_description():
+    """Test deduplication removes requirements with same description."""
+    req1 = no_pii()
+    req2 = no_pii()  # Same description, different instance
+    reqs = RequirementSet([req1, req2, json_valid()], copy=False)
+
+    deduped = reqs.deduplicate()
+    assert len(deduped) == 2  # no_pii + json_valid
+    assert len(reqs) == 3  # Original unchanged
+
+
+def test_requirement_set_deduplicate_preserves_order():
+    """Test that deduplication preserves first occurrence."""
+    reqs = RequirementSet([no_pii(), json_valid(), no_pii()], copy=False)
+    deduped = reqs.deduplicate()
+
+    assert len(deduped) == 2
+    # First requirement should be no_pii
+    first_desc = next(iter(deduped)).description
+    assert first_desc == no_pii().description
+
+
+def test_requirement_set_deduplicate_by_identity():
+    """Test deduplication by identity."""
+    req1 = no_pii()
+    req2 = req1  # Same instance
+    req3 = json_valid()
+    reqs = RequirementSet([req1, req2, req3], copy=False)
+
+    deduped = reqs.deduplicate(by="identity")
+    assert len(deduped) == 2  # req1 and req3 (req2 is same as req1)
+
+
+def test_requirement_set_deduplicate_inplace():
+    """Test in-place deduplication."""
+    reqs = RequirementSet([no_pii(), no_pii(), json_valid()], copy=False)
+    original_id = id(reqs)
+
+    deduped = reqs.deduplicate(copy=False)
+    assert len(deduped) == 2
+    assert id(deduped) == original_id  # Same object
+
+
+def test_requirement_set_deduplicate_invalid_strategy():
+    """Test that invalid deduplication strategy raises ValueError."""
+    reqs = RequirementSet([no_pii()], copy=False)
+    with pytest.raises(ValueError, match="Invalid deduplication strategy"):
+        reqs.deduplicate(by="invalid")  # type: ignore
+
+
+def test_profile_composition_with_dedupe():
+    """Test real-world profile composition with deduplication."""
+    from mellea.stdlib.requirements import GuardrailProfiles
+
+    safety = GuardrailProfiles.basic_safety()
+    format = GuardrailProfiles.json_output()
+
+    # Combine profiles (may have duplicates)
+    combined = safety + format
+    original_len = len(combined)
+
+    # Deduplicate
+    deduped = combined.deduplicate()
+
+    # Should have fewer or equal requirements
+    assert len(deduped) <= original_len
+
+    # Verify no duplicate descriptions
+    descriptions = [r.description for r in deduped]
+    assert len(descriptions) == len(set(descriptions))
+
+    """Test that extend() with copy=False modifies in place."""
+    original = RequirementSet([no_pii()], copy=False)
+    original_id = id(original)
+    modified = original.extend([json_valid(), max_length(500)], copy=False)
+
+    assert len(original) == 3
+    assert len(modified) == 3
+    assert id(modified) == original_id  # Same object
+
+
+def test_requirement_set_extend():
+    """Test extending with multiple requirements."""
+    reqs = RequirementSet().extend([no_pii(), json_valid(), max_length(500)])
+    assert len(reqs) == 3
+
+
+def test_requirement_set_extend_type_error():
+    """Test that extending with non-Requirements raises TypeError."""
+    reqs = RequirementSet()
+    with pytest.raises(TypeError, match="must be Requirement instances"):
+        reqs.extend([no_pii(), "not a requirement"])  # type: ignore
+
+
+def test_requirement_set_addition():
+    """Test combining RequirementSets with + operator."""
+    set1 = RequirementSet([no_pii()])
+    set2 = RequirementSet([json_valid()])
+    combined = set1 + set2
+
+    assert len(combined) == 2
+    assert len(set1) == 1  # Original unchanged
+    assert len(set2) == 1  # Original unchanged
+
+
+def test_requirement_set_addition_type_error():
+    """Test that adding non-RequirementSet raises TypeError."""
+    reqs = RequirementSet([no_pii()])
+    with pytest.raises(TypeError, match="Can only add RequirementSet"):
+        reqs + [json_valid()]  # type: ignore  # noqa: RUF005
+
+
+def test_requirement_set_iadd():
+    """Test in-place addition with += operator."""
+    reqs = RequirementSet([no_pii()])
+    original_id = id(reqs)
+    reqs += RequirementSet([json_valid()])
+
+    assert len(reqs) == 2
+    assert id(reqs) == original_id  # Same object (in-place)
+
+
+def test_requirement_set_iadd_type_error():
+    """Test that += with non-RequirementSet raises TypeError."""
+    reqs = RequirementSet([no_pii()])
+    with pytest.raises(TypeError, match="Can only add RequirementSet"):
+        reqs += [json_valid()]  # type: ignore
+
+
+def test_requirement_set_len():
+    """Test len() function."""
+    reqs = RequirementSet([no_pii(), json_valid(), max_length(500)])
+    assert len(reqs) == 3
+
+
+def test_requirement_set_iter():
+    """Test iteration over RequirementSet."""
+    req1 = no_pii()
+    req2 = json_valid()
+    reqs = RequirementSet([req1, req2])
+
+    items = list(reqs)
+    assert len(items) == 2
+    assert all(isinstance(item, Requirement) for item in items)
+
+
+def test_requirement_set_repr():
+    """Test string representation."""
+    reqs = RequirementSet([no_pii(), json_valid()])
+    repr_str = repr(reqs)
+    assert "RequirementSet" in repr_str
+    assert "2 requirements" in repr_str
+
+
+def test_requirement_set_str():
+    """Test detailed string representation."""
+    reqs = RequirementSet([no_pii(), json_valid()])
+    str_repr = str(reqs)
+    assert "RequirementSet" in str_repr
+    assert "2 requirements" in str_repr
+
+
+def test_requirement_set_str_empty():
+    """Test string representation of empty set."""
+    reqs = RequirementSet()
+    assert "empty" in str(reqs)
+
+
+def test_requirement_set_copy():
+    """Test deep copy."""
+    original = RequirementSet([no_pii(), json_valid()])
+    copy = original.copy()
+
+    assert len(copy) == len(original)
+    assert id(copy) != id(original)
+    assert id(copy._requirements) != id(original._requirements)
+
+
+def test_requirement_set_to_list():
+    """Test conversion to list."""
+    reqs = RequirementSet([no_pii(), json_valid()])
+    req_list = reqs.to_list()
+
+    assert isinstance(req_list, list)
+    assert len(req_list) == 2
+    assert all(isinstance(item, Requirement) for item in req_list)
+
+
+def test_requirement_set_clear():
+    """Test clearing all requirements."""
+    reqs = RequirementSet([no_pii(), json_valid()])
+    empty = reqs.clear()
+
+    assert len(empty) == 0
+    assert empty.is_empty()
+    assert len(reqs) == 2  # Original unchanged
+
+
+def test_requirement_set_is_empty():
+    """Test is_empty() method."""
+    empty = RequirementSet()
+    not_empty = RequirementSet([no_pii()])
+
+    assert empty.is_empty()
+    assert not not_empty.is_empty()
+
+
+def test_requirement_set_chaining():
+    """Test method chaining (fluent API)."""
+    reqs = RequirementSet().add(no_pii()).add(json_valid()).add(max_length(500))
+
+    assert len(reqs) == 3
+
+
+def test_requirement_set_complex_composition():
+    """Test complex composition scenario."""
+    base = RequirementSet([no_pii()])
+    safety = base.add(no_harmful_content())
+    format = RequirementSet([json_valid(), max_length(1000)])
+
+    combined = safety + format
+    assert len(combined) == 4
+
+
+# endregion
+
+# region GuardrailProfiles Tests
+
+
+def test_guardrail_profiles_basic_safety():
+    """Test basic_safety profile."""
+    profile = GuardrailProfiles.basic_safety()
+    assert isinstance(profile, RequirementSet)
+    assert len(profile) == 2
+
+
+def test_guardrail_profiles_json_output():
+    """Test json_output profile."""
+    profile = GuardrailProfiles.json_output(max_size=500)
+    assert isinstance(profile, RequirementSet)
+    assert len(profile) == 3
+
+
+def test_guardrail_profiles_code_generation():
+    """Test code_generation profile."""
+    profile = GuardrailProfiles.code_generation("python")
+    assert isinstance(profile, RequirementSet)
+    assert len(profile) == 3
+
+
+def test_guardrail_profiles_professional_content():
+    """Test professional_content profile."""
+    profile = GuardrailProfiles.professional_content()
+    assert isinstance(profile, RequirementSet)
+    assert len(profile) == 3
+
+
+def test_guardrail_profiles_api_documentation():
+    """Test api_documentation profile."""
+    profile = GuardrailProfiles.api_documentation()
+    assert isinstance(profile, RequirementSet)
+    assert len(profile) == 5
+
+
+def test_guardrail_profiles_grounded_summary():
+    """Test grounded_summary profile."""
+    context = "Python is a programming language."
+    profile = GuardrailProfiles.grounded_summary(context, threshold=0.5)
+    assert isinstance(profile, RequirementSet)
+    assert len(profile) == 3
+
+
+def test_guardrail_profiles_safe_chat():
+    """Test safe_chat profile."""
+    profile = GuardrailProfiles.safe_chat()
+    assert isinstance(profile, RequirementSet)
+    assert len(profile) == 3
+
+
+def test_guardrail_profiles_structured_data_no_schema():
+    """Test structured_data profile without schema."""
+    profile = GuardrailProfiles.structured_data()
+    assert isinstance(profile, RequirementSet)
+    assert len(profile) == 3
+
+
+def test_guardrail_profiles_structured_data_with_schema():
+    """Test structured_data profile with schema."""
+    schema = {"type": "object", "properties": {"name": {"type": "string"}}}
+    profile = GuardrailProfiles.structured_data(schema=schema)
+    assert isinstance(profile, RequirementSet)
+    assert len(profile) == 4  # Includes matches_schema
+
+
+def test_guardrail_profiles_content_moderation():
+    """Test content_moderation profile."""
+    profile = GuardrailProfiles.content_moderation()
+    assert isinstance(profile, RequirementSet)
+    assert len(profile) == 3
+
+
+def test_guardrail_profiles_minimal():
+    """Test minimal profile."""
+    profile = GuardrailProfiles.minimal()
+    assert isinstance(profile, RequirementSet)
+    assert len(profile) == 1
+
+
+def test_guardrail_profiles_strict():
+    """Test strict profile."""
+    profile = GuardrailProfiles.strict()
+    assert isinstance(profile, RequirementSet)
+    assert len(profile) == 4
+
+
+def test_guardrail_profiles_customization():
+    """Test that profiles can be customized."""
+    profile = GuardrailProfiles.basic_safety()
+    customized = profile.add(json_valid())
+
+    assert len(profile) == 2  # Original unchanged
+    assert len(customized) == 3
+
+
+def test_guardrail_profiles_composition():
+    """Test composing multiple profiles."""
+    safety = GuardrailProfiles.basic_safety()
+    format = GuardrailProfiles.json_output(max_size=500)
+
+    combined = safety + format
+    assert isinstance(combined, RequirementSet)
+    # Note: May have duplicates (e.g., no_pii appears in both)
+    assert len(combined) >= 3
+
+
+# endregion
+
+# region Integration Tests
+
+
+def test_requirement_set_with_session_compatibility():
+    """Test that RequirementSet is compatible with session.instruct()."""
+    # This test verifies the interface, not actual execution
+    reqs = RequirementSet([no_pii(), json_valid()])
+
+    # Should be iterable
+    req_list = list(reqs)
+    assert len(req_list) == 2
+    assert all(isinstance(r, Requirement) for r in req_list)
+
+
+def test_profile_with_session_compatibility():
+    """Test that GuardrailProfiles work with session.instruct()."""
+    profile = GuardrailProfiles.basic_safety()
+
+    # Should be iterable
+    req_list = list(profile)
+    assert len(req_list) == 2
+    assert all(isinstance(r, Requirement) for r in req_list)
+
+
+def test_real_world_scenario():
+    """Test a realistic usage scenario."""
+
+    # Define application-wide profiles
+    class AppGuardrails:
+        BASE = RequirementSet([no_pii(), no_harmful_content()])
+        JSON_API = BASE + RequirementSet([json_valid(), max_length(1000)])
+
+    # Use in application
+    api_reqs = AppGuardrails.JSON_API
+    assert len(api_reqs) == 4
+    assert isinstance(api_reqs, RequirementSet)
+
+
+# endregion